docs/articles_en/openvino-workflow/running-inference/inference-devices-and-modes/hetero-execution.rst (+17 −51)
@@ -18,36 +18,29 @@ Execution via the heterogeneous mode can be divided into two independent steps:
1. Setting hardware affinity to operations (`ov::Core::query_model <https://docs.openvino.ai/2024/api/c_cpp_api/classov_1_1_core.html#doxid-classov-1-1-core-1acdf8e64824fe4cf147c3b52ab32c1aab>`__ is used internally by the Hetero device).
2. Compiling a model for the Heterogeneous device means splitting the model into parts, compiling them on the specified devices (via `ov::device::priorities <https://docs.openvino.ai/2024/api/c_cpp_api/structov_1_1device_1_1_priorities.html>`__), and executing them in the Heterogeneous mode. The model is split into subgraphs according to the affinities: each maximal set of connected operations with the same affinity becomes a dedicated subgraph. Each subgraph is compiled on its assigned device, producing multiple `ov::CompiledModel <https://docs.openvino.ai/2024/api/c_cpp_api/classov_1_1_compiled_model.html#doxid-classov-1-1-compiled-model>`__ objects, which are connected via automatically allocated intermediate tensors.
If you request pipeline parallelism (via ``ov::hint::model_distribution_policy``), the model is split into multiple stages, and each stage is assigned to a different device. The output of one stage is fed as input to the next stage.
These two steps are independent; affinities can be set in one of two ways, used separately or in combination (as described below): the ``manual`` or the ``automatic`` mode.
Defining and Configuring the Hetero Device
++++++++++++++++++++++++++++++++++++++++++
Following the OpenVINO™ naming convention, the Hetero execution plugin is assigned the label of ``"HETERO"``. It may be defined with no additional parameters, resulting in defaults being used, or configured further with the following setup options:
The manual mode assumes setting affinities explicitly for all operations in the model using `ov::Node::get_rt_info <https://docs.openvino.ai/2024/api/c_cpp_api/classov_1_1_node.html#doxid-classov-1-1-node-1a6941c753af92828d842297b74df1c45a>`__ with the ``"affinity"`` key.
@@ -73,10 +66,7 @@ Randomly selecting operations and setting affinities may lead to decrease in mod
The Automatic Mode
++++++++++++++++++
Without pipeline parallelism
----------------------------
The automatic mode decides which operation is assigned to which device according to the support reported by the dedicated devices (``GPU``, ``CPU``, etc.); the query model step is called implicitly by the Hetero device during model compilation.
@@ -100,33 +90,9 @@ It does not take into account device peculiarities such as the inability to infe
:language: cpp
:fragment: [compile_model]
Pipeline parallelism
--------------------
Pipeline parallelism is set via ``ov::hint::model_distribution_policy``. This mode is an efficient technique for inferring large models on multiple devices. The model is split into multiple stages, and each stage is assigned to a different device (``dGPU``, ``iGPU``, ``CPU``, etc.). This mode assigns operations to devices as reasonably as possible, ensuring that the stages can be executed in sequence and that the amount of data transferred between devices is minimized.
For large models which do not fit in the memory of a single first-priority device, model pipeline parallelism places parts of the model on different devices, so that each device has enough memory to infer its operations.
In some cases you may need to manually adjust affinities that were set automatically. This usually serves to minimize the total number of subgraphs and thus optimize memory transfers. To do so, you need to "fix" the automatically assigned affinities like so:
@@ -155,7 +121,7 @@ Importantly, the automatic mode will not work if any operation in a model has it
`ov::Core::query_model <https://docs.openvino.ai/2024/api/c_cpp_api/classov_1_1_core.html#doxid-classov-1-1-core-1acdf8e64824fe4cf147c3b52ab32c1aab>`__ does not depend on affinities set by a user. Instead, it queries for an operation support based on device capabilities.
Configure fallback devices
++++++++++++++++++++++++++
If you want different devices in Hetero execution to have different device-specific configuration options, you can use the special helper property `ov::device::properties <https://docs.openvino.ai/2024/api/c_cpp_api/structov_1_1device_1_1_properties.html#doxid-group-ov-runtime-cpp-prop-api-1ga794d09f2bd8aad506508b2c53ef6a6fc>`__:
@@ -180,15 +146,15 @@ If you want different devices in Hetero execution to have different device-speci
In the example above, the ``GPU`` device is configured to enable profiling data and uses the default execution precision, while ``CPU`` has the configuration property to perform inference in ``fp32``.
Handling of Difficult Topologies
++++++++++++++++++++++++++++++++
Some topologies are not friendly to heterogeneous execution on some devices, even to the point of being unable to execute.
For example, models having activation operations that are not supported on the primary device are split by Hetero into multiple sets of subgraphs, which leads to suboptimal execution.
If transmitting data from one subgraph to another part of the model takes more time than it does under normal execution, heterogeneous execution may not be worthwhile.
In such cases, you can define the heaviest part manually and set the affinity to avoid sending data back and forth many times during one inference.
Analyzing Performance of Heterogeneous Execution
++++++++++++++++++++++++++++++++++++++++++++++++
After enabling the ``OPENVINO_HETERO_VISUALIZE`` environment variable, you can dump GraphViz ``.dot`` files with annotations of operations per device.
@@ -220,7 +186,7 @@ Here is an example of the output for Googlenet v1 running on HDDL (device no lon
Sample Usage
++++++++++++++++++++
OpenVINO™ sample programs can use Heterogeneous execution via the ``-d`` option: