diff --git a/.circleci/port-linux.txt b/.circleci/port-linux.txt index 598bee82..43fa892d 100644 --- a/.circleci/port-linux.txt +++ b/.circleci/port-linux.txt @@ -3,4 +3,5 @@ grpc[codegen] flatbuffers abseil liblzma -onnxruntime +onnx[disable-static-registration] +onnxruntime[training] diff --git a/ports/onnxruntime/fix-clang-cl-simd-compile.patch b/ports/onnxruntime/fix-clang-cl-simd-compile.patch index 18c598c5..4afe7967 100644 --- a/ports/onnxruntime/fix-clang-cl-simd-compile.patch +++ b/ports/onnxruntime/fix-clang-cl-simd-compile.patch @@ -1,8 +1,8 @@ diff --git a/cmake/onnxruntime_mlas.cmake b/cmake/onnxruntime_mlas.cmake -index bee83ff07c..04b4cf42b7 100644 +index 682dcfc..405c65b 100644 --- a/cmake/onnxruntime_mlas.cmake +++ b/cmake/onnxruntime_mlas.cmake -@@ -159,15 +159,27 @@ function(setup_mlas_source_for_windows) +@@ -158,15 +158,31 @@ function(setup_mlas_source_for_windows) ) set_source_files_properties(${mlas_platform_srcs_avx2} PROPERTIES COMPILE_FLAGS "/arch:AVX2") @@ -16,6 +16,9 @@ index bee83ff07c..04b4cf42b7 100644 + if (CMAKE_CXX_COMPILER_ID MATCHES "Clang") + set_source_files_properties(${mlas_platform_srcs_avx512} PROPERTIES COMPILE_FLAGS "/arch:AVX512") + set_source_files_properties(${mlas_platform_srcs_amx} PROPERTIES COMPILE_FLAGS "/arch:AVX512 -mamx-tile -mamx-int8") ++ # https://clang.llvm.org/docs/UsersManual.html#cpu-architectures-features-and-limitations ++ set_source_files_properties(${MLAS_SRC_DIR}/qgemm_kernel_sse.cpp PROPERTIES COMPILE_FLAGS "-march=x86-64") ++ set_source_files_properties(${MLAS_SRC_DIR}/qgemm_kernel_sse41.cpp PROPERTIES COMPILE_FLAGS "-march=x86-64-v2") + endif() + target_sources(onnxruntime_mlas PRIVATE @@ -25,14 +28,15 @@ index bee83ff07c..04b4cf42b7 100644 - ${MLAS_SRC_DIR}/qgemm_kernel_amx.cpp + ${mlas_platform_srcs_avx512} + ${mlas_platform_srcs_amx} ++ # ... ${MLAS_SRC_DIR}/qgemm_kernel_avx2.cpp ${MLAS_SRC_DIR}/qgemm_kernel_sse.cpp ${MLAS_SRC_DIR}/qgemm_kernel_sse41.cpp - ${MLAS_SRC_DIR}/intrinsics/avx512/quantize_avx512f.cpp - ${MLAS_SRC_DIR}/amd64/QgemmU8S8KernelAmx.asm - ${MLAS_SRC_DIR}/amd64/QgemmU8S8KernelAvx2.asm - ${MLAS_SRC_DIR}/amd64/QgemmU8U8KernelAvx2.asm -@@ -205,9 +217,15 @@ function(setup_mlas_source_for_windows) + ${MLAS_SRC_DIR}/sqnbitgemm_kernel_avx2.cpp + ${MLAS_SRC_DIR}/sqnbitgemm_kernel_avx512.cpp + ${MLAS_SRC_DIR}/sqnbitgemm_kernel_avx512vnni.cpp +@@ -208,9 +224,15 @@ function(setup_mlas_source_for_windows) ${MLAS_SRC_DIR}/amd64/ErfKernelFma3.asm ) if (NOT onnxruntime_ORT_MINIMAL_BUILD) @@ -48,20 +52,6 @@ index bee83ff07c..04b4cf42b7 100644 + target_sources(onnxruntime_mlas PRIVATE ${onnxruntime_mlas_q4gemm_avx512}) endif() else() - target_sources(onnxruntime_mlas PRIVATE -diff --git a/cmake/onnxruntime_mlas.cmake b/cmake/onnxruntime_mlas.cmake -index 5c294b5..a466c77 100644 ---- a/cmake/onnxruntime_mlas.cmake -+++ b/cmake/onnxruntime_mlas.cmake -@@ -169,6 +169,9 @@ function(setup_mlas_source_for_windows) - if (CMAKE_CXX_COMPILER_ID MATCHES "Clang") - set_source_files_properties(${mlas_platform_srcs_avx512} PROPERTIES COMPILE_FLAGS "/arch:AVX512") - set_source_files_properties(${mlas_platform_srcs_amx} PROPERTIES COMPILE_FLAGS "/arch:AVX512 -mamx-tile -mamx-int8") -+ # https://clang.llvm.org/docs/UsersManual.html#cpu-architectures-features-and-limitations -+ set_source_files_properties(${MLAS_SRC_DIR}/qgemm_kernel_sse.cpp PROPERTIES COMPILE_FLAGS "-march=x86-64") -+ set_source_files_properties(${MLAS_SRC_DIR}/qgemm_kernel_sse41.cpp PROPERTIES COMPILE_FLAGS "-march=x86-64-v2") - endif() - target_sources(onnxruntime_mlas PRIVATE diff --git a/onnxruntime/core/mlas/lib/qgemm_kernel_sse41.cpp b/onnxruntime/core/mlas/lib/qgemm_kernel_sse41.cpp index 68931c5..6c095bd 100644 diff --git a/ports/onnxruntime/fix-cmake-cuda.patch b/ports/onnxruntime/fix-cmake-cuda.patch new file mode 100644 index 00000000..137a019d --- /dev/null +++ b/ports/onnxruntime/fix-cmake-cuda.patch @@ -0,0 +1,37 @@ +diff --git a/cmake/CMakeLists.txt b/cmake/CMakeLists.txt +index f829cea..bda2d4c 100644 +--- a/cmake/CMakeLists.txt ++++ b/cmake/CMakeLists.txt +@@ -715,6 +715,13 @@ if (onnxruntime_USE_CUDA) + if (onnxruntime_USE_CUDA_NHWC_OPS) + add_compile_definitions(ENABLE_CUDA_NHWC_OPS) + endif() ++ # Give more hints for the generator, with FindCUDAToolkit.cmake ++ find_package(CUDAToolkit REQUIRED) ++ if(CMAKE_GENERATOR MATCHES "Visual Studio") ++ set(CMAKE_VS_PLATFORM_TOOLSET_CUDA "${CUDAToolkit_VERSION_MAJOR}.${CUDAToolkit_VERSION_MINOR}") ++ set(CMAKE_VS_PLATFORM_TOOLSET_CUDA_CUSTOM_DIR "${CUDAToolkit_TARGET_DIR}/") ++ endif() ++ get_filename_component(CMAKE_CUDA_COMPILER "${CUDAToolkit_NVCC_EXECUTABLE}" ABSOLUTE) + enable_language(CUDA) + message( STATUS "CMAKE_CUDA_COMPILER_VERSION: ${CMAKE_CUDA_COMPILER_VERSION}") + +diff --git a/cmake/onnxruntime_providers_cuda.cmake b/cmake/onnxruntime_providers_cuda.cmake +index 1346a9c..fd60dd8 100644 +--- a/cmake/onnxruntime_providers_cuda.cmake ++++ b/cmake/onnxruntime_providers_cuda.cmake +@@ -211,8 +211,12 @@ + target_link_libraries(${target} PRIVATE CUDA::cuda_driver) + endif() + +- include(cutlass) +- target_include_directories(${target} PRIVATE ${cutlass_SOURCE_DIR}/include ${cutlass_SOURCE_DIR}/examples ${cutlass_SOURCE_DIR}/tools/util/include) ++ find_package(NvidiaCutlass REQUIRED) ++ target_link_libraries(${target} PRIVATE nvidia::cutlass::cutlass) ++ if(MSVC) ++ # CUTLASS_CONSTEXPR_IF_CXX17 must be constexpr. Correct the __cplusplus value with MSVC ++ target_compile_options(${target} PRIVATE $<$:-Xcompiler /Zc:__cplusplus>) ++ endif() + + target_include_directories(${target} PRIVATE ${ONNXRUNTIME_ROOT} ${CMAKE_CURRENT_BINARY_DIR} ${eigen_INCLUDE_DIRS} ${TVM_INCLUDES} + PUBLIC ${CUDAToolkit_INCLUDE_DIRS}) diff --git a/ports/onnxruntime/fix-cmake-training.patch b/ports/onnxruntime/fix-cmake-training.patch new file mode 100644 index 00000000..87fa6afe --- /dev/null +++ b/ports/onnxruntime/fix-cmake-training.patch @@ -0,0 +1,43 @@ +diff --git a/cmake/tensorboard/compat/proto/CMakeLists.txt b/cmake/tensorboard/compat/proto/CMakeLists.txt +index ad31e40..3e80a6e 100644 +--- a/cmake/tensorboard/compat/proto/CMakeLists.txt ++++ b/cmake/tensorboard/compat/proto/CMakeLists.txt +@@ -1,14 +1,21 @@ + # Copyright (c) Microsoft Corporation. All rights reserved. + # Licensed under the MIT License. + +-FetchContent_Declare( +- tensorboard +- URL ${DEP_URL_tensorboard} +- URL_HASH SHA1=${DEP_SHA1_tensorboard} +-) +-FetchContent_MakeAvailable(tensorboard) +- +-set(TENSORBOARD_ROOT ${tensorboard_SOURCE_DIR}) ++if(onnxruntime_USE_VCPKG) ++ if(NOT DEFINED TENSORBOARD_ROOT) ++ message(FATAL_ERROR "TENSORBOARD_ROOT not defined") ++ endif() ++ find_path(PROTOBUF_IMPORT_DIR NAMES "google/protobuf/api.proto" REQUIRED) ++else() ++ FetchContent_Declare( ++ tensorboard ++ URL ${DEP_URL_tensorboard} ++ URL_HASH SHA1=${DEP_SHA1_tensorboard} ++ ) ++ FetchContent_MakeAvailable(tensorboard) ++ set(TENSORBOARD_ROOT ${tensorboard_SOURCE_DIR}) ++ set(PROTOBUF_IMPORT_DIR ${protobuf_SOURCE_DIR}/src) ++endif() + + # tensorboard protos + file(GLOB_RECURSE tensorboard_proto_srcs CONFIGURE_DEPENDS +@@ -16,7 +23,7 @@ file(GLOB_RECURSE tensorboard_proto_srcs CONFIGURE_DEPENDS + ) + + add_library(tensorboard STATIC ${tensorboard_proto_srcs}) +-onnxruntime_protobuf_generate(APPEND_PATH IMPORT_DIRS ${tensorboard_SOURCE_DIR} ${protobuf_SOURCE_DIR}/src TARGET tensorboard) ++onnxruntime_protobuf_generate(APPEND_PATH IMPORT_DIRS ${TENSORBOARD_ROOT} ${PROTOBUF_IMPORT_DIR} TARGET tensorboard) + onnxruntime_add_include_to_target(tensorboard ${PROTOBUF_LIB}) + target_include_directories(tensorboard PRIVATE ${PROJECT_BINARY_DIR}) + add_dependencies(tensorboard ${onnxruntime_EXTERNAL_DEPENDENCIES}) diff --git a/ports/onnxruntime/fix-cmake.patch b/ports/onnxruntime/fix-cmake.patch index 075df607..69c4bc78 100644 --- a/ports/onnxruntime/fix-cmake.patch +++ b/ports/onnxruntime/fix-cmake.patch @@ -2,32 +2,15 @@ diff --git a/cmake/CMakeLists.txt b/cmake/CMakeLists.txt index 8edbb6ad6f..4987d5af5a 100644 --- a/cmake/CMakeLists.txt +++ b/cmake/CMakeLists.txt -@@ -38,6 +38,7 @@ include(CheckLanguage) +@@ -38,6 +38,8 @@ include(CheckLanguage) include(CMakeDependentOption) include(FetchContent) include(CheckFunctionExists) +include(GNUInstallDirs) # onnxruntime_providers_* require CMAKE_INSTALL_* variables ++list(APPEND CMAKE_MODULE_PATH "${CMAKE_CURRENT_SOURCE_DIR}/external") # TODO: update this once all system adapt c++20 if(CMAKE_SYSTEM_NAME STREQUAL "Darwin") -@@ -583,7 +584,7 @@ get_filename_component(ORTTRAINING_ROOT "${ORTTRAINING_ROOT}" ABSOLUTE) - get_filename_component(REPO_ROOT "${REPO_ROOT}" ABSOLUTE) - set(ONNXRUNTIME_INCLUDE_DIR ${REPO_ROOT}/include/onnxruntime) - --include(external/onnxruntime_external_deps.cmake) -+include(external/onnxruntime_vcpkg_deps.cmake) - - set(ORT_WARNING_FLAGS) - if (WIN32) -@@ -956,7 +975,7 @@ function(onnxruntime_set_compile_flags target_name) - target_compile_definitions(${target_name} PRIVATE ORT_NEURAL_SPEED) - endif() - -- set_target_properties(${target_name} PROPERTIES COMPILE_WARNING_AS_ERROR ON) -+ set_target_properties(${target_name} PROPERTIES COMPILE_WARNING_AS_ERROR OFF) - if (onnxruntime_USE_CUDA) - # Suppress a "conversion_function_not_usable" warning in gsl/span - target_compile_options(${target_name} PRIVATE "$<$:SHELL:-Xcudafe \"--diag_suppress=conversion_function_not_usable\">") diff --git a/cmake/onnxruntime.cmake b/cmake/onnxruntime.cmake index e15c8a046d..d3a2e64bb9 100644 --- a/cmake/onnxruntime.cmake @@ -66,50 +49,17 @@ index 66df115..bd313d8 100644 if (MSVC) # The warning means the type of two integral values around a binary operator is narrow than their result. -@@ -959,6 +959,9 @@ target_compile_definitions(onnx_test_data_proto PRIVATE "-DONNX_API=") +diff --git a/cmake/onnxruntime_unittests.cmake b/cmake/onnxruntime_unittests.cmake +index 2ae07d5..9ee95a7 100644 +--- a/cmake/onnxruntime_unittests.cmake ++++ b/cmake/onnxruntime_unittests.cmake +@@ -962,7 +962,8 @@ target_compile_definitions(onnx_test_data_proto PRIVATE "-DONNX_API=") onnxruntime_add_include_to_target(onnx_test_data_proto onnx_proto) target_include_directories(onnx_test_data_proto PRIVATE ${CMAKE_CURRENT_BINARY_DIR}) set_target_properties(onnx_test_data_proto PROPERTIES FOLDER "ONNXRuntimeTest") -+if(NOT DEFINED onnx_SOURCE_DIR) -+ find_path(onnx_SOURCE_DIR NAMES "onnx/onnx-ml.proto3" "onnx/onnx-ml.proto" REQUIRED) -+endif() - onnxruntime_protobuf_generate(APPEND_PATH IMPORT_DIRS ${onnx_SOURCE_DIR} TARGET onnx_test_data_proto) +-onnxruntime_protobuf_generate(APPEND_PATH IMPORT_DIRS ${onnx_SOURCE_DIR} TARGET onnx_test_data_proto) ++find_path(ONNX_IMPORT_DIR NAMES onnx/onnx-ml.proto REQUIRED) ++onnxruntime_protobuf_generate(APPEND_PATH IMPORT_DIRS ${ONNX_IMPORT_DIR} TARGET onnx_test_data_proto) # -diff --git a/cmake/CMakeLists.txt b/cmake/CMakeLists.txt -index f829cea..bda2d4c 100644 ---- a/cmake/CMakeLists.txt -+++ b/cmake/CMakeLists.txt -@@ -715,6 +715,13 @@ if (onnxruntime_USE_CUDA) - if (onnxruntime_USE_CUDA_NHWC_OPS) - add_compile_definitions(ENABLE_CUDA_NHWC_OPS) - endif() -+ # Give more hints for the generator, with FindCUDAToolkit.cmake -+ find_package(CUDAToolkit REQUIRED) -+ if(CMAKE_GENERATOR MATCHES "Visual Studio") -+ set(CMAKE_VS_PLATFORM_TOOLSET_CUDA "${CUDAToolkit_VERSION_MAJOR}.${CUDAToolkit_VERSION_MINOR}") -+ set(CMAKE_VS_PLATFORM_TOOLSET_CUDA_CUSTOM_DIR "${CUDAToolkit_TARGET_DIR}/") -+ endif() -+ get_filename_component(CMAKE_CUDA_COMPILER "${CUDAToolkit_NVCC_EXECUTABLE}" ABSOLUTE) - enable_language(CUDA) - message( STATUS "CMAKE_CUDA_COMPILER_VERSION: ${CMAKE_CUDA_COMPILER_VERSION}") - -diff --git a/cmake/onnxruntime_providers_cuda.cmake b/cmake/onnxruntime_providers_cuda.cmake -index 1346a9c..fd60dd8 100644 ---- a/cmake/onnxruntime_providers_cuda.cmake -+++ b/cmake/onnxruntime_providers_cuda.cmake -@@ -211,8 +211,12 @@ - target_link_libraries(${target} PRIVATE CUDA::cuda_driver) - endif() - -- include(cutlass) -- target_include_directories(${target} PRIVATE ${cutlass_SOURCE_DIR}/include ${cutlass_SOURCE_DIR}/examples ${cutlass_SOURCE_DIR}/tools/util/include) -+ find_package(NvidiaCutlass REQUIRED) -+ target_link_libraries(${target} PRIVATE nvidia::cutlass::cutlass) -+ if(MSVC) -+ # CUTLASS_CONSTEXPR_IF_CXX17 must be constexpr. Correct the __cplusplus value with MSVC -+ target_compile_options(${target} PRIVATE $<$:-Xcompiler /Zc:__cplusplus>) -+ endif() - - target_include_directories(${target} PRIVATE ${ONNXRUNTIME_ROOT} ${CMAKE_CURRENT_BINARY_DIR} ${eigen_INCLUDE_DIRS} ${TVM_INCLUDES} - PUBLIC ${CUDAToolkit_INCLUDE_DIRS}) + # onnxruntime_ir_graph test data diff --git a/ports/onnxruntime/fix-llvm-rc-unicode.patch b/ports/onnxruntime/fix-llvm-rc-unicode.patch deleted file mode 100644 index 6c8db167..00000000 --- a/ports/onnxruntime/fix-llvm-rc-unicode.patch +++ /dev/null @@ -1,16 +0,0 @@ -diff --git a/onnxruntime/core/dll/onnxruntime.rc b/onnxruntime/core/dll/onnxruntime.rc -index 4b08dfdb7e..c566a4f713 100644 ---- a/onnxruntime/core/dll/onnxruntime.rc -+++ b/onnxruntime/core/dll/onnxruntime.rc -@@ -32,9 +32,9 @@ BEGIN - VALUE "FileDescription", "ONNX Runtime" - VALUE "FileVersion", VER_STRING - VALUE "InternalName", "ONNX Runtime" -- VALUE "LegalCopyright", "\251 Microsoft Corporation. All rights reserved." -+ VALUE "LegalCopyright", L"\251 Microsoft Corporation. All rights reserved." - VALUE "OriginalFilename", FILE_NAME -- VALUE "ProductName", "Microsoft\256 Windows\256 Operating System" -+ VALUE "ProductName", L"Microsoft\256 Windows\256 Operating System" - VALUE "ProductVersion", VER_STRING - END - END diff --git a/ports/onnxruntime/fix-onnxruntime-pr-19966.patch b/ports/onnxruntime/fix-onnxruntime-pr-19966.patch deleted file mode 100644 index 874965d7..00000000 --- a/ports/onnxruntime/fix-onnxruntime-pr-19966.patch +++ /dev/null @@ -1,2284 +0,0 @@ -diff --git a/cmake/CMakeLists.txt b/cmake/CMakeLists.txt -index 02b568abdf8dad08b142c87418a4111340c710d8..6700c96d84cb411ce3100cb75a38babf6a3ac65b 100644 ---- a/cmake/CMakeLists.txt -+++ b/cmake/CMakeLists.txt -@@ -1290,34 +1290,6 @@ if (onnxruntime_USE_OPENVINO) - - add_definitions(-DUSE_OPENVINO=1) - -- if (EXISTS "$ENV{INTEL_OPENVINO_DIR}/deployment_tools/inference_engine/version.txt") -- file(READ $ENV{INTEL_OPENVINO_DIR}/deployment_tools/inference_engine/version.txt VER) -- endif() -- -- if (NOT DEFINED ENV{INTEL_OPENVINO_DIR}) -- message(FATAL_ERROR "[Couldn't locate OpenVINO] OpenVINO may not have been initialized") -- endif() -- -- # Check OpenVINO version for support -- if ($ENV{INTEL_OPENVINO_DIR} MATCHES "2023.0") -- set(OPENVINO_VERSION "2023.0") -- add_definitions(-DOPENVINO_2023_0=1) -- elseif ($ENV{INTEL_OPENVINO_DIR} MATCHES "2023.1") -- set(OPENVINO_VERSION "2023.1") -- add_definitions(-DOPENVINO_2023_1=1) -- elseif ($ENV{INTEL_OPENVINO_DIR} MATCHES "2023.2") -- set(OPENVINO_VERSION "2023.2") -- add_definitions(-DOPENVINO_2023_2=1) -- elseif ($ENV{INTEL_OPENVINO_DIR} MATCHES "2023.3") -- set(OPENVINO_VERSION "2023.3") -- add_definitions(-DOPENVINO_2023_3=1) -- elseif ($ENV{INTEL_OPENVINO_DIR} MATCHES "openvino") -- set(OPENVINO_VERSION "2023.3") -- add_definitions(-DOPENVINO_2023_3=1) -- else() -- message(FATAL_ERROR "Unsupported OpenVINO version: ${INTEL_OPENVINO_DIR}") -- endif() -- - if (onnxruntime_USE_OPENVINO_GPU_FP32) - add_definitions(-DOPENVINO_CONFIG_GPU_FP32=1) - endif() -@@ -1334,6 +1306,10 @@ if (onnxruntime_USE_OPENVINO) - add_definitions(-DOPENVINO_CONFIG_CPU_FP16=1) - endif() - -+ if (onnxruntime_USE_OPENVINO_NPU) -+ add_definitions(-DOPENVINO_CONFIG_NPU=1) -+ endif() -+ - if (onnxruntime_USE_OPENVINO_GPU_FP32_NP) - add_definitions(-DOPENVINO_CONFIG_GPU_FP32=1) - add_definitions(-DOPENVINO_DISABLE_GRAPH_PARTITION=1) -@@ -1354,6 +1330,11 @@ if (onnxruntime_USE_OPENVINO) - add_definitions(-DOPENVINO_DISABLE_GRAPH_PARTITION=1) - endif() - -+ if (onnxruntime_USE_OPENVINO_NPU_NP) -+ add_definitions(-DOPENVINO_CONFIG_NPU=1) -+ add_definitions(-DOPENVINO_DISABLE_GRAPH_PARTITION=1) -+ endif() -+ - if (onnxruntime_USE_OPENVINO_HETERO) - add_definitions(-DOPENVINO_CONFIG_HETERO=1) - add_definitions(-DDEVICE_NAME="${onnxruntime_USE_OPENVINO_DEVICE}") -diff --git a/cmake/onnxruntime_providers_openvino.cmake b/cmake/onnxruntime_providers_openvino.cmake -index e26f0bfc0b75183dd490bcebfbe4042055ae35f3..5876b2b5c448bcafdbd067f408be6b6b1993a3f5 100644 ---- a/cmake/onnxruntime_providers_openvino.cmake -+++ b/cmake/onnxruntime_providers_openvino.cmake -@@ -16,23 +16,19 @@ - endif() - - # Header paths -- find_package(InferenceEngine REQUIRED) -- find_package(ngraph REQUIRED) -- -- if (OPENVINO_2022_1 OR OPENVINO_2022_2) - find_package(OpenVINO REQUIRED COMPONENTS Runtime ONNX) -- list (OV_20_LIBS openvino::frontend::onnx openvino::runtime) -+ if(OpenVINO_VERSION VERSION_LESS 2023.0) -+ message(FATAL_ERROR "OpenVINO 2023.0 and newer are supported. Please, latest OpenVINO release") - endif() - - if (WIN32) - unset(CMAKE_MAP_IMPORTED_CONFIG_RELWITHDEBINFO) - endif() - -+ list(APPEND OPENVINO_LIB_LIST openvino::frontend::onnx openvino::runtime ${PYTHON_LIBRARIES}) - if ((DEFINED ENV{OPENCL_LIBS}) AND (DEFINED ENV{OPENCL_INCS})) - add_definitions(-DIO_BUFFER_ENABLED=1) -- list(APPEND OPENVINO_LIB_LIST $ENV{OPENCL_LIBS} ${OV_20_LIBS} ${InferenceEngine_LIBRARIES} ${NGRAPH_LIBRARIES} ngraph::onnx_importer ${PYTHON_LIBRARIES}) -- else() -- list(APPEND OPENVINO_LIB_LIST ${OV_20_LIBS} ${InferenceEngine_LIBRARIES} ${NGRAPH_LIBRARIES} ngraph::onnx_importer ${PYTHON_LIBRARIES}) -+ list(APPEND OPENVINO_LIB_LIST $ENV{OPENCL_LIBS}) - endif() - - source_group(TREE ${ONNXRUNTIME_ROOT}/core FILES ${onnxruntime_providers_openvino_cc_srcs}) -@@ -75,7 +71,14 @@ - message(FATAL_ERROR "onnxruntime_providers_openvino unknown platform, need to specify shared library exports for it") - endif() - -- install(TARGETS onnxruntime_providers_openvino -- ARCHIVE DESTINATION ${CMAKE_INSTALL_LIBDIR} -- LIBRARY DESTINATION ${CMAKE_INSTALL_LIBDIR} -- RUNTIME DESTINATION ${CMAKE_INSTALL_BINDIR}) -\ No newline at end of file -+ if (CMAKE_OPENVINO_LIBRARY_INSTALL_DIR) -+ install(TARGETS onnxruntime_providers_openvino -+ ARCHIVE DESTINATION ${CMAKE_INSTALL_LIBDIR} -+ LIBRARY DESTINATION ${CMAKE_OPENVINO_LIBRARY_INSTALL_DIR} -+ RUNTIME DESTINATION ${CMAKE_INSTALL_BINDIR}) -+ else() -+ install(TARGETS onnxruntime_providers_openvino -+ ARCHIVE DESTINATION ${CMAKE_INSTALL_LIBDIR} -+ LIBRARY DESTINATION ${CMAKE_INSTALL_LIBDIR} -+ RUNTIME DESTINATION ${CMAKE_INSTALL_BINDIR}) -+ endif() -diff --git a/dockerfiles/Dockerfile.openvino b/dockerfiles/Dockerfile.openvino -index 78d04a51ba162a2fd36425fb519d27878e335204..049916fac92f118722aba9ae6ab4cb734030ac6a 100644 ---- a/dockerfiles/Dockerfile.openvino -+++ b/dockerfiles/Dockerfile.openvino -@@ -1,9 +1,9 @@ - #------------------------------------------------------------------------- --# Copyright(C) 2021-2023 Intel Corporation. -+# Copyright(C) 2021-2024 Intel Corporation. - # SPDX-License-Identifier: MIT - #-------------------------------------------------------------------------- - --ARG OPENVINO_VERSION=2023.0.0 -+ARG OPENVINO_VERSION=2024.0.0 - - - # Build stage -@@ -17,7 +17,7 @@ ARG DEVICE=CPU_FP32 - ARG ONNXRUNTIME_REPO=https://github.com/microsoft/onnxruntime.git - ARG ONNXRUNTIME_BRANCH=main - --ENV InferenceEngine_DIR=${INTEL_OPENVINO_DIR}/runtime/cmake -+ENV OpenVINO_DIR=${INTEL_OPENVINO_DIR}/runtime/cmake - - USER root - RUN apt update; apt install -y git protobuf-compiler libprotobuf-dev -diff --git a/dockerfiles/Dockerfile.openvino-centos7 b/dockerfiles/Dockerfile.openvino-centos7 -deleted file mode 100755 -index 697db44801e3bc5b87d187a71bec797e977b2e4d..0000000000000000000000000000000000000000 ---- a/dockerfiles/Dockerfile.openvino-centos7 -+++ /dev/null -@@ -1,105 +0,0 @@ --#------------------------------------------------------------------------- --# Copyright(C) 2021 Intel Corporation. --# SPDX-License-Identifier: MIT --#-------------------------------------------------------------------------- -- --FROM centos:7.8.2003 -- --WORKDIR /code -- --ARG MY_ROOT=/code --ARG YUM_OV_PACKAGE=intel-openvino-runtime-centos7-2021.4.752.x86_64 --ARG DEVICE=CPU_FP32 --ARG ONNXRUNTIME_REPO=https://github.com/microsoft/onnxruntime --ARG ONNXRUNTIME_BRANCH=main -- --ENV INTEL_OPENVINO_DIR=/opt/intel/openvino_2021.4.752 --ENV InferenceEngine_DIR=${INTEL_OPENVINO_DIR}/deployment_tools/inference_engine/share --ENV IE_PLUGINS_PATH=${INTEL_OPENVINO_DIR}/deployment_tools/inference_engine/lib/intel64 --ENV ngraph_DIR=${INTEL_OPENVINO_DIR}/deployment_tools/ngraph/cmake --ENV LD_LIBRARY_PATH=/opt/intel/opencl:${INTEL_OPENVINO_DIR}/inference_engine/external/gna/lib:${INTEL_OPENVINO_DIR}/deployment_tools/inference_engine/external/mkltiny_lnx/lib:$INTEL_OPENVINO_DIR/deployment_tools/ngraph/lib:${INTEL_OPENVINO_DIR}/deployment_tools/inference_engine/external/omp/lib:${INTEL_OPENVINO_DIR}/deployment_tools/inference_engine/external/tbb/lib:${IE_PLUGINS_PATH}:${LD_LIBRARY_PATH} --ENV OpenCV_DIR=${INTEL_OPENVINO_DIR}/opencv/share/OpenCV --ENV LD_LIBRARY_PATH=${INTEL_OPENVINO_DIR}/opencv/lib:${INTEL_OPENVINO_DIR}/opencv/share/OpenCV/3rdparty/lib:${LD_LIBRARY_PATH} --ENV HDDL_INSTALL_DIR=${INTEL_OPENVINO_DIR}/deployment_tools/inference_engine/external/hddl --ENV LD_LIBRARY_PATH=${INTEL_OPENVINO_DIR}/deployment_tools/inference_engine/external/hddl/lib:$LD_LIBRARY_PATH --ENV LD_LIBRARY_PATH=/usr/local/lib:/usr/lib:/usr/local/lib64:/usr/lib64:/lib64:$LD_LIBRARY_PATH -- --# Install packages --RUN yum update -y && \ -- yum groupinstall "Development Tools" -y && \ -- yum install -y yum-utils autoconf automake libtool unzip udev wget zlib-devel libffi-devel openssl-devel boost-devel-1.53.0 && \ -- yum clean packages && yum clean all && rm -rf /var/cache/yum && \ --# Install cmake -- cd $MY_ROOT && \ -- wget https://github.com/Kitware/CMake/releases/download/v3.27.3/cmake-3.27.3.tar.gz && \ -- tar -zxvf cmake-3.27.3.tar.gz && rm -rf cmake-3.27.3.tar.gz && \ -- cd cmake-3.27.3 && \ -- ./bootstrap && \ -- make && \ -- make install && \ -- cd $MY_ROOT && \ --# libusb1.0.22 -- cd /opt/ && wget https://github.com/libusb/libusb/archive/v1.0.22.zip && \ -- unzip v1.0.22.zip && rm -rf v1.0.22.zip && cd /opt/libusb-1.0.22 && \ --# bootstrap steps -- ./bootstrap.sh && \ -- ./configure --disable-udev --enable-shared && \ -- make -j4 && \ --# configure libusb1.0.22 -- cd /opt/libusb-1.0.22/libusb && \ -- /bin/mkdir -p '/usr/local/lib' && \ -- /bin/bash ../libtool --mode=install /usr/bin/install -c libusb-1.0.la '/usr/local/lib' && \ -- /bin/mkdir -p '/usr/local/include/libusb-1.0' && \ -- /usr/bin/install -c -m 644 libusb.h '/usr/local/include/libusb-1.0' && \ -- /bin/mkdir -p '/usr/local/lib/pkgconfig' && \ --# Install openvino -- yum-config-manager --add-repo https://yum.repos.intel.com/openvino/2021/setup/intel-openvino-2021.repo && \ -- rpm --import https://yum.repos.intel.com/openvino/2021/setup/RPM-GPG-KEY-INTEL-OPENVINO-2021 && \ -- yum update -y && yum list intel-openvino* && \ -- yum install -y $YUM_OV_PACKAGE && \ -- cd ${INTEL_OPENVINO_DIR}/install_dependencies/ && ./install_openvino_dependencies.sh -y && \ -- printf "\nexport LD_LIBRARY_PATH=\${LD_LIBRARY_PATH}:/usr/local/lib\n" >> /opt/intel/openvino_2021.4.752/bin/setupvars.sh && \ -- cd /opt/libusb-1.0.22 && \ -- /usr/bin/install -c -m 644 libusb-1.0.pc '/usr/local/lib/pkgconfig' && \ -- cp /opt/intel/openvino_2021/deployment_tools/inference_engine/external/97-myriad-usbboot.rules /etc/udev/rules.d/ && \ -- ldconfig && \ --# Install GPU runtime and drivers -- cd ${MY_ROOT} && \ -- mkdir /tmp/opencl && \ -- cd /tmp/opencl && \ -- yum install -y epel-release && \ -- yum install -y ocl-icd ocl-icd-devel && \ -- wget -O intel-igc-core-1.0.2597-1.el7.x86_64.rpm https://sourceforge.net/projects/intel-compute-runtime/files/19.41.14441/centos-7/intel-igc-core-1.0.2597-1.el7.x86_64.rpm/download && \ -- wget -O intel-opencl-19.41.14441-1.el7.x86_64.rpm https://sourceforge.net/projects/intel-compute-runtime/files/19.41.14441/centos-7/intel-opencl-19.41.14441-1.el7.x86_64.rpm/download && \ -- wget -O intel-igc-opencl-devel-1.0.2597-1.el7.x86_64.rpm https://sourceforge.net/projects/intel-compute-runtime/files/19.41.14441/centos-7/intel-igc-opencl-devel-1.0.2597-1.el7.x86_64.rpm/download && \ -- wget -O intel-igc-opencl-1.0.2597-1.el7.x86_64.rpm https://sourceforge.net/projects/intel-compute-runtime/files/19.41.14441/centos-7/intel-igc-opencl-1.0.2597-1.el7.x86_64.rpm/download && \ -- wget -O intel-gmmlib-19.3.2-1.el7.x86_64.rpm https://sourceforge.net/projects/intel-compute-runtime/files/19.41.14441/centos-7/intel-gmmlib-19.3.2-1.el7.x86_64.rpm/download && \ -- wget -O intel-gmmlib-devel-19.3.2-1.el7.x86_64.rpm https://sourceforge.net/projects/intel-compute-runtime/files/19.41.14441/centos-7/intel-gmmlib-devel-19.3.2-1.el7.x86_64.rpm/download && \ -- rpm -i /tmp/opencl/*.rpm && \ -- ldconfig && \ -- rm -rf /tmp/opencl && \ --# Installing gcc-10 -- yum install -y centos-release-scl && \ -- yum install -y devtoolset-10-gcc* && \ -- echo 'source scl_source enable devtoolset-10' >> ~/.bashrc && \ --# python installation -- source scl_source enable devtoolset-10 && \ -- cd /code/ && \ -- wget https://www.python.org/ftp/python/3.8.3/Python-3.8.3.tgz && tar xvf Python-3.8.3.tgz && \ -- cd Python-3.8*/ && ./configure && make && make install && \ -- cd ../ && mkdir -p /usr/bin/Python38 && ln -s Python-3.8.3/ /usr/bin/Python38 && \ --# installing dependancies -- yum install -y python3-lxml python3-six libusb.x86_64 && \ -- yum clean packages && yum clean all && rm -rf /var/cache/yum && \ --# Build onnxruntime -- cd $MY_ROOT && \ -- pip3 install numpy wheel setuptools cython && \ -- git clone --recursive -b ${ONNXRUNTIME_BRANCH} ${ONNXRUNTIME_REPO} && \ -- pip3 install onnx && \ -- cd /code/onnxruntime && ./build.sh --allow_running_as_root --config Release --update --build --parallel --use_openvino ${DEVICE} --build_shared_lib --build_wheel && \ -- pip3 install /code/onnxruntime/build/Linux/Release/dist/*-linux_x86_64.whl && \ --# Clean up -- cd $MY_ROOT && rm -rf onnxruntime Python-3* && \ -- cd ${MY_ROOT}/ && rm -rf cmake* && \ -- cd /usr/share/ && rm -rf gcc* && cd /usr/lib/ && rm -rf gcc cd && rm -rf .cache && \ -- cd ${INTEL_OPENVINO_DIR}/ && rm -rf documentation data_processing && cd deployment_tools/ && rm -rf tools -diff --git a/dockerfiles/Dockerfile.openvino-csharp b/dockerfiles/Dockerfile.openvino-csharp -deleted file mode 100644 -index 2529ef4b7320925b9ebeb66e3b5209b1c1623979..0000000000000000000000000000000000000000 ---- a/dockerfiles/Dockerfile.openvino-csharp -+++ /dev/null -@@ -1,90 +0,0 @@ --#------------------------------------------------------------------------- --# Copyright(C) 2021-2023 Intel Corporation. --# SPDX-License-Identifier: MIT --#-------------------------------------------------------------------------- -- --ARG OPENVINO_VERSION=2023.0.0 -- --# Build stage --FROM openvino/ubuntu20_runtime:${OPENVINO_VERSION} AS base -- --ENV WORKDIR_PATH=/home/openvino --WORKDIR $WORKDIR_PATH --ENV DEBIAN_FRONTEND noninteractive -- --USER root --RUN apt update; apt install -y --no-install-recommends wget gnupg && \ -- rm -rf /var/lib/apt/lists/* -- --# Install Mono --RUN wget http://download.mono-project.com/repo/xamarin.gpg && apt-key add xamarin.gpg && rm xamarin.gpg && \ -- echo "deb https://download.mono-project.com/repo/ubuntu stable-bionic main" | tee /etc/apt/sources.list.d/mono-official-stable.list && \ -- apt update -y && \ -- apt install -y mono-devel -- --# Install nuget.exe --RUN wget https://dist.nuget.org/win-x86-commandline/latest/nuget.exe && \ -- mv nuget.exe /usr/local/bin/nuget.exe && \ -- echo 'mono /usr/local/bin/nuget.exe $@' > /usr/local/bin/nuget && \ -- chmod a+x /usr/local/bin/nuget -- --# Install .NET core --RUN wget https://packages.microsoft.com/config/ubuntu/20.04/packages-microsoft-prod.deb -O packages-microsoft-prod.deb && \ -- dpkg -i packages-microsoft-prod.deb && \ -- apt-get update -y &&\ -- apt-get install -y apt-transport-https && \ -- apt-get update -y && \ -- apt-get install -y dotnet-sdk-5.0 -- --# Build stage --FROM base AS builder -- --ENV WORKDIR_PATH=/home/openvino --WORKDIR $WORKDIR_PATH --ENV DEBIAN_FRONTEND noninteractive -- --ARG DEVICE=CPU_FP32 --ARG ONNXRUNTIME_REPO=https://github.com/microsoft/onnxruntime.git --ARG ONNXRUNTIME_BRANCH=main -- --ENV InferenceEngine_DIR=${INTEL_OPENVINO_DIR}/runtime/cmake --ENV LANG en_US.UTF-8 -- --USER root --RUN apt update; apt install -y --no-install-recommends git protobuf-compiler libprotobuf-dev ca-certificates unattended-upgrades && \ -- unattended-upgrade && \ -- rm -rf /var/lib/apt/lists/* -- --RUN git clone --recursive -b ${ONNXRUNTIME_BRANCH} ${ONNXRUNTIME_REPO} --RUN /bin/sh onnxruntime/dockerfiles/scripts/install_common_deps.sh --RUN ln -s cmake-* cmake-dir --RUN python3 -m pip install wheel --ENV PATH=${WORKDIR_PATH}/cmake-dir/bin:$PATH --RUN pip3 install onnx --RUN ln -s /usr/bin/python3 /usr/bin/python --RUN apt install locales && \ -- locale-gen en_US en_US.UTF-8 && \ -- dpkg-reconfigure locales --RUN cd onnxruntime && ./build.sh --allow_running_as_root --config Release --update --build --parallel --use_openvino ${DEVICE} --build_nuget --build_shared_lib --RUN cp /home/openvino/onnxruntime/build/Linux/Release/Microsoft.ML.OnnxRuntime.Managed* /home/openvino/onnxruntime/build/Linux/Release/nuget-artifacts -- --# Deploy stage --FROM base -- --ENV DEBIAN_FRONTEND noninteractive --USER root -- --RUN apt update; apt install -y unattended-upgrades fonts-freefont-ttf && \ -- unattended-upgrade --ARG BUILD_UID=1001 --ARG BUILD_USER=onnxruntimedev --RUN adduser --uid $BUILD_UID $BUILD_USER --RUN usermod -a -G video,users ${BUILD_USER} --ENV WORKDIR_PATH /home/${BUILD_USER} --WORKDIR ${WORKDIR_PATH} --COPY --from=builder /home/openvino/onnxruntime/build/Linux/Release/nuget-artifacts ${WORKDIR_PATH}/nuget-artifacts -- --USER ${BUILD_USER} --ENV PATH=${WORKDIR_PATH}/miniconda/bin:${WORKDIR_PATH}/cmake-dir/bin:$PATH --ENV IE_PLUGINS_PATH=${INTEL_OPENVINO_DIR}/runtime/lib/intel64 --ENV LD_LIBRARY_PATH=/opt/intel/opencl:${INTEL_OPENVINO_DIR}/runtime/3rdparty/tbb/lib:${IE_PLUGINS_PATH}:${LD_LIBRARY_PATH} -diff --git a/dockerfiles/Dockerfile.openvino-rhel8 b/dockerfiles/Dockerfile.openvino-rhel8 -deleted file mode 100644 -index 5c504cfa553a17eb58b46c27d04fb2c5ff5d969d..0000000000000000000000000000000000000000 ---- a/dockerfiles/Dockerfile.openvino-rhel8 -+++ /dev/null -@@ -1,87 +0,0 @@ --# Build stage --FROM registry.access.redhat.com/ubi8/ubi:8.4 -- --WORKDIR /code -- --ARG MY_ROOT=/code --ARG DEVICE=CPU_FP32 --ARG ONNXRUNTIME_REPO=https://github.com/microsoft/onnxruntime --ARG ONNXRUNTIME_BRANCH=main -- --ENV INTEL_OPENVINO_DIR=/opt/intel/openvino_2022.3.0 -- --ENV InferenceEngine_DIR=${INTEL_OPENVINO_DIR}/runtime/cmake --ENV IE_PLUGINS_PATH=${INTEL_OPENVINO_DIR}/runtime/lib/intel64/ --ENV ngraph_DIR=${INTEL_OPENVINO_DIR}/runtime/cmake --ENV LD_LIBRARY_PATH=${INTEL_OPENVINO_DIR}/runtime/3rdparty/tbb/lib/:${IE_PLUGINS_PATH}:${LD_LIBRARY_PATH} --ENV OpenCV_DIR=${INTEL_OPENVINO_DIR}/extras/opencv/cmake --ENV LD_LIBRARY_PATH=${INTEL_OPENVINO_DIR}/extras/opencv/lib:${LD_LIBRARY_PATH} --ENV LD_LIBRARY_PATH=/usr/local/lib:/usr/lib:/usr/local/lib64:/usr/lib64:/lib64:${LD_LIBRARY_PATH} --ENV PATH=${MY_ROOT}/cmake-dir/bin:$PATH -- --# Install packages --RUN yum install -y yum-utils autoconf automake libtool unzip udev wget zlib-devel libffi-devel openssl-devel git make gcc && \ -- yum clean packages && yum clean all && rm -rf /var/cache/yum && \ --# Install python 3.8 -- cd $MY_ROOT && \ -- wget https://www.python.org/ftp/python/3.8.9/Python-3.8.9.tgz && tar xvf Python-3.8.9.tgz && rm -rf Python-3.8.9.tgz && \ -- cd Python-3.8*/ && ./configure && make && make install && \ -- cd ../ && mkdir -p /usr/bin/Python38 && ln -s Python-3.8.9/ /usr/bin/Python38 && ln -s /usr/bin/pip3 /usr/bin/pip && \ --# libusb1.0.22 -- cd /opt/ && wget https://github.com/libusb/libusb/archive/v1.0.22.zip && \ -- unzip v1.0.22.zip && rm -rf v1.0.22.zip && cd /opt/libusb-1.0.22 && \ --# bootstrap steps -- ./bootstrap.sh && \ -- ./configure --disable-udev --enable-shared && \ -- make -j4 && \ --# configure libusb1.0.22 -- cd /opt/libusb-1.0.22/libusb && \ -- /bin/mkdir -p '/usr/local/lib' && \ -- /bin/bash ../libtool --mode=install /usr/bin/install -c libusb-1.0.la '/usr/local/lib' && \ -- /bin/mkdir -p '/usr/local/include/libusb-1.0' && \ -- /usr/bin/install -c -m 644 libusb.h '/usr/local/include/libusb-1.0' && \ -- /bin/mkdir -p '/usr/local/lib/pkgconfig' && \ --# Install openvino -- cd /opt/ && mkdir intel/ && cd intel && \ -- wget https://storage.openvinotoolkit.org/repositories/openvino/packages/2022.3/linux/l_openvino_toolkit_rhel8_2022.3.0.9052.9752fafe8eb_x86_64.tgz && \ -- tar xvf l_openvino_toolkit_rhel8_2022.3.0.9052.9752fafe8eb_x86_64.tgz && \ -- rm -rf l_openvino_toolkit_rhel8_2022.3.0.9052.9752fafe8eb_x86_64.tgz && \ -- mv l_openvino_toolkit_rhel8_2022.3.0.9052.9752fafe8eb_x86_64 openvino_2022.3.0 && \ -- cd ${INTEL_OPENVINO_DIR}/install_dependencies/ && ./install_openvino_dependencies.sh -y && ./install_NEO_OCL_driver.sh -y && \ -- printf "\nexport LD_LIBRARY_PATH=\${LD_LIBRARY_PATH}:/usr/local/lib\n" >> /opt/intel/openvino_2022.3.0/setupvars.sh && \ -- cd /opt/libusb-1.0.22 && \ -- /usr/bin/install -c -m 644 libusb-1.0.pc '/usr/local/lib/pkgconfig' && \ -- # MYRIAD plugins are not available for openvino 2022.3.0 release -- #cp /opt/intel/openvino_2022.3.0/install_dependencies/97-myriad-usbboot.rules /etc/udev/rules.d/ && \ -- ldconfig && \ --#Install protobuf -- cd $MY_ROOT && \ -- git clone https://github.com/protocolbuffers/protobuf.git && \ -- cd protobuf && \ -- git checkout v3.16.0 && \ -- git submodule update --init --recursive && \ -- mkdir build_source && cd build_source && \ -- cmake ../cmake -DCMAKE_INSTALL_LIBDIR=lib64 -Dprotobuf_BUILD_SHARED_LIBS=OFF -DCMAKE_INSTALL_PREFIX=/usr -DCMAKE_INSTALL_SYSCONFDIR=/etc -DCMAKE_POSITION_INDEPENDENT_CODE=ON -Dprotobuf_BUILD_TESTS=OFF -DCMAKE_BUILD_TYPE=Release && \ -- make -j$(nproc) && \ -- make install && \ --# Build onnxruntime -- cd $MY_ROOT && \ -- pip3 install numpy wheel setuptools cython onnx && \ -- git clone --recursive -b ${ONNXRUNTIME_BRANCH} ${ONNXRUNTIME_REPO} && \ -- bash onnxruntime/dockerfiles/scripts/install_common_deps.sh && \ -- ln -s cmake-* cmake-dir && \ -- source /opt/intel/openvino_2022.3.0/setupvars.sh && \ -- cd /code/onnxruntime && ./build.sh --allow_running_as_root --config Release --update --build --parallel --use_openvino ${DEVICE} --build_shared_lib --build_wheel && \ -- pip3 install /code/onnxruntime/build/Linux/Release/dist/*-linux_x86_64.whl && \ --# Clean up -- cd ${MY_ROOT} && rm -rf onnxruntime && rm -rf Python-3.8.9 && rm -rf protobuf -- --# Deploy stage --ARG BUILD_UID=1001 --ARG BUILD_USER=onnxruntimedev --RUN adduser --uid $BUILD_UID $BUILD_USER --RUN usermod -a -G video,users,render ${BUILD_USER} --ENV WORKDIR_PATH /home/${BUILD_USER} -- --WORKDIR ${WORKDIR_PATH} --USER ${BUILD_USER} -diff --git a/onnxruntime/core/providers/openvino/backend_manager.cc b/onnxruntime/core/providers/openvino/backend_manager.cc -index 330b464ffd1bb8804e0b9aa6084c0912931d7126..3252603e333897f8ba9ee5e26041201e77267d2b 100644 ---- a/onnxruntime/core/providers/openvino/backend_manager.cc -+++ b/onnxruntime/core/providers/openvino/backend_manager.cc -@@ -1,8 +1,9 @@ --// Copyright (C) 2019-2022 Intel Corporation -+// Copyright (C) Intel Corporation - // Licensed under the MIT License - - #include - #include -+#include - - #include "core/providers/shared_library/provider_api.h" - #include "contexts.h" -@@ -24,15 +25,6 @@ BackendManager::BackendManager(const GlobalContext& global_context, - global_context_ = global_context; - - auto prec_str = GetGlobalContext().precision_str; -- if (prec_str == "FP32") { -- subgraph_context_.precision = "FP32"; -- } else if (prec_str == "FP16") { -- subgraph_context_.precision = "FP16"; -- } else if (prec_str == "U8") { -- subgraph_context_.precision = "U8"; -- } else { -- throw std::string("Invalid OpenVINO Precision type: " + prec_str); -- } - - // Save the indexes of graph inputs among fused_node's inputDefs - // (which also contains initializers). -@@ -47,7 +39,7 @@ BackendManager::BackendManager(const GlobalContext& global_context, - for (auto input : graph_inputs) { - auto it = subgraph_context_.input_names.find(input->Name()); - if (it == subgraph_context_.input_names.end()) { -- throw std::string("Input not found in the input defs list"); -+ ORT_THROW("Input not found in the input defs list"); - } - int index = it->second; - subgraph_context_.input_indexes.push_back(index); -@@ -61,6 +53,7 @@ BackendManager::BackendManager(const GlobalContext& global_context, - } - subgraph_context_.subgraph_name = fused_node.Name(); - model_proto_ = GetModelProtoFromFusedNode(fused_node, subgraph, logger); -+ std::string device_type = openvino_ep::BackendManager::GetGlobalContext().device_type; - - if (ModelHasSymbolicInputDims(subgraph)) { - subgraph_context_.has_dynamic_input_shape = true; -@@ -75,7 +68,7 @@ BackendManager::BackendManager(const GlobalContext& global_context, - GetGlobalContext(), - subgraph_context_); - } catch (std::string const& msg) { -- throw msg; -+ ORT_THROW(msg); - } - LOGS_DEFAULT(INFO) << "[OpenVINO-EP] " - << "Backend created for graph " << subgraph_context_.subgraph_name; -@@ -87,12 +80,29 @@ BackendManager::BackendManager(const GlobalContext& global_context, - << subgraph_context_.subgraph_name; - - subgraph_context_.has_dynamic_input_shape = false; -+ -+ // OV NPU plugin is supported with fallback to OV CPU upon compilation failures. - try { - concrete_backend_ = BackendFactory::MakeBackend(*model_proto_, - GetGlobalContext(), - subgraph_context_); -- } catch (std::string const& msg) { -- throw msg; -+ } catch (const OnnxRuntimeException& ex) { -+ if (device_type.find("NPU") != std::string::npos) { -+ LOGS_DEFAULT(WARNING) << ex.what(); -+ LOGS_DEFAULT(WARNING) << "Model compilation failed at OV NPU." -+ << "Falling back to OV CPU for execution"; -+ GetGlobalContext().device_type = "CPU"; -+ GetGlobalContext().precision_str = "FP32"; -+ try { -+ concrete_backend_ = BackendFactory::MakeBackend(*model_proto_, -+ GetGlobalContext(), -+ subgraph_context_); -+ } catch (std::string const& msg) { -+ ORT_THROW(msg); -+ } -+ } else { -+ ORT_THROW(ex.what()); -+ } - } - } - } -@@ -254,8 +264,13 @@ void BackendManager::Compute(OrtKernelContext* context) { - LOGS_DEFAULT(INFO) << "Start Compute"; - } - #endif -+ // OV NPU doesn't support dynamic shaped model inference. -+ // if disable_dynamic_shapes is set to true then execution of dynamic model is done -+ // by rewriting the model to static shaped model at runtime based on input shape. -+ // disable_dynamic_shapes is always set to true for OV NPU plugin. - bool use_dynamic_backend = true; -- if (!GetGlobalContext().disable_dynamic_shapes && subgraph_context_.has_dynamic_input_shape && -+ if (subgraph_context_.has_dynamic_input_shape && -+ !GetGlobalContext().disable_dynamic_shapes && - (GetGlobalContext().device_type.find("CPU") != std::string::npos || - GetGlobalContext().device_type.find("GPU") != std::string::npos)) { - concrete_backend_->Infer(context); -@@ -263,12 +278,11 @@ void BackendManager::Compute(OrtKernelContext* context) { - } else if (use_dynamic_backend && subgraph_context_.has_dynamic_input_shape) { - std::vector> tensor_shapes = GetInputTensorShapes(ctx); - auto key = MakeMapKeyString(tensor_shapes, GetGlobalContext().device_type); -- - std::shared_ptr dynamic_backend; - auto search = backend_map_.find(key); - if (search == backend_map_.end()) { - LOGS_DEFAULT(INFO) << "[OpenVINO-EP] " -- << "Creating concrete backend for key: " << key; -+ << "Creating dynamic backend for key: " << key; - LOGS_DEFAULT(INFO) << "[OpenVINO-EP] " - << "Backend created for graph " << subgraph_context_.subgraph_name; - auto modelproto_with_concrete_shapes = ReWriteInputShapeInfo(*model_proto_, tensor_shapes); -@@ -276,8 +290,22 @@ void BackendManager::Compute(OrtKernelContext* context) { - dynamic_backend = BackendFactory::MakeBackend(*modelproto_with_concrete_shapes, - GetGlobalContext(), - subgraph_context_); -- } catch (std::string const& msg) { -- throw msg; -+ } catch (const OnnxRuntimeException& ex) { -+ if (GetGlobalContext().device_type.find("NPU") != std::string::npos) { -+ LOGS_DEFAULT(WARNING) << ex.what(); -+ LOGS_DEFAULT(WARNING) << "Model compilation failed at OV NPU." -+ << "Falling back to OV CPU for execution"; -+ GetGlobalContext().device_type = "CPU"; -+ GetGlobalContext().precision_str = "FP32"; -+ key = MakeMapKeyString(tensor_shapes, GetGlobalContext().device_type); -+ try { -+ dynamic_backend = BackendFactory::MakeBackend(*modelproto_with_concrete_shapes, -+ GetGlobalContext(), -+ subgraph_context_); -+ } catch (std::string const& msg) { -+ ORT_THROW(msg); -+ } -+ } - } - backend_map_.insert({key, dynamic_backend}); - } else { -diff --git a/onnxruntime/core/providers/openvino/backend_manager.h b/onnxruntime/core/providers/openvino/backend_manager.h -index 59bda7ca640ee3c130fa1d2193110b1c320408c4..376ebea225a2bef7b285e9a6580ef7c03ae04076 100644 ---- a/onnxruntime/core/providers/openvino/backend_manager.h -+++ b/onnxruntime/core/providers/openvino/backend_manager.h -@@ -1,4 +1,4 @@ --// Copyright (C) 2019-2022 Intel Corporation -+// Copyright (C) Intel Corporation - // Licensed under the MIT License - - #pragma once -diff --git a/onnxruntime/core/providers/openvino/backend_utils.cc b/onnxruntime/core/providers/openvino/backend_utils.cc -index 50c839017df2a00ca18104596e40d1d4a5d35bd3..32b5ad7d5b66debf18faa4fddb22abd1f4ed3dc3 100644 ---- a/onnxruntime/core/providers/openvino/backend_utils.cc -+++ b/onnxruntime/core/providers/openvino/backend_utils.cc -@@ -1,4 +1,4 @@ --// Copyright (C) 2019-2022 Intel Corporation -+// Copyright (C) Intel Corporation - // Licensed under the MIT License - - #include -@@ -11,12 +11,7 @@ - #include "core/providers/shared_library/provider_api.h" - #include "backend_utils.h" - --#if defined(OV_API_20) - using Exception = ov::Exception; --#else --using Exception = InferenceEngine::details::InferenceEngineException; --using WaitMode = InferenceEngine::IInferRequest::WaitMode; --#endif - - namespace onnxruntime { - namespace openvino_ep { -@@ -47,7 +42,6 @@ struct static_cast_int64 { - - std::shared_ptr - CreateOVModel(const ONNX_NAMESPACE::ModelProto& model_proto, const GlobalContext& global_context, -- const SubGraphContext& subgraph_context, - std::map>& const_outputs_map) { - if (IsCILogEnabled()) { - std::cout << "CreateNgraphFunc" << std::endl; -@@ -55,28 +49,6 @@ CreateOVModel(const ONNX_NAMESPACE::ModelProto& model_proto, const GlobalContext - const std::string model = model_proto.SerializeAsString(); - try { - auto cnn_network = global_context.ie_core.ReadModel(model, global_context.onnx_model_path_name); -- if ((subgraph_context.precision == "FP16") && -- (global_context.device_type.find("NPU") == std::string::npos)) { -- // FP16 transformations -- ov::pass::ConvertFP32ToFP16 pass_obj; -- pass_obj.run_on_model(cnn_network); -- cnn_network->validate_nodes_and_infer_types(); -- -- auto proc = ov::preprocess::PrePostProcessor(cnn_network); -- for (size_t i = 0; i < cnn_network->inputs().size(); i++) { -- if (cnn_network->inputs()[i].get_element_type() == ov::element::f16) { -- proc.input(i).tensor().set_element_type(ov::element::f32); -- proc.input(i).preprocess().convert_element_type(ov::element::f16); -- } -- } -- -- for (size_t i = 0; i < cnn_network->outputs().size(); i++) { -- if (cnn_network->outputs()[i].get_element_type() == ov::element::f16) { -- proc.output(i).postprocess().convert_element_type(ov::element::f32); -- } -- } -- cnn_network = proc.build(); -- } - - // Check for Constant Folding - if (!global_context.is_wholly_supported_graph) { -@@ -103,7 +75,7 @@ CreateOVModel(const ONNX_NAMESPACE::ModelProto& model_proto, const GlobalContext - #endif - return cnn_network; - } catch (std::string const& msg) { -- throw msg; -+ ORT_THROW(msg); - } - } - -@@ -127,7 +99,7 @@ GetOutputTensor(Ort::KernelContext& context, size_t batch_size, - } - auto it = output_names.find(output_name); - if (it == output_names.end()) { -- throw std::string(log_tag + "Output names mismatch between OpenVINO and ONNX"); -+ ORT_THROW(log_tag + "Output names mismatch between OpenVINO and ONNX"); - } - int index = it->second; - return context.GetOutput(index, output_shape.get(), num_dims); -@@ -145,7 +117,7 @@ GetOutputTensor(Ort::KernelContext& context, - - auto it = output_names.find(output_name); - if (it == output_names.end()) { -- throw std::string(log_tag + "Output names mismatch between OpenVINO and ONNX"); -+ ORT_THROW(log_tag + "Output names mismatch between OpenVINO and ONNX"); - } - int index = it->second; - auto shape = node->get_shape(); -@@ -204,7 +176,7 @@ void FillOutputsWithConstantData(std::shared_ptr node, Ort::UnownedVal - break; - } - default: -- throw std::string(log_tag + "Unsupported output data type"); -+ ORT_THROW(log_tag + "Unsupported output data type"); - } - } - -@@ -232,7 +204,7 @@ void FillInputBlob(OVTensorPtr inputBlob, size_t batch_slice_idx, - auto tensor = context.GetInput(subgraph_context.input_names.at(input_name)); - auto mem_info = tensor.GetTensorMemoryInfo(); - if (mem_info.GetAllocatorName() == OpenVINO_GPU) { -- throw std::string(log_tag + "IO Buffering is not enabled, Please enable Input on CPU"); -+ ORT_THROW(log_tag + "IO Buffering is not enabled, Please enable Input on CPU"); - } - // Copy input data into OpenVINO's input buffer - const char* tensor_data = tensor.GetTensorData(); -diff --git a/onnxruntime/core/providers/openvino/backend_utils.h b/onnxruntime/core/providers/openvino/backend_utils.h -index 82b0351e87da5d901e58249ae942d210fb4603de..93fa874774469214be3afafd3c46714046483707 100644 ---- a/onnxruntime/core/providers/openvino/backend_utils.h -+++ b/onnxruntime/core/providers/openvino/backend_utils.h -@@ -1,4 +1,4 @@ --// Copyright (C) 2019-2022 Intel Corporation -+// Copyright (C) Intel Corporation - // Licensed under the MIT License - - #pragma once -@@ -65,7 +65,6 @@ void FillOutputBlob(OVTensorPtr outputBlob, Ort::UnownedValue& output_tensor, - std::shared_ptr - CreateOVModel(const ONNX_NAMESPACE::ModelProto& model_proto, - const GlobalContext& global_context, -- const SubGraphContext& subgraph_context, - std::map>& const_outputs_map); - - void printPerformanceCounts(const std::vector& performanceMap, -diff --git a/onnxruntime/core/providers/openvino/backends/backend_factory.cc b/onnxruntime/core/providers/openvino/backends/backend_factory.cc -index c586dd8b38af98198476e474aa9315c58b016664..a0f4ce8f843b060c1c10e49f3f69c344323be096 100644 ---- a/onnxruntime/core/providers/openvino/backends/backend_factory.cc -+++ b/onnxruntime/core/providers/openvino/backends/backend_factory.cc -@@ -1,4 +1,4 @@ --// Copyright (C) 2019-2022 Intel Corporation -+// Copyright (C) Intel Corporation - // Licensed under the MIT License - - #include -@@ -24,11 +24,11 @@ BackendFactory::MakeBackend(const ONNX_NAMESPACE::ModelProto& model_proto, - try { - concrete_backend_ = std::make_shared(model_proto, global_context, subgraph_context); - } catch (std::string const& msg) { -- throw msg; -+ ORT_THROW(msg); - } - return concrete_backend_; - } else { -- throw std::string("[OpenVINO-EP] Backend factory error: Unknown backend type: " + type); -+ ORT_THROW("[OpenVINO-EP] Backend factory error: Unknown backend type: " + type); - } - } - } // namespace openvino_ep -diff --git a/onnxruntime/core/providers/openvino/backends/basic_backend.cc b/onnxruntime/core/providers/openvino/backends/basic_backend.cc -index 0779940983aea0133e67b08c7a90b5066a6b5b28..69d234a7c55efd95451cfb75f74c05edfda81da4 100644 ---- a/onnxruntime/core/providers/openvino/backends/basic_backend.cc -+++ b/onnxruntime/core/providers/openvino/backends/basic_backend.cc -@@ -1,4 +1,4 @@ --// Copyright (C) 2019-2022 Intel Corporation -+// Copyright (C) Intel Corporation - // Licensed under the MIT License - - #include -@@ -79,20 +79,20 @@ BasicBackend::BasicBackend(const ONNX_NAMESPACE::ModelProto& model_proto, - subgraph_context_.subgraph_name); - LOGS_DEFAULT(INFO) << log_tag << "Loaded model to the plugin"; - } else { -- ie_cnn_network_ = CreateOVModel(model_proto, global_context_, subgraph_context_, const_outputs_map_); -+ ie_cnn_network_ = CreateOVModel(model_proto, global_context_, const_outputs_map_); - exe_network_ = global_context_.ie_core.LoadNetwork( - ie_cnn_network_, hw_target, device_config, subgraph_context_.subgraph_name); - LOGS_DEFAULT(INFO) << log_tag << "Loaded model to the plugin"; - } - #endif - } else { -- ie_cnn_network_ = CreateOVModel(model_proto, global_context_, subgraph_context_, const_outputs_map_); -+ ie_cnn_network_ = CreateOVModel(model_proto, global_context_, const_outputs_map_); - exe_network_ = global_context_.ie_core.LoadNetwork( - ie_cnn_network_, hw_target, device_config, subgraph_context_.subgraph_name); - LOGS_DEFAULT(INFO) << log_tag << "Loaded model to the plugin"; - } - } catch (const char* msg) { -- throw(msg); -+ ORT_THROW(msg); - } - - inferRequestsQueue_ = std::unique_ptr(new InferRequestsQueue(exe_network_, 1)); -@@ -125,21 +125,17 @@ void BasicBackend::PopulateConfigValue(ov::AnyMap& device_config) { - if (global_context_.device_type.find("NPU") != std::string::npos) { - std::pair device_property; - device_property = std::make_pair("NPU_COMPILER_TYPE", "DRIVER"); -+ -+ const std::string env_npu_compiler_type = onnxruntime::GetEnvironmentVar("ORT_OPENVINO_NPU_COMPILER_TYPE"); -+ if (!env_npu_compiler_type.empty()) { -+ device_property = std::make_pair("NPU_COMPILER_TYPE", env_npu_compiler_type); -+ } - device_config.emplace(ov::device::properties("NPU", device_property)); - } - } - - void BasicBackend::EnableCaching() { - if (!global_context_.cache_dir.empty()) { -- if (global_context_.is_wholly_supported_graph) { --#if defined(OPENVINO_2022_3) --#if defined(_WIN32) || defined(WIN32) || defined(__CYGWIN__) || defined(__MINGW32__) || defined(__BORLANDC__) -- _putenv_s("OV_GPU_CACHE_MODEL", "1"); --#else -- setenv("OV_GPU_CACHE_MODEL", "1", 1); --#endif --#endif -- } - LOGS_DEFAULT(INFO) << log_tag << "Enables Caching"; - global_context_.ie_core.SetCache(global_context_.cache_dir); - } -@@ -162,7 +158,7 @@ void BasicBackend::EnableStreams() { - (global_context_.device_type.find("HETERO") != std::string::npos) || - (global_context_.device_type.find("AUTO") != std::string::npos)) { - if (global_context_.num_streams != 1) { -- throw(log_tag + "Cannot set NUM_STREAMS to " + std::to_string(global_context_.num_streams) + " for device " + global_context_.device_type); -+ ORT_THROW(log_tag + "Cannot set NUM_STREAMS to " + std::to_string(global_context_.num_streams) + " for device " + global_context_.device_type); - } - // Do nothing - } else { -@@ -198,9 +194,9 @@ void BasicBackend::StartAsyncInference(Ort::KernelContext& context, OVInferReque - if (input_names.find(onnx_input_name) != input_names.end()) { - input_name = onnx_input_name; - } else { -- throw(log_tag + -- "Input names mismatch between OpenVINO and ONNX. " + onnx_input_name + -- " doesn't exist in the list of OpenVINO input tensor names"); -+ ORT_THROW(log_tag + -+ "Input names mismatch between OpenVINO and ONNX. " + onnx_input_name + -+ " doesn't exist in the list of OpenVINO input tensor names"); - } - size_t batch_slice_idx = 0; - if (subgraph_context_.has_dynamic_input_shape && -@@ -232,14 +228,14 @@ void BasicBackend::StartAsyncInference(Ort::KernelContext& context, OVInferReque - try { - infer_request->SetTensor(input_name, tensor_ptr); - } catch (const char* msg) { -- throw(msg); -+ ORT_THROW(msg); - } - } else { - OVTensorPtr graph_input_blob; - try { - graph_input_blob = infer_request->GetTensor(input_name); - } catch (const char* msg) { -- throw(msg); -+ ORT_THROW(msg); - } - FillInputBlob(graph_input_blob, batch_slice_idx, input_name, context, subgraph_context_); - } -@@ -248,7 +244,7 @@ void BasicBackend::StartAsyncInference(Ort::KernelContext& context, OVInferReque - // Start Async inference - infer_request->StartAsync(); - } catch (const char* msg) { -- throw(msg); -+ ORT_THROW(msg); - } - } - -@@ -274,10 +270,10 @@ void BasicBackend::StartRemoteAsyncInference(Ort::KernelContext& context, OVInfe - if (input_names.find(onnx_input_name) != input_names.end()) { - input_name = onnx_input_name; - } else { -- throw(log_tag + -- "Input names mismatch between OpenVINO and ONNX. " + -- onnx_input_name + -- " doesn't exist in the list of OpenVINO input tensor names"); -+ ORT_THROW(log_tag + -+ "Input names mismatch between OpenVINO and ONNX. " + -+ onnx_input_name + -+ " doesn't exist in the list of OpenVINO input tensor names"); - } - input_idx++; - // Kernel Context Input Buffer -@@ -322,7 +318,7 @@ void BasicBackend::StartRemoteAsyncInference(Ort::KernelContext& context, OVInfe - } - } - if (!output_name_found) { -- throw std::string( -+ ORT_THROW( - log_tag + - "Output names mismatch between OpenVINO and ONNX. [ONNX Output: ] " + - onnx_output_name + " doesn't exist in the list of OpenVINO output tensor names"); -@@ -344,7 +340,7 @@ void BasicBackend::StartRemoteAsyncInference(Ort::KernelContext& context, OVInfe - try { - infer_request->SetTensor(output_name, tensor_ptr); - } catch (const char* msg) { -- throw(msg); -+ ORT_THROW(msg); - } - } - } -@@ -352,7 +348,7 @@ void BasicBackend::StartRemoteAsyncInference(Ort::KernelContext& context, OVInfe - // Start Async inference - infer_request->StartAsync(); - } catch (const char* msg) { -- throw(msg); -+ ORT_THROW(msg); - } - } - #endif -@@ -382,17 +378,18 @@ void BasicBackend::CompleteAsyncInference(Ort::KernelContext& context, OVInferRe - } - } - if (!output_name_found) { -- throw(log_tag + -- "Output names mismatch between OpenVINO and ONNX. " -- "[ONNX Output: ] " + -- onnx_output_name + -- " doesn't exist in the " -- "list of OpenVINO output tensor names"); -+ ORT_THROW( -+ log_tag + -+ "Output names mismatch between OpenVINO and ONNX. " -+ "[ONNX Output: ] " + -+ onnx_output_name + -+ " doesn't exist in the " -+ "list of OpenVINO output tensor names"); - } - try { - graph_output_blob = infer_request->GetTensor(output_name); - } catch (const char* msg) { -- throw(msg); -+ ORT_THROW(msg); - } - size_t batch_size = 1; - auto output_tensor = -@@ -413,14 +410,14 @@ void BasicBackend::CompleteAsyncInference(Ort::KernelContext& context, OVInferRe - auto output_tensor = GetOutputTensor(context, out_name, subgraph_context_.output_names, node); - auto mem_info = output_tensor.GetTensorMemoryInfo(); - if (mem_info.GetAllocatorName() == OpenVINO_GPU) { -- throw(log_tag + "IO Buffering is not supported for constant subgraphs"); -+ ORT_THROW(log_tag + "IO Buffering is not supported for constant subgraphs"); - } else { - FillOutputsWithConstantData(node, output_tensor); - } - } - } - } catch (const char* msg) { -- throw(msg); -+ ORT_THROW(msg); - } - } - -@@ -440,7 +437,7 @@ void BasicBackend::Infer(OrtKernelContext* ctx) { - auto output_tensor = GetOutputTensor(context, out_name, subgraph_context_.output_names, node); - FillOutputsWithConstantData(node, output_tensor); - } catch (std::string const& msg) { -- throw msg; -+ ORT_THROW(msg); - } - } - // Get Output tensors -@@ -461,26 +458,26 @@ void BasicBackend::Infer(OrtKernelContext* ctx) { - try { - StartRemoteAsyncInference(context, infer_request); - } catch (std::string const& msg) { -- throw msg; -+ ORT_THROW(msg); - } - } else { - try { - StartAsyncInference(context, infer_request); - } catch (std::string const& msg) { -- throw msg; -+ ORT_THROW(msg); - } - } - #else - try { - StartAsyncInference(context, infer_request); -- } catch (std::string const& msg) { -- throw msg; -+ } catch (const std::runtime_error& e) { -+ ORT_THROW(log_tag + " Exception at StartAsyncInference: " + e.what()); - } - #endif - try { - CompleteAsyncInference(context, infer_request); -- } catch (std::string const& msg) { -- throw msg; -+ } catch (const std::runtime_error& e) { -+ ORT_THROW(log_tag + " Exception at CompleteAsyncInference: " + e.what()); - } - - // Get Output tensors -diff --git a/onnxruntime/core/providers/openvino/backends/basic_backend.h b/onnxruntime/core/providers/openvino/backends/basic_backend.h -index aa96dadbf0e2d49563e52045029185a93fd6a976..3502f660bbb2094a7604f2c70cc52e44b649ead0 100644 ---- a/onnxruntime/core/providers/openvino/backends/basic_backend.h -+++ b/onnxruntime/core/providers/openvino/backends/basic_backend.h -@@ -1,4 +1,4 @@ --// Copyright (C) 2019-2022 Intel Corporation -+// Copyright (C) Intel Corporation - // Licensed under the MIT License - - #pragma once -diff --git a/onnxruntime/core/providers/openvino/contexts.h b/onnxruntime/core/providers/openvino/contexts.h -index 5f19c71683f24a9d897dc310a6756dd98704454e..8701d9f676ffdc6ae15d0897e966b2a894f3d6fb 100644 ---- a/onnxruntime/core/providers/openvino/contexts.h -+++ b/onnxruntime/core/providers/openvino/contexts.h -@@ -1,4 +1,4 @@ --// Copyright (C) 2019-2022 Intel Corporation -+// Copyright (C) Intel Corporation - // Licensed under the MIT License - - #pragma once -@@ -31,6 +31,7 @@ struct GlobalContext { - int onnx_opset_version; - void* context = 0; - bool use_api_2; -+ std::vector OpenVINO_Version = {}; // Ov Major and OV minor version from OV headers - }; - - // Holds context specific to subgraph. -@@ -44,7 +45,6 @@ struct SubGraphContext { - std::vector input_indexes; - std::unordered_map input_names; - std::unordered_map output_names; -- std::string precision; - }; - - } // namespace openvino_ep -diff --git a/onnxruntime/core/providers/openvino/ibackend.h b/onnxruntime/core/providers/openvino/ibackend.h -index 8aacce19c14d5909a2a8fac80903f06d5c9e6419..ece855c6167c6c1c1b7c6f9541e854d16b598bbf 100644 ---- a/onnxruntime/core/providers/openvino/ibackend.h -+++ b/onnxruntime/core/providers/openvino/ibackend.h -@@ -1,4 +1,4 @@ --// Copyright (C) 2019-2022 Intel Corporation -+// Copyright (C) Intel Corporation - // Licensed under the MIT License - - #pragma once -diff --git a/onnxruntime/core/providers/openvino/openvino_execution_provider.cc b/onnxruntime/core/providers/openvino/openvino_execution_provider.cc -index e3948cc94b348db80e60ad2bd14569f067ee5a38..913440d2fb6ea72a7ffd170f8eff0d38a20e38cf 100644 ---- a/onnxruntime/core/providers/openvino/openvino_execution_provider.cc -+++ b/onnxruntime/core/providers/openvino/openvino_execution_provider.cc -@@ -1,4 +1,4 @@ --// Copyright (C) 2019-2022 Intel Corporation -+// Copyright (C) Intel Corporation - // Licensed under the MIT License - - #include "core/providers/shared_library/provider_api.h" -@@ -6,6 +6,7 @@ - #include "contexts.h" - #include "backend_manager.h" - #include "ov_versions/capability.h" -+#include "openvino/core/version.hpp" - - #define MEMCPY_S(dest, src, destsz, srcsz) memcpy(dest, src, std::min(destsz, srcsz)) - -@@ -25,6 +26,7 @@ OpenVINOExecutionProvider::OpenVINOExecutionProvider(const OpenVINOExecutionProv - global_context_->enable_opencl_throttling = info.enable_opencl_throttling_; - global_context_->disable_dynamic_shapes = info.disable_dynamic_shapes_; - global_context_->num_of_threads = info.num_of_threads_; -+ global_context_->OpenVINO_Version = {OPENVINO_VERSION_MAJOR, OPENVINO_VERSION_MINOR}; - - // to check if target device is available - // using ie_core capability GetAvailableDevices to fetch list of devices plugged in -@@ -50,8 +52,7 @@ OpenVINOExecutionProvider::OpenVINOExecutionProvider(const OpenVINOExecutionProv - device_found = true; - break; - } -- if ((info.device_type_.find("NPU") != std::string::npos) && -- (info.precision_ == "FP16" || info.precision_ == "U8")) { -+ if (info.device_type_.find("NPU") != std::string::npos) { - device_found = true; - break; - } -@@ -113,27 +114,10 @@ OpenVINOExecutionProvider::GetCapability(const GraphViewer& graph_viewer, - global_context_->onnx_opset_version = - graph_viewer.DomainToVersionMap().at(kOnnxDomain); - --#if defined(OPENVINO_2023_0) - openvino_ep::GetCapability obj(graph_viewer, - global_context_->device_type, -- global_context_->precision_str, "V_2023_0"); -+ global_context_->precision_str); - result = obj.Execute(); --#elif defined(OPENVINO_2023_1) -- openvino_ep::GetCapability obj(graph_viewer, -- global_context_->device_type, -- global_context_->precision_str, "V_2023_1"); -- result = obj.Execute(); --#elif defined(OPENVINO_2023_2) -- openvino_ep::GetCapability obj(graph_viewer, -- global_context_->device_type, -- global_context_->precision_str, "V_2023_2"); -- result = obj.Execute(); --#elif defined(OPENVINO_2023_3) -- openvino_ep::GetCapability obj(graph_viewer, -- global_context_->device_type, -- global_context_->precision_str, "V_2023_3"); -- result = obj.Execute(); --#endif - - global_context_->is_wholly_supported_graph = obj.IsWhollySupportedGraph(); - -diff --git a/onnxruntime/core/providers/openvino/openvino_execution_provider.h b/onnxruntime/core/providers/openvino/openvino_execution_provider.h -index b0c92828d8a38d9ee4303ffb64ae3dd3e93e967f..b0dc881c36f3320682556854bf56c6c6f53a37bb 100644 ---- a/onnxruntime/core/providers/openvino/openvino_execution_provider.h -+++ b/onnxruntime/core/providers/openvino/openvino_execution_provider.h -@@ -1,4 +1,4 @@ --// Copyright (C) 2019-2022 Intel Corporation -+// Copyright (C) Intel Corporation - // Licensed under the MIT License - - #pragma once -@@ -20,7 +20,7 @@ static void print_build_options() { - << "you want to build" - << std::endl; - std::cout << "The different hardware devices that can be added with HETERO/MULTI/AUTO build " -- << "are ['CPU','GPU']" -+ << "are ['CPU','GPU','NPU']" - << std::endl; - std::cout << "An example of how to specify the HETERO or MULTI or AUTO build type. " - << "Ex: HETERO:GPU,CPU Ex: MULTI:GPU,CPU Ex: AUTO:GPU,CPU" -@@ -48,7 +48,7 @@ static std::vector parseDevices(const std::string& device_string) { - print_build_options(); - ORT_THROW("Invalid device string: " + device_string); - } -- std::vector dev_options = {"CPU", "GPU"}; -+ std::vector dev_options = {"CPU", "GPU", "NPU"}; - for (std::string dev : devices) { - if (!std::count(dev_options.begin(), dev_options.end(), dev)) { - print_build_options(); -@@ -98,12 +98,9 @@ struct OpenVINOExecutionProviderInfo { - #elif defined OPENVINO_CONFIG_GPU_FP16 - device_type_ = "GPU"; - precision_ = "FP16"; --#elif defined OPENVINO_CONFIG_NPU_FP16 -+#elif defined OPENVINO_CONFIG_NPU - device_type_ = "NPU"; -- precision_ = "FP16"; --#elif defined OPENVINO_CONFIG_NPU_U8 -- device_type_ = "NPU"; -- precision_ = "U8"; -+ precision_ = ""; - #elif defined OPENVINO_CONFIG_HETERO || defined OPENVINO_CONFIG_MULTI || defined OPENVINO_CONFIG_AUTO - #ifdef DEVICE_NAME - #define DEVICE DEVICE_NAME -@@ -142,12 +139,9 @@ struct OpenVINOExecutionProviderInfo { - } else if (dev_type == "GPU.1_FP16") { - device_type_ = "GPU.1"; - precision_ = "FP16"; -- } else if (dev_type == "NPU_FP16") { -- device_type_ = "NPU"; -- precision_ = "FP16"; -- } else if (dev_type == "NPU_U8") { -+ } else if (dev_type == "NPU") { - device_type_ = "NPU"; -- precision_ = "U8"; -+ precision_ = ""; - } else if (dev_type.find("HETERO") == 0 || dev_type.find("MULTI") == 0) { - std::vector devices = parseDevices(dev_type); - precision_ = "FP16"; -diff --git a/onnxruntime/core/providers/openvino/openvino_provider_factory.cc b/onnxruntime/core/providers/openvino/openvino_provider_factory.cc -index 068456777beceb900511f66fdae92fd5828b477f..17511c54aab860140eec58c5b03144be5ddb089e 100644 ---- a/onnxruntime/core/providers/openvino/openvino_provider_factory.cc -+++ b/onnxruntime/core/providers/openvino/openvino_provider_factory.cc -@@ -1,4 +1,4 @@ --// Copyright (C) 2019-2022 Intel Corporation -+// Copyright (C) Intel Corporation - // Licensed under the MIT License - - #include "core/providers/shared_library/provider_api.h" -@@ -78,7 +78,6 @@ struct OpenVINO_Provider : Provider { - // with this value at runtime. - bool enable_opencl_throttling = false; // [enable_opencl_throttling]: Enables OpenCL queue throttling for GPU - // device (Reduces CPU Utilization when using GPU) -- bool disable_dynamic_shapes = false; // [disable_dynamic_shapes]: Execute model with default static shape for optimal performance. - void* context = nullptr; - - if (provider_options_map.find("device_type") != provider_options_map.end()) { -@@ -86,7 +85,7 @@ struct OpenVINO_Provider : Provider { - - std::set ov_supported_device_types = {"CPU_FP32", "CPU_FP16", "GPU_FP32", - "GPU.0_FP32", "GPU.1_FP32", "GPU_FP16", -- "GPU.0_FP16", "GPU.1_FP16"}; -+ "GPU.0_FP16", "GPU.1_FP16", "NPU"}; - if (!((ov_supported_device_types.find(device_type) != ov_supported_device_types.end()) || - (device_type.find("HETERO:") == 0) || - (device_type.find("MULTI:") == 0) || -@@ -94,7 +93,7 @@ struct OpenVINO_Provider : Provider { - ORT_THROW( - "[ERROR] [OpenVINO] You have selcted wrong configuration value for the key 'device_type'. " - "Select from 'CPU_FP32', 'CPU_FP16', 'GPU_FP32', 'GPU.0_FP32', 'GPU.1_FP32', 'GPU_FP16', " -- "'GPU.0_FP16', 'GPU.1_FP16' or from" -+ "'GPU.0_FP16', 'GPU.1_FP16', 'NPU' or from" - " HETERO/MULTI/AUTO options available. \n"); - } - } -@@ -147,12 +146,24 @@ struct OpenVINO_Provider : Provider { - bool_flag = ""; - } - -+ // [disable_dynamic_shapes]: Rewrite dynamic shaped models to static shape at runtime and execute. -+ // Always true for NPU plugin. -+ bool disable_dynamic_shapes = false; -+ if (device_type.find("NPU") != std::string::npos) { -+ disable_dynamic_shapes = true; -+ } - if (provider_options_map.find("disable_dynamic_shapes") != provider_options_map.end()) { - bool_flag = provider_options_map.at("disable_dynamic_shapes"); - if (bool_flag == "true" || bool_flag == "True") - disable_dynamic_shapes = true; -- else if (bool_flag == "false" || bool_flag == "False") -- disable_dynamic_shapes = false; -+ else if (bool_flag == "false" || bool_flag == "False") { -+ if (device_type.find("NPU") != std::string::npos) { -+ disable_dynamic_shapes = true; -+ LOGS_DEFAULT(INFO) << "[OpenVINO-EP] The value for the key 'disable_dynamic_shapes' will be set to TRUE for NPU backend.\n "; -+ } else { -+ disable_dynamic_shapes = false; -+ } -+ } - } - return std::make_shared(const_cast(device_type.c_str()), - enable_npu_fast_compile, -diff --git a/onnxruntime/core/providers/openvino/ov_interface.cc b/onnxruntime/core/providers/openvino/ov_interface.cc -index ea481791111fc42d866b72608d2332cdc1ff2a2c..d7c6654c90f812117b6b75671ebacb9d3697fdee 100644 ---- a/onnxruntime/core/providers/openvino/ov_interface.cc -+++ b/onnxruntime/core/providers/openvino/ov_interface.cc -@@ -1,4 +1,4 @@ --// Copyright (C) 2019-2022 Intel Corporation -+// Copyright (C) Intel Corporation - // Licensed under the MIT License - - #include "ov_interface.h" -@@ -8,12 +8,7 @@ - #include "core/providers/shared_library/provider_api.h" - #include "backend_utils.h" - --#if defined(OV_API_20) - using Exception = ov::Exception; --#else --using Exception = InferenceEngine::details::InferenceEngineException; --using WaitMode = InferenceEngine::IInferRequest::WaitMode; --#endif - - namespace onnxruntime { - namespace openvino_ep { -@@ -36,9 +31,9 @@ std::shared_ptr OVCore::ReadModel(const std::string& model, const std - } - return FE->convert(inputModel); - } catch (const Exception& e) { -- throw std::string(log_tag + "[OpenVINO-EP] Exception while Reading network: " + std::string(e.what())); -+ ORT_THROW(log_tag + "[OpenVINO-EP] Exception while Reading network: " + std::string(e.what())); - } catch (...) { -- throw std::string(log_tag + "[OpenVINO-EP] Unknown exception while Reading network"); -+ ORT_THROW(log_tag + "[OpenVINO-EP] Unknown exception while Reading network"); - } - } - -@@ -81,9 +76,9 @@ OVExeNetwork OVCore::LoadNetwork(std::shared_ptr& ie_cnn_network, - OVExeNetwork exe(obj); - return exe; - } catch (const Exception& e) { -- throw std::string(log_tag + " Exception while Loading Network for graph: " + name + e.what()); -+ ORT_THROW(log_tag + " Exception while Loading Network for graph: " + name + e.what()); - } catch (...) { -- throw std::string(log_tag + " Exception while Loading Network for graph " + name); -+ ORT_THROW(log_tag + " Exception while Loading Network for graph " + name); - } - } - -@@ -113,9 +108,9 @@ OVExeNetwork OVCore::LoadNetwork(std::shared_ptr& model, OVRemoteCont - auto obj = oe.compile_model(model, *context); - return OVExeNetwork(obj); - } catch (const Exception& e) { -- throw std::string(log_tag + " Exception while Loading Network for graph: " + name + e.what()); -+ ORT_THROW(log_tag + " Exception while Loading Network for graph: " + name + e.what()); - } catch (...) { -- throw std::string(log_tag + " Exception while Loading Network for graph " + name); -+ ORT_THROW(log_tag + " Exception while Loading Network for graph " + name); - } - } - #endif -@@ -135,9 +130,9 @@ OVInferRequest OVExeNetwork::CreateInferRequest() { - OVInferRequest inf_obj(infReq); - return inf_obj; - } catch (const Exception& e) { -- throw std::string(log_tag + "Exception while creating InferRequest object: " + e.what()); -+ ORT_THROW(log_tag + "Exception while creating InferRequest object: " + e.what()); - } catch (...) { -- throw std::string(log_tag + "Exception while creating InferRequest object."); -+ ORT_THROW(log_tag + "Exception while creating InferRequest object."); - } - } - -@@ -147,9 +142,9 @@ OVTensorPtr OVInferRequest::GetTensor(const std::string& input_name) { - OVTensorPtr blob = std::make_shared(tobj); - return blob; - } catch (const Exception& e) { -- throw std::string(log_tag + " Cannot access IE Blob for input: " + input_name + e.what()); -+ ORT_THROW(log_tag + " Cannot access IE Blob for input: " + input_name + e.what()); - } catch (...) { -- throw std::string(log_tag + " Cannot access IE Blob for input: " + input_name); -+ ORT_THROW(log_tag + " Cannot access IE Blob for input: " + input_name); - } - } - -@@ -157,9 +152,9 @@ void OVInferRequest::SetTensor(const std::string& name, OVTensorPtr& blob) { - try { - ovInfReq.set_tensor(name, *(blob.get())); - } catch (const Exception& e) { -- throw std::string(log_tag + " Cannot set Remote Blob for output: " + name + e.what()); -+ ORT_THROW(log_tag + " Cannot set Remote Blob for output: " + name + e.what()); - } catch (...) { -- throw std::string(log_tag + " Cannot set Remote Blob for output: " + name); -+ ORT_THROW(log_tag + " Cannot set Remote Blob for output: " + name); - } - } - -@@ -167,9 +162,9 @@ void OVInferRequest::StartAsync() { - try { - ovInfReq.start_async(); - } catch (const Exception& e) { -- throw std::string(log_tag + " Couldn't start Inference: " + e.what()); -+ ORT_THROW(log_tag + " Couldn't start Inference: " + e.what()); - } catch (...) { -- throw std::string(log_tag + " In Error Couldn't start Inference"); -+ ORT_THROW(log_tag + " In Error Couldn't start Inference"); - } - } - -@@ -177,9 +172,9 @@ void OVInferRequest::Infer() { - try { - ovInfReq.infer(); - } catch (const Exception& e) { -- throw std::string(log_tag + " Couldn't start Inference: " + e.what()); -+ ORT_THROW(log_tag + " Couldn't start Inference: " + e.what()); - } catch (...) { -- throw std::string(log_tag + " In Error Couldn't start Inference"); -+ ORT_THROW(log_tag + " In Error Couldn't start Inference"); - } - } - -@@ -187,9 +182,9 @@ void OVInferRequest::WaitRequest() { - try { - ovInfReq.wait(); - } catch (const Exception& e) { -- throw std::string(log_tag + " Wait Model Failed: " + e.what()); -+ ORT_THROW(log_tag + " Wait Model Failed: " + e.what()); - } catch (...) { -- throw std::string(log_tag + " Wait Mode Failed"); -+ ORT_THROW(log_tag + " Wait Mode Failed"); - } - } - -diff --git a/onnxruntime/core/providers/openvino/ov_interface.h b/onnxruntime/core/providers/openvino/ov_interface.h -index cf4d867d4df5520919fd315ce7ddd5c893c786da..2a13fafb99fd303f64d02e60657747b07dd4836e 100644 ---- a/onnxruntime/core/providers/openvino/ov_interface.h -+++ b/onnxruntime/core/providers/openvino/ov_interface.h -@@ -1,4 +1,4 @@ --// Copyright (C) 2019-2022 Intel Corporation -+// Copyright (C) Intel Corporation - // Licensed under the MIT License - - #pragma once -@@ -6,14 +6,11 @@ - #include - #include - --#define OV_API_20 - #include "openvino/openvino.hpp" - #include "openvino/pass/convert_fp32_to_fp16.hpp" - #include "openvino/frontend/manager.hpp" - - #ifdef IO_BUFFER_ENABLED --#include --#include - #include - #endif - -diff --git a/onnxruntime/core/providers/openvino/ov_versions/capability.cc b/onnxruntime/core/providers/openvino/ov_versions/capability.cc -index 11c8a1629b073c34f3857abf5bc258bb534ac4fe..3970bf6ff68a7bfd4427c8502693d754f1daa972 100644 ---- a/onnxruntime/core/providers/openvino/ov_versions/capability.cc -+++ b/onnxruntime/core/providers/openvino/ov_versions/capability.cc -@@ -1,4 +1,4 @@ --// Copyright (C) 2019-2022 Intel Corporation -+// Copyright (C) 2019- Intel Corporation - // Licensed under the MIT License - - #include "core/providers/shared_library/provider_api.h" -@@ -6,6 +6,7 @@ - #include "../backend_manager.h" - #include "capability.h" - #include "utils.h" -+#include "openvino/core/version.hpp" - - #if defined(_MSC_VER) - #pragma warning(disable : 4244 4245 5208) -@@ -25,20 +26,22 @@ namespace openvino_ep { - // Constructor - GetCapability::GetCapability(const GraphViewer& graph_viewer_param, - const std::string device_type_param, -- const std::string device_precision, -- const std::string version_param) -+ const std::string device_precision) - : graph_viewer_(graph_viewer_param), device_type_(device_type_param), device_precision_(device_precision) { -- if (version_param == "V_2023_0") { -- data_ops_ = new DataOps(graph_viewer_, V_2023_0, device_type_, device_precision_); -- } else if (version_param == "V_2023_1") { -- data_ops_ = new DataOps(graph_viewer_, V_2023_1, device_type_, device_precision_); -- } else if (version_param == "V_2023_2") { -- data_ops_ = new DataOps(graph_viewer_, V_2023_2, device_type_, device_precision_); -- } else if (version_param == "V_2023_3") { -- data_ops_ = new DataOps(graph_viewer_, V_2023_3, device_type_, device_precision_); -- } else { -- data_ops_ = new DataOps(graph_viewer_, V_2023_3, device_type_, device_precision_); -+ if (device_type_.find("NPU") != std::string::npos) { -+ device_type_ = "CPU_FP32"; - } -+#if OPENVINO_VERSION_MAJOR == 2023 && OPENVINO_VERSION_MINOR == 1 -+ data_ops_ = new DataOps(graph_viewer_, V_2023_1, device_type_, device_precision_); -+#elif OPENVINO_VERSION_MAJOR == 2023 && OPENVINO_VERSION_MINOR == 2 -+ data_ops_ = new DataOps(graph_viewer_, V_2023_2, device_type_, device_precision_); -+#elif OPENVINO_VERSION_MAJOR == 2023 && OPENVINO_VERSION_MINOR == 3 -+ data_ops_ = new DataOps(graph_viewer_, V_2023_3, device_type_, device_precision_); -+#elif OPENVINO_VERSION_MAJOR == 2024 && OPENVINO_VERSION_MINOR == 0 -+ data_ops_ = new DataOps(graph_viewer_, V_2024_0, device_type_, device_precision_); -+#else -+ data_ops_ = new DataOps(graph_viewer_, V_2024_0, device_type_, device_precision_); -+#endif - } - - std::vector> GetCapability::Execute() { -diff --git a/onnxruntime/core/providers/openvino/ov_versions/capability.h b/onnxruntime/core/providers/openvino/ov_versions/capability.h -index 2040634cc45d9712682efd6cbabbc646c796c796..d9fe5a95ef8333c137212f75976c4737101d978e 100644 ---- a/onnxruntime/core/providers/openvino/ov_versions/capability.h -+++ b/onnxruntime/core/providers/openvino/ov_versions/capability.h -@@ -1,4 +1,4 @@ --// Copyright (C) 2019-2022 Intel Corporation -+// Copyright (C) Intel Corporation - // Licensed under the MIT License - - #pragma once -@@ -21,8 +21,7 @@ class GetCapability { - public: - GetCapability(const GraphViewer& graph_viewer_param, - const std::string device_type_param, -- const std::string precision, -- const std::string version_param); -+ const std::string precision); - virtual std::vector> Execute(); - bool IsWhollySupportedGraph() { - return is_wholly_supported_graph_; -diff --git a/onnxruntime/core/providers/openvino/ov_versions/data_ops.cc b/onnxruntime/core/providers/openvino/ov_versions/data_ops.cc -index e829bf377b1954a99783beb36d29dddac88c6fd7..c7c3e93595719b003fffca854ba0d0af1826021f 100644 ---- a/onnxruntime/core/providers/openvino/ov_versions/data_ops.cc -+++ b/onnxruntime/core/providers/openvino/ov_versions/data_ops.cc -@@ -1,4 +1,4 @@ --// Copyright (C) 2019-2022 Intel Corporation -+// Copyright (C) Intel Corporation - // Licensed under the MIT License - - #include -@@ -14,6 +14,7 @@ - #include "data_ops.h" - #include "capability.h" - #include "utils.h" -+#include "../ov_interface.h" - - #if defined(_MSC_VER) - #pragma warning(disable : 4244 4245 5208) -@@ -36,6 +37,7 @@ namespace openvino_ep { - std::set ops_supported_only_in_model = { - "Add", - "Cast", -+ "Celu", - "Concat", - "ConstantOfShape", - "DequantizeLinear", -@@ -46,6 +48,7 @@ std::set ops_supported_only_in_model = { - "EyeLike", - "GatherElements", - "GatherND", -+ "GridSample", - "Identity", - "LayerNormalization", - "Loop", -@@ -72,293 +75,171 @@ std::set ops_supported_only_in_model = { - std::set ops_supported_as_function = { - "LessOrEqual", - "GreaterOrEqual", -- "LayerNormalization"}; -+ "LayerNormalization", -+ "Celu"}; - - std::vector supported_op_mode = { - {"Abs", V_2020_4, {"CPU", "GPU"}}, -- {"Abs", V_2023_0, {"NPU"}}, - {"Acos", V_2020_4, {"CPU"}}, - {"Acos", V_2022_1, {"GPU"}}, -- {"Acos", V_2023_1, {"NPU"}}, - {"Acosh", V_2020_4, {"CPU"}}, - {"Acosh", V_2022_1, {"GPU"}}, -- {"Acosh", V_2023_1, {"NPU"}}, - {"Add", V_2020_4, {"CPU", "GPU"}}, -- {"Add", V_2023_0, {"NPU"}}, - {"And", V_2020_4, {"CPU", "GPU"}}, -- {"And", V_2023_1, {"NPU"}}, - {"ArgMax", V_2020_4, {"CPU"}}, - {"ArgMax", V_2021_1, {"GPU"}}, - {"ArgMin", V_2020_4, {"CPU"}}, - {"ArgMin", V_2022_1, {"GPU"}}, - {"Asin", V_2020_4, {"CPU", "GPU"}}, -- {"Asin", V_2023_1, {"NPU"}}, - {"Asinh", V_2020_4, {"CPU", "GPU"}}, -- {"Asinh", V_2023_1, {"NPU"}}, - {"Atan", V_2020_4, {"CPU", "GPU"}}, -- {"Atan", V_2023_1, {"NPU"}}, - {"Atanh", V_2020_4, {"CPU"}}, - {"Atanh", V_2022_1, {"GPU"}}, -- {"Atanh", V_2023_1, {"NPU"}}, - {"AveragePool", V_2020_4, {"CPU", "GPU"}}, -- {"AveragePool", V_2023_0, {"NPU"}}, - {"BatchNormalization", V_2020_4, {"CPU", "GPU"}}, -- {"BatchNormalization", V_2023_0, {"NPU"}}, - {"BitShift", V_2022_1, {"CPU"}}, -- {"BitShift", V_2023_1, {"NPU"}}, - {"Cast", V_2020_4, {"CPU", "GPU"}}, -- {"Cast", V_2023_0, {"NPU"}}, -- {"CastLike", V_2023_1, {"CPU", "GPU", "NPU"}}, -+ {"CastLike", V_2023_1, {"CPU", "GPU"}}, - {"Ceil", V_2020_4, {"GPU"}}, - {"Ceil", V_2021_4, {"CPU"}}, -- {"Ceil", V_2023_1, {"NPU"}}, - {"Celu", V_2022_1, {"CPU", "GPU"}}, - {"Clip", V_2020_4, {"CPU", "GPU"}}, -- {"Clip", V_2023_0, {"NPU"}}, - {"Compress", V_2023_1, {"CPU", "GPU"}}, - {"Concat", V_2020_4, {"CPU", "GPU"}}, -- {"Concat", V_2023_0, {"NPU"}}, - {"Constant", V_2020_4, {"CPU", "GPU"}}, -- {"Constant", V_2023_0, {"NPU"}}, - {"ConstantOfShape", V_2020_4, {"CPU", "GPU"}}, -- {"ConstantOfShape", V_2023_0, {"NPU"}}, // Gets mapped to broadcast op in the plugin. - {"Conv", V_2020_4, {"CPU", "GPU"}}, -- {"Conv", V_2023_0, {"NPU"}}, - {"ConvInteger", V_2022_1, {"CPU", "GPU"}}, -- {"ConvInteger", V_2023_1, {"NPU"}}, - {"ConvTranspose", V_2020_4, {"CPU", "GPU"}}, -- {"ConvTranspose", V_2023_1, {"NPU"}}, - {"Cos", V_2020_4, {"CPU"}}, - {"Cos", V_2022_1, {"GPU"}}, -- {"Cos", V_2023_0, {"NPU"}}, - {"Cosh", V_2020_4, {"CPU"}}, - {"Cosh", V_2022_1, {"GPU"}}, -- {"Cosh", V_2023_1, {"NPU"}}, - {"CumSum", V_2022_1, {"CPU", "GPU"}}, -- {"CumSum", V_2023_0, {"NPU"}}, - {"DepthToSpace", V_2020_4, {"CPU", "GPU"}}, -- {"DepthToSpace", V_2023_0, {"NPU"}}, - {"DequantizeLinear", V_2021_4, {"CPU", "GPU"}}, -- {"DequantizeLinear", V_2023_0, {"NPU"}}, - {"Div", V_2020_4, {"CPU", "GPU"}}, -- {"Div", V_2023_0, {"NPU"}}, - {"Dropout", V_2020_4, {"CPU", "GPU"}}, -- {"Dropout", V_2023_0, {"NPU"}}, - {"Elu", V_2020_4, {"CPU", "GPU"}}, -- {"Elu", V_2023_0, {"NPU"}}, - {"Einsum", V_2023_1, {"CPU", "GPU"}}, - {"Equal", V_2020_4, {"CPU", "GPU"}}, -- {"Equal", V_2023_0, {"NPU"}}, // Added for whisper decoder model. - {"Erf", V_2020_4, {"CPU", "GPU"}}, -- {"Erf", V_2023_0, {"NPU"}}, - {"Exp", V_2020_4, {"CPU", "GPU"}}, -- {"Exp", V_2023_0, {"NPU"}}, - {"Expand", V_2022_1, {"CPU", "GPU"}}, -- {"Expand", V_2023_0, {"NPU"}}, // Gets mapped to broadcast op and multiply op in the plugin. - {"EyeLike", V_2022_1, {"CPU"}}, -- {"EyeLike", V_2023_0, {"NPU"}}, // NoOP - {"Flatten", V_2020_4, {"CPU", "GPU"}}, -- {"Flatten", V_2023_0, {"NPU"}}, - {"Floor", V_2020_4, {"CPU", "GPU"}}, -- {"Floor", V_2023_1, {"NPU"}}, - {"Gather", V_2020_4, {"CPU", "GPU"}}, -- {"Gather", V_2023_0, {"NPU"}}, - {"GatherElements", V_2022_2, {"CPU", "GPU"}}, -- {"GatherElements", V_2023_1, {"NPU"}}, - {"GatherND", V_2021_4, {"CPU", "GPU"}}, -- {"GatherND", V_2023_1, {"NPU"}}, -+ {"Gelu", V_2023_1, {"CPU", "GPU"}}, - {"Gemm", V_2020_4, {"CPU", "GPU"}}, -- {"Gemm", V_2023_0, {"NPU"}}, - {"GlobalAveragePool", V_2020_4, {"CPU", "GPU"}}, -- {"GlobalAveragePool", V_2023_0, {"NPU"}}, - {"GlobalLpPool", V_2020_4, {"CPU", "GPU"}}, -- {"GlobalLpPool", V_2023_1, {"NPU"}}, - {"GlobalMaxPool", V_2022_1, {"CPU", "GPU"}}, -- {"GlobalMaxPool", V_2023_1, {"NPU"}}, - {"Greater", V_2020_4, {"CPU", "GPU"}}, -- {"Greater", V_2023_0, {"NPU"}}, - {"GreaterOrEqual", V_2022_1, {"CPU", "GPU"}}, -- {"GreaterOrEqual", V_2023_0, {"NPU"}}, - {"GridSample", V_2022_3, {"CPU"}}, - {"GridSample", V_2023_0, {"GPU"}}, -- {"GridSample", V_2023_1, {"NPU"}}, -- {"HardMax", V_2023_1, {"CPU", "GPU", "NPU"}}, -+ {"HardMax", V_2023_1, {"CPU", "GPU"}}, - {"Identity", V_2020_4, {"CPU", "GPU"}}, -- {"Identity", V_2023_0, {"NPU"}}, // NoOP - {"If", V_2022_3, {"CPU", "GPU"}}, -- {"If", V_2023_1, {"NPU"}}, - {"ImageScaler", V_2022_1, {"CPU", "GPU"}}, -- {"ImageScaler", V_2023_0, {"NPU"}}, - {"InstanceNormalization", V_2020_4, {"CPU", "GPU"}}, -- {"InstanceNormalization", V_2023_0, {"NPU"}}, - {"HardSigmoid", V_2020_4, {"CPU", "GPU"}}, -- {"HardSigmoid", V_2023_1, {"NPU"}}, - {"HardMax", V_2022_1, {"CPU", "GPU"}}, -+ {"LayerNormalization", V_2023_0, {"CPU", "GPU"}}, - {"LeakyRelu", V_2020_4, {"CPU", "GPU"}}, -- {"LeakyRelu", V_2023_0, {"NPU"}}, - {"Less", V_2020_4, {"CPU", "GPU"}}, -- {"Less", V_2023_0, {"NPU"}}, // Added for whisper decoder model. - {"LessOrEqual", V_2022_1, {"CPU", "GPU"}}, -- {"LessOrEqual", V_2023_0, {"NPU"}}, - {"Log", V_2020_4, {"CPU", "GPU"}}, -- {"Log", V_2023_0, {"NPU"}}, - {"LogSoftMax", V_2022_1, {"CPU", "GPU"}}, - {"Loop", V_2021_4, {"CPU", "GPU"}}, -- {"LpNormalization", V_2023_1, {"CPU", "GPU", "NPU"}}, -- {"LpPool", V_2023_1, {"CPU", "GPU", "NPU"}}, -+ {"LpNormalization", V_2023_1, {"CPU", "GPU"}}, - {"LRN", V_2020_4, {"CPU", "GPU"}}, -- {"LRN", V_2023_0, {"NPU"}}, - {"LSTM", V_2020_4, {"CPU", "GPU"}}, -- {"LSTM", V_2023_1, {"NPU"}}, - {"MatMul", V_2020_4, {"CPU", "GPU"}}, -- {"MatMul", V_2023_0, {"NPU"}}, - {"MatMulInteger", V_2022_1, {"CPU"}}, -- {"MatMulInteger", V_2023_1, {"NPU"}}, - {"Max", V_2020_4, {"CPU", "GPU"}}, -- {"Max", V_2023_0, {"NPU"}}, - {"MaxPool", V_2020_4, {"CPU", "GPU"}}, -- {"MaxPool", V_2023_0, {"NPU"}}, - {"Mean", V_2020_4, {"CPU", "GPU"}}, -- {"Mean", V_2023_0, {"NPU"}}, - {"MeanVarianceNormalization", V_2022_1, {"CPU", "GPU"}}, -- {"MeanVarianceNormalization", V_2023_1, {"NPU"}}, - {"Min", V_2020_4, {"CPU", "GPU"}}, -- {"Min", V_2023_0, {"NPU"}}, - {"Mod", V_2022_1, {"CPU", "GPU"}}, - {"Mul", V_2020_4, {"CPU", "GPU"}}, -- {"Mul", V_2023_0, {"NPU"}}, - {"Neg", V_2020_4, {"CPU", "GPU"}}, -- {"Neg", V_2023_0, {"NPU"}}, - {"NonMaxSuppression", V_2021_1, {"CPU", "GPU"}}, -- {"NonMaxSuppression", V_2023_1, {"NPU"}}, - {"NonZero", V_2021_1, {"CPU"}}, - {"NonZero", V_2023_0, {"GPU"}}, - {"Not", V_2021_1, {"CPU", "GPU"}}, - {"Not", V_2020_4, {"CPU", "GPU"}}, -- {"Not", V_2023_1, {"NPU"}}, - {"OneHot", V_2020_4, {"CPU", "GPU"}}, -- {"OneHot", V_2023_1, {"NPU"}}, - {"Or", V_2022_1, {"CPU", "GPU"}}, -- {"Or", V_2023_1, {"NPU"}}, - {"Pad", V_2020_4, {"CPU", "GPU"}}, -- {"Pad", V_2023_0, {"NPU"}}, - {"Pow", V_2020_4, {"CPU", "GPU"}}, -- {"Pow", V_2023_0, {"NPU"}}, - {"PRelu", V_2020_4, {"CPU", "GPU"}}, -- {"PRelu", V_2023_0, {"NPU"}}, - {"QLinearMatMul", V_2022_3, {"CPU"}}, -- // {"QLinearMatMul", V_2023_1, {"NPU"}}, - {"QuantizeLinear", V_2021_4, {"CPU", "GPU"}}, -- {"QuantizeLinear", V_2023_0, {"NPU"}}, - {"RNN", V_2023_1, {"CPU", "GPU"}}, - {"RandomNormalLike", V_2023_0, {"CPU", "GPU"}}, - {"RandomNormalLike", V_2023_0, {"CPU", "GPU"}}, -- {"RandomNormalLike", V_2023_1, {"NPU"}}, - {"RandomNormal", V_2023_0, {"CPU", "GPU"}}, -- {"RandomNormal", V_2023_1, {"NPU"}}, - {"Range", V_2022_1, {"CPU", "GPU"}}, -- {"Range", V_2023_0, {"NPU"}}, - {"Reciprocal", V_2020_4, {"CPU", "GPU"}}, -- {"Reciprocal", V_2023_0, {"NPU"}}, - {"ReduceL1", V_2022_1, {"CPU", "GPU"}}, -- {"ReduceL1", V_2023_1, {"NPU"}}, - {"ReduceL2", V_2022_1, {"CPU", "GPU"}}, -- {"ReduceL2", V_2023_1, {"NPU"}}, - {"ReduceLogSum", V_2020_4, {"CPU"}}, - {"ReduceLogSum", V_2022_1, {"CPU", "GPU"}}, -- {"ReduceLogSum", V_2023_1, {"NPU"}}, - {"ReduceLogSumExp", V_2022_1, {"CPU", "GPU"}}, -- {"ReduceLogSumExp", V_2023_1, {"NPU"}}, - {"ReduceMax", V_2020_4, {"CPU", "GPU"}}, -- {"ReduceMax", V_2023_1, {"NPU"}}, - {"ReduceMean", V_2020_4, {"CPU", "GPU"}}, -- {"ReduceMean", V_2023_0, {"NPU"}}, - {"ReduceMin", V_2020_4, {"CPU", "GPU"}}, -- {"ReduceMin", V_2023_1, {"NPU"}}, - {"ReduceProd", V_2020_4, {"CPU"}}, - {"ReduceProd", V_2022_1, {"GPU"}}, -- {"ReduceProd", V_2023_1, {"NPU"}}, - {"ReduceSum", V_2020_4, {"CPU", "GPU"}}, -- // {"ReduceSum", V_2023_1, {"NPU"}}, - {"ReduceSumSquare", V_2020_4, {"CPU"}}, - {"ReduceSumSquare", V_2022_1, {"CPU", "GPU"}}, -- {"ReduceSumSquare", V_2023_1, {"NPU"}}, - {"Relu", V_2020_4, {"CPU", "GPU"}}, -- {"Relu", V_2023_0, {"NPU"}}, - {"Resize", V_2020_4, {"CPU"}}, - {"Resize", V_2022_1, {"GPU"}}, -- {"Resize", V_2023_1, {"NPU"}}, - {"Reshape", V_2020_4, {"CPU", "GPU"}}, -- {"Reshape", V_2023_0, {"NPU"}}, - {"ReverseSequence", V_2022_1, {"CPU", "GPU"}}, - {"RoiAlign", V_2021_1, {"CPU", "GPU"}}, -- {"RoiAlign", V_2023_1, {"NPU"}}, - {"Round", V_2021_4, {"CPU", "GPU"}}, -- {"Round", V_2023_1, {"NPU"}}, - {"Scatter", V_2022_1, {"CPU", "GPU"}}, -- {"Scatter", V_2023_1, {"NPU"}}, - {"ScatterElements", V_2022_1, {"CPU", "GPU"}}, -- {"ScatterElements", V_2023_1, {"NPU"}}, - {"ScatterND", V_2022_1, {"CPU", "GPU"}}, -- {"ScatterND", V_2023_1, {"NPU"}}, - {"Selu", V_2020_4, {"CPU", "GPU"}}, -- {"Selu", V_2023_1, {"NPU"}}, - {"Shape", V_2020_4, {"CPU", "GPU"}}, -- {"Shape", V_2023_0, {"NPU"}}, - {"Shrink", V_2022_1, {"CPU", "GPU"}}, -- {"Shrink", V_2023_0, {"NPU"}}, - {"Sigmoid", V_2020_4, {"CPU", "GPU"}}, -- {"Sigmoid", V_2023_0, {"NPU"}}, - {"Sign", V_2020_4, {"CPU"}}, - {"Sign", V_2022_1, {"GPU"}}, -- {"Sign", V_2023_0, {"NPU"}}, - {"Sin", V_2022_1, {"CPU", "GPU"}}, -- {"Sin", V_2023_0, {"NPU"}}, - {"Sinh", V_2020_4, {"CPU"}}, -- {"Sinh", V_2023_1, {"NPU"}}, - {"Size", V_2022_1, {"CPU", "GPU"}}, -- {"Size", V_2023_1, {"NPU"}}, - {"Slice", V_2020_4, {"CPU", "GPU"}}, -- {"Slice", V_2023_0, {"NPU"}}, - {"Softmax", V_2020_4, {"CPU", "GPU"}}, -- {"Softmax", V_2023_0, {"NPU"}}, - {"Softplus", V_2022_1, {"CPU", "GPU"}}, -- {"Softplus", V_2023_0, {"NPU"}}, - {"Softsign", V_2022_1, {"CPU", "GPU"}}, - {"SpaceToDepth", V_2020_4, {"CPU", "GPU"}}, -- {"SpaceToDepth", V_2023_0, {"NPU"}}, - {"Split", V_2020_4, {"CPU", "GPU"}}, -- {"Split", V_2023_0, {"NPU"}}, - {"Sqrt", V_2020_4, {"CPU", "GPU"}}, -- {"Sqrt", V_2023_0, {"NPU"}}, - {"Squeeze", V_2020_4, {"CPU", "GPU"}}, -- {"Squeeze", V_2023_0, {"NPU"}}, - {"Softsign", V_2020_4, {"CPU"}}, - {"Sub", V_2020_4, {"CPU", "GPU"}}, -- {"Sub", V_2023_0, {"NPU"}}, - {"Sum", V_2020_4, {"CPU", "GPU"}}, -- {"Sum", V_2023_0, {"NPU"}}, - {"Tan", V_2020_4, {"CPU", "GPU"}}, -- {"Tan", V_2023_1, {"NPU"}}, - {"Tanh", V_2020_4, {"CPU", "GPU"}}, -- {"Tanh", V_2023_0, {"NPU"}}, - {"ThresholdedRelu", V_2022_1, {"CPU", "GPU"}}, -- {"ThresholdedRelu", V_2023_0, {"NPU"}}, - {"Tile", V_2021_3, {"CPU", "GPU"}}, -- {"Tile", V_2023_0, {"NPU"}}, - {"Transpose", V_2020_4, {"CPU", "GPU"}}, -- {"Transpose", V_2023_0, {"NPU"}}, - {"Trilu", V_2023_0, {"CPU", "GPU"}}, -- {"Trilu", V_2023_1, {"NPU"}}, - {"TopK", V_2020_4, {"CPU", "GPU"}}, -- {"TopK", V_2023_0, {"NPU"}}, - {"Upsample", V_2020_4, {"CPU", "GPU"}}, - {"Unsqueeze", V_2020_4, {"CPU", "GPU"}}, -- {"Unsqueeze", V_2023_0, {"NPU"}}, - {"Where", V_2022_1, {"CPU", "GPU"}}, -- {"Where", V_2023_0, {"NPU"}}, // Added for whisper decoder model. - {"Xor", V_2022_1, {"CPU", "GPU"}}, -- {"Xor", V_2023_1, {"NPU"}}, - }; - - void DataOps::populate_types_supported() { -@@ -370,6 +251,8 @@ void DataOps::populate_types_supported() { - std::make_pair(V_2020_4, ONNX_NAMESPACE::TensorProto_DataType::TensorProto_DataType_INT32)); - supported_types_initializer_.insert( - std::make_pair(V_2020_4, ONNX_NAMESPACE::TensorProto_DataType::TensorProto_DataType_INT64)); -+ supported_types_initializer_.insert( -+ std::make_pair(V_2020_4, ONNX_NAMESPACE::TensorProto_DataType::TensorProto_DataType_UINT16)); - supported_types_initializer_.insert( - std::make_pair(V_2021_1, ONNX_NAMESPACE::TensorProto_DataType::TensorProto_DataType_FLOAT16)); - supported_types_initializer_.insert( -@@ -387,6 +270,8 @@ void DataOps::populate_types_supported() { - std::make_pair(V_2020_4, ONNX_NAMESPACE::TensorProto_DataType::TensorProto_DataType_INT8)); - supported_types_npu_.insert( - std::make_pair(V_2020_4, ONNX_NAMESPACE::TensorProto_DataType::TensorProto_DataType_INT16)); -+ supported_types_npu_.insert( -+ std::make_pair(V_2020_4, ONNX_NAMESPACE::TensorProto_DataType::TensorProto_DataType_UINT16)); - supported_types_npu_.insert( - std::make_pair(V_2020_4, ONNX_NAMESPACE::TensorProto_DataType::TensorProto_DataType_INT32)); - supported_types_npu_.insert( -@@ -402,6 +287,8 @@ void DataOps::populate_types_supported() { - std::make_pair(V_2020_4, ONNX_NAMESPACE::TensorProto_DataType::TensorProto_DataType_INT32)); - supported_types_cpu_.insert( - std::make_pair(V_2020_4, ONNX_NAMESPACE::TensorProto_DataType::TensorProto_DataType_INT16)); -+ supported_types_cpu_.insert( -+ std::make_pair(V_2020_4, ONNX_NAMESPACE::TensorProto_DataType::TensorProto_DataType_UINT16)); - supported_types_cpu_.insert( - std::make_pair(V_2020_4, ONNX_NAMESPACE::TensorProto_DataType::TensorProto_DataType_INT8)); - supported_types_cpu_.insert( -@@ -437,13 +324,12 @@ void DataOps::populate_op_mode_supported() { - no_dimension_supported_.push_back({"DequantizeLinear", V_2021_4, {"All"}}); - no_dimension_supported_.push_back({"Equal", V_2022_1, {"CPU"}}); - no_dimension_supported_.push_back({"Equal", V_2023_0, {"GPU"}}); -+ no_dimension_supported_.push_back({"Expand", V_2023_3, {"CPU"}}); - no_dimension_supported_.push_back({"Floor", V_2020_4, {"All"}}); - no_dimension_supported_.push_back({"Gather", V_2020_4, {"All"}}); -- no_dimension_supported_.push_back({"Greater", V_2023_0, {"NPU"}}); - no_dimension_supported_.push_back({"Identity", V_2023_0, {"All"}}); - no_dimension_supported_.push_back({"Less", V_2022_1, {"CPU"}}); - no_dimension_supported_.push_back({"Loop", V_2021_4, {"All"}}); -- no_dimension_supported_.push_back({"Max", V_2023_0, {"NPU"}}); - no_dimension_supported_.push_back({"Min", V_2020_4, {"All"}}); - no_dimension_supported_.push_back({"Mul", V_2020_4, {"All"}}); - no_dimension_supported_.push_back({"Neg", V_2023_0, {"CPU", "GPU"}}); -@@ -476,9 +362,8 @@ void DataOps::populate_op_mode_supported() { - { - UnsupportedOpMode obj = {{V_2022_1, V_2022_2, V_2022_3}, - [this](const Node* node, const InitializedTensorSet&) { -- // Abs is not supproted with INT8 or INT32 as input data type on GPU and NPU -- if ((device_id_.find("GPU") != std::string::npos) || -- (device_id_.find("NPU") != std::string::npos)) { -+ // Abs is not supproted with INT8 or INT32 as input data type on GPU -+ if ((device_id_.find("GPU") != std::string::npos)) { - for (size_t i = 0; i < node->InputDefs().size(); i++) { - if (node->InputDefs()[i]->TypeAsProto()->tensor_type().elem_type() == - ONNX_NAMESPACE::TensorProto_DataType::TensorProto_DataType_INT8 || -@@ -706,7 +591,7 @@ void DataOps::populate_op_mode_supported() { - op_list_.insert({"PRelu", obj}); - } - { -- UnsupportedOpMode obj = {{V_2023_0, V_2023_1, V_2023_2, V_2023_3}, -+ UnsupportedOpMode obj = {{V_2023_1, V_2023_2, V_2023_3, V_2024_0}, - [this](const Node* node, const InitializedTensorSet&) { - const auto& input_arg = node->InputDefs()[1]; - auto shape = input_arg->Shape(); -@@ -821,7 +706,7 @@ void DataOps::populate_op_mode_supported() { - op_list_.insert({"Squeeze", obj}); - } - { -- UnsupportedOpMode obj = {{V_2023_0, V_2023_1, V_2023_2, V_2023_3}, -+ UnsupportedOpMode obj = {{V_2023_1, V_2023_2, V_2023_3, V_2024_0}, - [this](const Node* node, const InitializedTensorSet&) { - // If the operator is unsqueeze - // If axes is an input, then we cannot produce a static graph. -@@ -836,7 +721,7 @@ void DataOps::populate_op_mode_supported() { - op_list_.insert({"Unsqueeze", obj}); - } - { -- UnsupportedOpMode obj = {{V_2023_0, V_2023_1, V_2023_2, V_2023_3}, -+ UnsupportedOpMode obj = {{V_2023_1, V_2023_2, V_2023_3, V_2024_0}, - [this](const Node* node, const InitializedTensorSet&) { - // check for attributes - auto& upsample_attr = node->GetAttributes(); -@@ -961,7 +846,7 @@ bool DataOps::type_is_supported(const NodeArg* node_arg, bool is_initializer) { - } else { - auto dtype = type_proto->tensor_type().elem_type(); - -- if (device_id_.find("NPU") != std::string::npos || device_id_.find("HETERO") != std::string::npos || -+ if (device_id_.find("HETERO") != std::string::npos || - device_id_.find("MULTI") != std::string::npos || device_id_.find("AUTO") != std::string::npos) { - for (auto const& var : supported_types_npu_) { - if ((var.first <= version_id_) && -@@ -1063,8 +948,7 @@ bool DataOps::dimension_unsupported(const Node* node) { - return true; - } - --bool DataOps::node_is_supported(const std::map>& op_map, -- const NodeIndex node_idx) { -+bool DataOps::node_is_supported(const NodeIndex node_idx) { - const auto& node = graph_viewer_.GetNode(node_idx); - const auto& optype = node->OpType(); - -@@ -1174,37 +1058,14 @@ bool DataOps::node_is_supported(const std::mapOpType()); -- if (opset == op_map.end()) { --#ifndef NDEBUG -- if (openvino_ep::backend_utils::IsDebugEnabled()) { -- std::cout << "Failed in Unsupported onnx model domain" << std::endl; -- } --#endif -- return false; -- } -- if (opset->second.find(optype) == opset->second.end() && op_fun == ops_supported_as_function.end()) { --#ifndef NDEBUG -- if (openvino_ep::backend_utils::IsDebugEnabled()) { -- std::cout << "The operator is not available in OpenVINO ngraph operators list" -- << "nor the operator is a special ONNX function" -- << std::endl; -- } --#endif -- return false; -- } - return true; - } - - std::vector DataOps::GetUnsupportedNodeIndices(std::unordered_set& ng_required_initializers) { -- const auto ng_supported_ops = GetNgSupportedOps(GetOnnxOpSet(graph_viewer_)); -- - std::vector unsupported_nodes_idx; - - for (const auto& node_idx : graph_viewer_.GetNodesInTopologicalOrder()) { -- if (node_is_supported(ng_supported_ops, node_idx)) { -+ if (node_is_supported(node_idx)) { - // Collect inputs that are initializers - graph_viewer_.GetNode(node_idx)->ForEachDef([&ng_required_initializers, this](const NodeArg& node_arg, - bool is_input) { -diff --git a/onnxruntime/core/providers/openvino/ov_versions/data_ops.h b/onnxruntime/core/providers/openvino/ov_versions/data_ops.h -index 87688601ad6925f46de0b68a55cdcff71cbd3203..0990904908111e7b2cbac857a80115dc669fd5b4 100644 ---- a/onnxruntime/core/providers/openvino/ov_versions/data_ops.h -+++ b/onnxruntime/core/providers/openvino/ov_versions/data_ops.h -@@ -1,4 +1,4 @@ --// Copyright (C) 2019-2022 Intel Corporation -+// Copyright (C) Intel Corporation - // Licensed under the MIT License - - #pragma once -@@ -26,7 +26,8 @@ enum versionNum { - V_2023_0, - V_2023_1, - V_2023_2, -- V_2023_3 -+ V_2023_3, -+ V_2024_0 - }; - - using VersionNum = enum versionNum; -@@ -67,9 +68,7 @@ class DataOps { - bool dimension_unsupported(const Node* node); - bool unsupported_op_mode(const Node* node); - bool type_is_supported(const NodeArg* node_arg, bool is_initializer); -- bool node_is_supported(const std::map>& op_map, -- const NodeIndex node_idx); -+ bool node_is_supported(const NodeIndex node_idx); - - public: - DataOps(const GraphViewer& graph_viewer_param, VersionNum ver, const std::string dev_id, const std::string device_precision) -diff --git a/onnxruntime/core/providers/openvino/ov_versions/utils.cc b/onnxruntime/core/providers/openvino/ov_versions/utils.cc -index ee0bfddb7dc83d8403c9e86030694fedc861d2f9..c5ed29df487b45110d3362866d4fd563d3fd0d79 100644 ---- a/onnxruntime/core/providers/openvino/ov_versions/utils.cc -+++ b/onnxruntime/core/providers/openvino/ov_versions/utils.cc -@@ -1,4 +1,4 @@ --// Copyright (C) 2019-2022 Intel Corporation -+// Copyright (C) Intel Corporation - // Licensed under the MIT License - - #include "core/providers/shared_library/provider_api.h" -@@ -11,14 +11,6 @@ - #pragma GCC diagnostic ignored "-Wunused-parameter" - #endif - --#include "openvino/core/deprecated.hpp" --#define IN_OV_COMPONENT --#define NGRAPH_LEGACY_HEADER_INCLUDED --#include -- --#undef NGRAPH_LEGACY_HEADER_INCLUDED --#undef IN_OV_COMPONENT -- - #if defined(_MSC_VER) - #pragma warning(default : 4244 4245) - #elif __GNUC__ -@@ -95,20 +87,6 @@ int GetOnnxOpSet(const GraphViewer& graph_viewer) { - return dm_to_ver.at(kOnnxDomain); - } - --std::map> GetNgSupportedOps(const int onnx_opset) { -- std::map> ng_supported_ops; -- OPENVINO_SUPPRESS_DEPRECATED_START -- ng_supported_ops.emplace(kOnnxDomain, ngraph::onnx_import::get_supported_operators(onnx_opset, kOnnxDomain)); -- -- const std::set ng_disabled_ops = {"LSTM"}; // Place-holder for ops not supported. -- -- for (const auto& disabled_op : ng_disabled_ops) { -- ng_supported_ops.at(kOnnxDomain).erase(disabled_op); -- } -- OPENVINO_SUPPRESS_DEPRECATED_END -- return ng_supported_ops; --} -- - /** - * Returns a vector clusters(or node_idx). For each unsupported node, the graph is split into 3 parts. - * supported_cluster + (UNsupported_node + rest_of_the_graph). This functions returns vector of all supported_clusters by nGraph -diff --git a/onnxruntime/core/providers/openvino/ov_versions/utils.h b/onnxruntime/core/providers/openvino/ov_versions/utils.h -index b3edeef88dfec1951124dc17d2aab13ddd105967..34aa762ba9b6782067287417eef7ea55ccfd54a1 100644 ---- a/onnxruntime/core/providers/openvino/ov_versions/utils.h -+++ b/onnxruntime/core/providers/openvino/ov_versions/utils.h -@@ -1,4 +1,4 @@ --// Copyright (C) 2019-2022 Intel Corporation -+// Copyright (C) Intel Corporation - // Licensed under the MIT License - #pragma once - -diff --git a/onnxruntime/python/onnxruntime_pybind_state.cc b/onnxruntime/python/onnxruntime_pybind_state.cc -index e5e0e81cb7da890cd970d64e4c6310cf02320210..7b56f0c68427a42ef305be933a9ef169b1b07210 100644 ---- a/onnxruntime/python/onnxruntime_pybind_state.cc -+++ b/onnxruntime/python/onnxruntime_pybind_state.cc -@@ -937,6 +937,20 @@ std::unique_ptr CreateExecutionProviderInstance( - ORT_THROW("Invalid value passed for disable_dynamic_shapes: ", option.second); - } - OV_provider_options_map[option.first] = option.second; -+ } else if (option.first == "enable_dynamic_shapes") { -+ LOGS_DEFAULT(WARNING) << " Deprecation notice - 'enable_dynamic_shapes' is Deprected. Upgrade the API to disable_dynamic_shapes parameter." -+ "Please refer https://onnxruntime.ai/docs/execution-providers/OpenVINO-ExecutionProvider.html#requirements to ensure all dependencies are met."; -+ std::string value; -+ if (!(option.second == "True" || option.second == "true" || -+ option.second == "False" || option.second == "false")) { -+ ORT_THROW("Invalid value passed for enable_dynamic_shapes: ", option.second); -+ } -+ if (option.second == "True" || option.second == "true") { -+ value = "false"; -+ } else { -+ value = "true"; -+ } -+ OV_provider_options_map["disable_dynamic_shapes"] = value; - } else if (option.first == "device_id") { - OV_provider_options_map[option.first] = option.second; - continue; -@@ -967,7 +981,7 @@ std::unique_ptr CreateExecutionProviderInstance( - if (!Env::Default().GetEnvironmentVar("INTEL_OPENVINO_DIR").empty()) { - ORT_THROW("INTEL_OPENVINO_DIR is set but OpenVINO library wasn't able to be loaded. Please install a supported version of OpenVINO as mentioned in the requirements page (https://onnxruntime.ai/docs/execution-providers/OpenVINO-ExecutionProvider.html#requirements), ensure dependency libraries are in the PATH and your hardware is supported."); - } else { -- LOGS_DEFAULT(WARNING) << "Failed to create " << type << ". Please reference https://onnxruntime.ai/docs/execution-providers/OpenVINO-ExecutionProvider.html#requirements to ensure all dependencies are met."; -+ LOGS_DEFAULT(WARNING) << "Failed to create " << type << ". Please refer https://onnxruntime.ai/docs/execution-providers/OpenVINO-ExecutionProvider.html#requirements to ensure all dependencies are met."; - } - } - #endif -diff --git a/onnxruntime/python/onnxruntime_pybind_state_common.h b/onnxruntime/python/onnxruntime_pybind_state_common.h -index 6827f2c9dfd91ff5b7b1766acacec7a82838c650..22314610dbee96a695196a9b4e75bd74b110d291 100644 ---- a/onnxruntime/python/onnxruntime_pybind_state_common.h -+++ b/onnxruntime/python/onnxruntime_pybind_state_common.h -@@ -60,11 +60,8 @@ struct OrtStatus { - #elif OPENVINO_CONFIG_GPU_FP16 - #define BACKEND_OPENVINO "-OPENVINO_GPU_FP16" - --#elif OPENVINO_CONFIG_NPU_FP16 --#define BACKEND_OPENVINO "-OPENVINO_NPU_FP16" -- --#elif OPENVINO_CONFIG_NPU_U8 --#define BACKEND_OPENVINO "-OPENVINO_NPU_U8" -+#elif OPENVINO_CONFIG_NPU -+#define BACKEND_OPENVINO "-OPENVINO_NPU" - - #elif OPENVINO_CONFIG_MULTI - #define BACKEND_OPENVINO "-OPENVINO_MULTI" -diff --git a/tools/ci_build/build.py b/tools/ci_build/build.py -index 1056c4ed8451011928e830fe26e15c90c0b7933a..fab23e360405263f201b015a6117dc316519c607 100644 ---- a/tools/ci_build/build.py -+++ b/tools/ci_build/build.py -@@ -75,13 +75,14 @@ def _str_to_bool(s): - - - def _openvino_verify_device_type(device_read): -- choices = ["CPU_FP32", "CPU_FP16", "GPU_FP32", "GPU_FP16"] -+ choices = ["CPU_FP32", "CPU_FP16", "GPU_FP32", "GPU_FP16", "NPU"] - - choices1 = [ - "CPU_FP32_NO_PARTITION", - "CPU_FP16_NO_PARTITION", - "GPU_FP32_NO_PARTITION", - "GPU_FP16_NO_PARTITION", -+ "NPU_NO_PARTITION", - ] - status_hetero = True - res = False -@@ -96,7 +97,7 @@ def _openvino_verify_device_type(device_read): - if len(comma_separated_devices) < 2: - print("At least two devices required in Hetero/Multi/Auto Mode") - status_hetero = False -- dev_options = ["CPU", "GPU"] -+ dev_options = ["CPU", "GPU", "NPU"] - for dev in comma_separated_devices: - if dev not in dev_options: - status_hetero = False -@@ -107,7 +108,7 @@ def invalid_hetero_build(): - print("specify the keyword HETERO or MULTI or AUTO followed by the devices ") - print("in the order of priority you want to build\n") - print("The different hardware devices that can be added in HETERO or MULTI or AUTO") -- print("are ['CPU','GPU'] \n") -+ print("are ['CPU','GPU','NPU'] \n") - print("An example of how to specify the hetero build type. Ex: HETERO:GPU,CPU \n") - print("An example of how to specify the MULTI build type. Ex: MULTI:GPU,CPU \n") - print("An example of how to specify the AUTO build type. Ex: AUTO:GPU,CPU \n") -@@ -1222,6 +1223,7 @@ def generate_build_tree( - "-Donnxruntime_USE_OPENVINO_GPU_FP16=" + ("ON" if args.use_openvino == "GPU_FP16" else "OFF"), - "-Donnxruntime_USE_OPENVINO_CPU_FP32=" + ("ON" if args.use_openvino == "CPU_FP32" else "OFF"), - "-Donnxruntime_USE_OPENVINO_CPU_FP16=" + ("ON" if args.use_openvino == "CPU_FP16" else "OFF"), -+ "-Donnxruntime_USE_OPENVINO_NPU=" + ("ON" if args.use_openvino == "NPU" else "OFF"), - "-Donnxruntime_USE_OPENVINO_GPU_FP32_NP=" - + ("ON" if args.use_openvino == "GPU_FP32_NO_PARTITION" else "OFF"), - "-Donnxruntime_USE_OPENVINO_GPU_FP16_NP=" -@@ -1230,6 +1232,7 @@ def generate_build_tree( - + ("ON" if args.use_openvino == "CPU_FP32_NO_PARTITION" else "OFF"), - "-Donnxruntime_USE_OPENVINO_CPU_FP16_NP=" - + ("ON" if args.use_openvino == "CPU_FP16_NO_PARTITION" else "OFF"), -+ "-Donnxruntime_USE_OPENVINO_NPU_NP=" + ("ON" if args.use_openvino == "NPU_NO_PARTITION" else "OFF"), - "-Donnxruntime_USE_OPENVINO_HETERO=" + ("ON" if args.use_openvino.startswith("HETERO") else "OFF"), - "-Donnxruntime_USE_OPENVINO_DEVICE=" + (args.use_openvino), - "-Donnxruntime_USE_OPENVINO_MULTI=" + ("ON" if args.use_openvino.startswith("MULTI") else "OFF"), -diff --git a/tools/ci_build/github/azure-pipelines/linux-openvino-ci-pipeline.yml b/tools/ci_build/github/azure-pipelines/linux-openvino-ci-pipeline.yml -index c92fc93abba37d3f8c4414da767a85bd7118166b..03e0274fc198ac2b28f6eee2fe0915800d27b56a 100644 ---- a/tools/ci_build/github/azure-pipelines/linux-openvino-ci-pipeline.yml -+++ b/tools/ci_build/github/azure-pipelines/linux-openvino-ci-pipeline.yml -@@ -32,5 +32,5 @@ jobs: - parameters: - AgentPool : 'Linux-CPU-2019' - JobName: 'Linux_CI_Dev' -- RunDockerBuildArgs: '-o ubuntu20.04 -d openvino -v 2023.0.0 -x "--use_openvino CPU_FP32 --build_wheel"' -+ RunDockerBuildArgs: '-o ubuntu20.04 -d openvino -v 2024.0.0 -x "--use_openvino CPU_FP32 --build_wheel"' - TimeoutInMinutes: 120 -diff --git a/tools/ci_build/github/linux/docker/Dockerfile.ubuntu_openvino b/tools/ci_build/github/linux/docker/Dockerfile.ubuntu_openvino -index a0ba5ea232ca3d5061fdfc565a3f7b703d0ceb48..45682c797bbb8389cb7d90dc31bdd60b682f318f 100644 ---- a/tools/ci_build/github/linux/docker/Dockerfile.ubuntu_openvino -+++ b/tools/ci_build/github/linux/docker/Dockerfile.ubuntu_openvino -@@ -1,8 +1,8 @@ - ARG UBUNTU_VERSION=20.04 - FROM ubuntu:${UBUNTU_VERSION} - --ARG OPENVINO_VERSION=2023.0.0 --ARG PYTHON_VERSION=3.8 -+ARG OPENVINO_VERSION=2024.0.0 -+ARG PYTHON_VERSION=3.9 - - ADD scripts /tmp/scripts - RUN /tmp/scripts/install_ubuntu.sh -p ${PYTHON_VERSION} -d EdgeDevice && \ -@@ -14,15 +14,14 @@ RUN apt update && apt install -y libnuma1 ocl-icd-libopencl1 && \ - - ENV INTEL_OPENVINO_DIR /opt/intel/openvino_${OPENVINO_VERSION} - ENV LD_LIBRARY_PATH $INTEL_OPENVINO_DIR/runtime/lib/intel64:$INTEL_OPENVINO_DIR/runtime/3rdparty/tbb/lib:/usr/local/openblas/lib:$LD_LIBRARY_PATH --ENV InferenceEngine_DIR $INTEL_OPENVINO_DIR/runtime/cmake --ENV ngraph_DIR $INTEL_OPENVINO_DIR/runtime/cmake -+ENV OpenVINO_DIR $INTEL_OPENVINO_DIR/runtime/cmake - ENV IE_PLUGINS_PATH $INTEL_OPENVINO_DIR/runtime/lib/intel64 - ENV DEBIAN_FRONTEND=noninteractive - - RUN cd /opt && mkdir -p intel && cd intel && \ -- wget https://storage.openvinotoolkit.org/repositories/openvino/packages/2023.0/linux/l_openvino_toolkit_ubuntu20_2023.0.0.10926.b4452d56304_x86_64.tgz && \ -- tar xzf l_openvino_toolkit_ubuntu20_2023.0.0.10926.b4452d56304_x86_64.tgz && rm -rf l_openvino_toolkit_ubuntu20_2023.0.0.10926.b4452d56304_x86_64.tgz && \ -- mv l_openvino_toolkit_ubuntu20_2023.0.0.10926.b4452d56304_x86_64 openvino_2023.0.0 && \ -+ wget https://storage.openvinotoolkit.org/repositories/openvino/packages/2024.0/linux/l_openvino_toolkit_ubuntu20_2024.0.0.14509.34caeefd078_x86_64.tgz && \ -+ tar xzf l_openvino_toolkit_ubuntu20_2024.0.0.14509.34caeefd078_x86_64.tgz && rm -rf l_openvino_toolkit_ubuntu20_2024.0.0.14509.34caeefd078_x86_64.tgz && \ -+ mv l_openvino_toolkit_ubuntu20_2024.0.0.14509.34caeefd078_x86_64 openvino_2024.0.0 && \ - cd $INTEL_OPENVINO_DIR/install_dependencies && ./install_openvino_dependencies.sh -y - - WORKDIR /root -diff --git a/tools/ci_build/github/linux/docker/Dockerfile_manylinux2014_openvino_multipython b/tools/ci_build/github/linux/docker/Dockerfile_manylinux2014_openvino_multipython -deleted file mode 100644 -index bc0b41277328622995a9b865ef03ff503d2ebd39..0000000000000000000000000000000000000000 ---- a/tools/ci_build/github/linux/docker/Dockerfile_manylinux2014_openvino_multipython -+++ /dev/null -@@ -1,83 +0,0 @@ --FROM quay.io/pypa/manylinux2014_x86_64:latest -- --ENV PATH /opt/rh/devtoolset-10/root/usr/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin --ADD scripts /tmp/scripts --RUN cd /tmp/scripts && /tmp/scripts/manylinux/install_centos.sh && /tmp/scripts/manylinux/install_deps.sh && rm -rf /tmp/scripts -- --ARG PYTHON_VER_PATH="cp38-cp38" --ARG PYTHON_VERSION="3.8" --ARG BUILD_UID=1001 --ARG BUILD_USER=onnxruntimedev --ARG OV_DEVICE_PRECISION="CPU_FP32" --ARG ENABLE_TRAINING=true --ARG ORT_BRANCH="rel-1.13.1" --ARG OV_VERSION="2022.2.0" --RUN adduser --uid $BUILD_UID $BUILD_USER --WORKDIR /home/$BUILD_USER --ENV PYTHON_EXE="/opt/python/$PYTHON_VER_PATH/bin/python$PYTHON_VERSION" -- --RUN yum -y install wget git -- --# libusb1.0.22 --RUN cd /home/ && wget https://github.com/libusb/libusb/archive/v1.0.22.zip && \ -- unzip v1.0.22.zip && rm -rf v1.0.22.zip && cd /home/libusb-1.0.22 && \ --# bootstrap steps -- ./bootstrap.sh && \ -- ./configure --disable-udev --enable-shared && \ -- make -j4 && \ --# configure libusb1.0.22 -- cd /home/libusb-1.0.22/libusb && \ -- /bin/mkdir -p '/usr/local/lib' && \ -- /bin/bash ../libtool --mode=install /usr/bin/install -c libusb-1.0.la '/usr/local/lib' && \ -- /bin/mkdir -p '/usr/local/include/libusb-1.0' && \ -- /usr/bin/install -c -m 644 libusb.h '/usr/local/include/libusb-1.0' && \ -- /bin/mkdir -p '/usr/local/lib/pkgconfig' -- --RUN ${PYTHON_EXE} -m pip install onnx numpy wheel --USER $BUILD_USER --RUN cd $WORKDIR && git clone https://github.com/openvinotoolkit/openvino.git && \ -- cd openvino && \ -- git checkout $OV_VERSION && \ -- git submodule init && \ -- git submodule update --recursive -- --RUN cd $WORKDIR && cd openvino && mkdir build && cd build && \ -- cmake .. -DCMAKE_BUILD_TYPE=Release -DCMAKE_CXX_FLAGS=-D_GLIBCXX_USE_CXX11_ABI=0 -DENABLE_PYTHON=ON -DPYTHON_EXECUTABLE=$PYTHON_EXE -DCMAKE_INSTALL_PREFIX=/home/onnxruntimedev/openvino_$OV_VERSION && \ -- make -j8 && make install -- --ENV INTEL_OPENVINO_DIR /home/onnxruntimedev/openvino_$OV_VERSION --ENV LD_LIBRARY_PATH $INTEL_OPENVINO_DIR/runtime/lib/intel64:$INTEL_OPENVINO_DIR/runtime/3rdparty/tbb/lib:/usr/local/openblas/lib:$LD_LIBRARY_PATH --ENV TBB_LIBS $INTEL_OPENVINO_DIR/runtime/3rdparty/tbb/lib --ENV InferenceEngine_DIR $INTEL_OPENVINO_DIR/runtime/cmake --ENV ngraph_DIR $INTEL_OPENVINO_DIR/runtime/cmake --ENV IE_PLUGINS_PATH $INTEL_OPENVINO_DIR/runtime/lib/intel64 --ENV OPENVINO_MANYLINUX 1 -- --RUN cd $WORKDIR && \ -- git clone --recursive -b $ORT_BRANCH https://github.com/intel/onnxruntime.git --RUN cd onnxruntime/onnxruntime/core/providers/openvino && mkdir scripts -- --RUN cp ${IE_PLUGINS_PATH}/libopenvino.so /home/onnxruntimedev/onnxruntime/onnxruntime/core/providers/openvino/scripts/ --RUN cp ${IE_PLUGINS_PATH}/libopenvino_c.so /home/onnxruntimedev/onnxruntime/onnxruntime/core/providers/openvino/scripts/ --RUN cp ${IE_PLUGINS_PATH}/libopenvino_onnx_frontend.so /home/onnxruntimedev/onnxruntime/onnxruntime/core/providers/openvino/scripts/ --RUN cp ${IE_PLUGINS_PATH}/libopenvino_intel_cpu_plugin.so /home/onnxruntimedev/onnxruntime/onnxruntime/core/providers/openvino/scripts/ --RUN cp ${IE_PLUGINS_PATH}/libopenvino_intel_gpu_plugin.so /home/onnxruntimedev/onnxruntime/onnxruntime/core/providers/openvino/scripts/ --RUN cp ${IE_PLUGINS_PATH}/libopenvino_intel_myriad_plugin.so /home/onnxruntimedev/onnxruntime/onnxruntime/core/providers/openvino/scripts/ --RUN cp ${IE_PLUGINS_PATH}/libopenvino_hetero_plugin.so /home/onnxruntimedev/onnxruntime/onnxruntime/core/providers/openvino/scripts/ --RUN cp ${IE_PLUGINS_PATH}/libopenvino_auto_plugin.so /home/onnxruntimedev/onnxruntime/onnxruntime/core/providers/openvino/scripts/ --RUN cp ${IE_PLUGINS_PATH}/plugins.xml /home/onnxruntimedev/onnxruntime/onnxruntime/core/providers/openvino/scripts/ --RUN cp ${IE_PLUGINS_PATH}/usb-ma2x8x.mvcmd /home/onnxruntimedev/onnxruntime/onnxruntime/core/providers/openvino/scripts/ --RUN cp ${TBB_LIBS}/libtbb.so /home/onnxruntimedev/onnxruntime/onnxruntime/core/providers/openvino/scripts/ --RUN cp ${TBB_LIBS}/libtbb.so.2 /home/onnxruntimedev/onnxruntime/onnxruntime/core/providers/openvino/scripts/ --RUN cp ${TBB_LIBS}/libtbbmalloc.so /home/onnxruntimedev/onnxruntime/onnxruntime/core/providers/openvino/scripts/ --RUN cp ${TBB_LIBS}/libtbbmalloc.so.2 /home/onnxruntimedev/onnxruntime/onnxruntime/core/providers/openvino/scripts/ --RUN cd /home/onnxruntimedev/onnxruntime && git pull --RUN if $ENABLE_TRAINING; then \ -- ${PYTHON_EXE} ./onnxruntime/tools/ci_build/build.py \ -- --build_dir ./onnxruntime/build --use_openvino $(OV_DEVICE_PRECISION) --build_shared_lib \ -- --config Release --build_wheel --skip_tests --enable_training ; \ -- else \ -- ${PYTHON_EXE} ./onnxruntime/tools/ci_build/build.py \ -- --build_dir ./onnxruntime/build --use_openvino $(OV_DEVICE_PRECISION) --build_shared_lib \ -- --config Release --build_wheel --skip_tests ;\ -- fi -diff --git a/tools/nuget/generate_nuspec_for_native_nuget.py b/tools/nuget/generate_nuspec_for_native_nuget.py -index 09fe99d36cc340fb145a52f319df75cdc45aa709..7180377bd744f86d9d5407aefd57cbb159024d30 100644 ---- a/tools/nuget/generate_nuspec_for_native_nuget.py -+++ b/tools/nuget/generate_nuspec_for_native_nuget.py -@@ -732,7 +732,7 @@ def generate_files(line_list, args): - ) - - if args.execution_provider == "openvino": -- openvino_path = get_env_var("INTEL_OPENVINO_DIR") -+ get_env_var("INTEL_OPENVINO_DIR") - files_list.append( - "' - ) - -- if is_windows(): -- dll_list_path = os.path.join(openvino_path, "runtime\\bin\\intel64\\Release\\") -- tbb_list_path = os.path.join(openvino_path, "runtime\\3rdparty\\tbb\\bin\\") -- -- for dll_element in os.listdir(dll_list_path): -- if dll_element.endswith("dll"): -- files_list.append( -- "' -- ) -- -- for tbb_element in os.listdir(tbb_list_path): -- if tbb_element.endswith("dll"): -- files_list.append( -- "' -- ) -- - if args.execution_provider == "cuda" or is_cuda_gpu_win_sub_package and not is_ado_packaging_build: - files_list.append( - "") +onnxruntime_fetchcontent_makeavailable(GSL) + +find_path(safeint_SOURCE_DIR NAMES "SafeInt.hpp") +if(NOT safeint_SOURCE_DIR) + unset(safeint_SOURCE_DIR) + FetchContent_Declare( + safeint + URL ${DEP_URL_safeint} + URL_HASH SHA1=${DEP_SHA1_safeint} + ) + + # use fetch content rather than makeavailable because safeint only includes unconditional test targets + FetchContent_Populate(safeint) +endif() +add_library(safeint_interface INTERFACE) +target_include_directories(safeint_interface INTERFACE ${safeint_SOURCE_DIR}) + + +# Flatbuffers +# We do not need to build flatc for iOS or Android Cross Compile +if (CMAKE_SYSTEM_NAME STREQUAL "iOS" OR CMAKE_SYSTEM_NAME STREQUAL "Android" OR CMAKE_SYSTEM_NAME STREQUAL "Emscripten") + set(FLATBUFFERS_BUILD_FLATC OFF CACHE BOOL "FLATBUFFERS_BUILD_FLATC" FORCE) +endif() +set(FLATBUFFERS_BUILD_TESTS OFF CACHE BOOL "FLATBUFFERS_BUILD_TESTS" FORCE) +set(FLATBUFFERS_INSTALL OFF CACHE BOOL "FLATBUFFERS_INSTALL" FORCE) +set(FLATBUFFERS_BUILD_FLATHASH OFF CACHE BOOL "FLATBUFFERS_BUILD_FLATHASH" FORCE) +set(FLATBUFFERS_BUILD_FLATLIB ON CACHE BOOL "FLATBUFFERS_BUILD_FLATLIB" FORCE) +if(Patch_FOUND) + set(ONNXRUNTIME_FLATBUFFERS_PATCH_COMMAND ${Patch_EXECUTABLE} --binary --ignore-whitespace -p1 < ${PROJECT_SOURCE_DIR}/patches/flatbuffers/flatbuffers.patch) +else() + set(ONNXRUNTIME_FLATBUFFERS_PATCH_COMMAND "") +endif() + +#flatbuffers 1.11.0 does not have flatbuffers::IsOutRange, therefore we require 1.12.0+ +FetchContent_Declare( + flatbuffers + URL ${DEP_URL_flatbuffers} + URL_HASH SHA1=${DEP_SHA1_flatbuffers} + PATCH_COMMAND ${ONNXRUNTIME_FLATBUFFERS_PATCH_COMMAND} + FIND_PACKAGE_ARGS 23.5.9 NAMES Flatbuffers flatbuffers +) + +onnxruntime_fetchcontent_makeavailable(flatbuffers) +if(NOT flatbuffers_FOUND) + if(NOT TARGET flatbuffers::flatbuffers) + add_library(flatbuffers::flatbuffers ALIAS flatbuffers) + endif() + if(TARGET flatc AND NOT TARGET flatbuffers::flatc) + add_executable(flatbuffers::flatc ALIAS flatc) + endif() + if (GDK_PLATFORM) + # cstdlib only defines std::getenv when _CRT_USE_WINAPI_FAMILY_DESKTOP_APP is defined, which + # is probably an oversight for GDK/Xbox builds (::getenv exists and works). + file(WRITE ${CMAKE_BINARY_DIR}/gdk_cstdlib_wrapper.h [[ +#pragma once +#ifdef __cplusplus +#include +namespace std { using ::getenv; } +#endif +]]) + if(TARGET flatbuffers) + target_compile_options(flatbuffers PRIVATE /FI${CMAKE_BINARY_DIR}/gdk_cstdlib_wrapper.h) + endif() + if(TARGET flatc) + target_compile_options(flatc PRIVATE /FI${CMAKE_BINARY_DIR}/gdk_cstdlib_wrapper.h) + endif() + endif() +endif() + +# ONNX +if (NOT onnxruntime_USE_FULL_PROTOBUF) + set(ONNX_USE_LITE_PROTO ON CACHE BOOL "" FORCE) +else() + set(ONNX_USE_LITE_PROTO OFF CACHE BOOL "" FORCE) +endif() + +if(Patch_FOUND) + set(ONNXRUNTIME_ONNX_PATCH_COMMAND ${Patch_EXECUTABLE} --binary --ignore-whitespace -p1 < ${PROJECT_SOURCE_DIR}/patches/onnx/onnx.patch) +else() + set(ONNXRUNTIME_ONNX_PATCH_COMMAND "") +endif() + +FetchContent_Declare( + onnx + URL ${DEP_URL_onnx} + URL_HASH SHA1=${DEP_SHA1_onnx} + PATCH_COMMAND ${ONNXRUNTIME_ONNX_PATCH_COMMAND} + FIND_PACKAGE_ARGS NAMES ONNX onnx +) +if (NOT onnxruntime_MINIMAL_BUILD) + onnxruntime_fetchcontent_makeavailable(onnx) +else() + include(onnx_minimal) +endif() + +if(TARGET ONNX::onnx AND NOT TARGET onnx) + message(STATUS "Aliasing ONNX::onnx to onnx") + add_library(onnx ALIAS ONNX::onnx) +endif() +if(TARGET ONNX::onnx_proto AND NOT TARGET onnx_proto) + message(STATUS "Aliasing ONNX::onnx_proto to onnx_proto") + add_library(onnx_proto ALIAS ONNX::onnx_proto) +endif() + +if(onnxruntime_USE_VCPKG) + find_package(Eigen3 CONFIG REQUIRED) + get_target_property(eigen_INCLUDE_DIRS Eigen3::Eigen INTERFACE_INCLUDE_DIRECTORIES) +else() + include(eigen) # FetchContent +endif() + +if(onnxruntime_USE_VCPKG) + find_package(wil CONFIG REQUIRED) + set(WIL_TARGET "WIL::WIL") +else() + include(wil) # FetchContent +endif() + +# XNNPACK EP +if (onnxruntime_USE_XNNPACK) + if (onnxruntime_DISABLE_CONTRIB_OPS) + message(FATAL_ERROR "XNNPACK EP requires the internal NHWC contrib ops to be available " + "but onnxruntime_DISABLE_CONTRIB_OPS is ON") + endif() + include(xnnpack) +endif() + +if (onnxruntime_USE_MIMALLOC) + add_definitions(-DUSE_MIMALLOC) + + set(MI_OVERRIDE OFF CACHE BOOL "" FORCE) + set(MI_BUILD_TESTS OFF CACHE BOOL "" FORCE) + set(MI_DEBUG_FULL OFF CACHE BOOL "" FORCE) + set(MI_BUILD_SHARED OFF CACHE BOOL "" FORCE) + onnxruntime_fetchcontent_makeavailable(mimalloc) +endif() + +#onnxruntime_EXTERNAL_LIBRARIES could contain onnx, onnx_proto,libprotobuf, cuda/cudnn, +# dnnl/mklml, onnxruntime_codegen_tvm, tvm and pthread +# pthread is always at the last +set(onnxruntime_EXTERNAL_LIBRARIES ${onnxruntime_EXTERNAL_LIBRARIES_XNNPACK} ${WIL_TARGET} nlohmann_json::nlohmann_json onnx onnx_proto ${PROTOBUF_LIB} re2::re2 Boost::mp11 safeint_interface flatbuffers::flatbuffers ${GSL_TARGET} ${ABSEIL_LIBS} date::date ${ONNXRUNTIME_CLOG_TARGET_NAME}) +# The source code of onnx_proto is generated, we must build this lib first before starting to compile the other source code that uses ONNX protobuf types. +# The other libs do not have the problem. All the sources are already there. We can compile them in any order. +set(onnxruntime_EXTERNAL_DEPENDENCIES onnx_proto flatbuffers::flatbuffers) + +if(NOT (onnx_FOUND OR ONNX_FOUND)) # building ONNX from source + target_compile_definitions(onnx PUBLIC $ PRIVATE "__ONNX_DISABLE_STATIC_REGISTRATION") + if (NOT onnxruntime_USE_FULL_PROTOBUF) + target_compile_definitions(onnx PUBLIC "__ONNX_NO_DOC_STRINGS") + endif() +endif() + +if (onnxruntime_RUN_ONNX_TESTS) + add_definitions(-DORT_RUN_EXTERNAL_ONNX_TESTS) +endif() + + +if(onnxruntime_ENABLE_ATEN) + message(STATUS "Aten fallback is enabled.") + FetchContent_Declare( + dlpack + URL ${DEP_URL_dlpack} + URL_HASH SHA1=${DEP_SHA1_dlpack} + FIND_PACKAGE_ARGS NAMES dlpack + ) + # We can't use onnxruntime_fetchcontent_makeavailable since some part of the the dlpack code is Linux only. + # For example, dlpackcpp.h uses posix_memalign. + FetchContent_Populate(dlpack) +endif() + +if(onnxruntime_ENABLE_TRAINING OR (onnxruntime_ENABLE_TRAINING_APIS AND onnxruntime_BUILD_UNIT_TESTS)) + # Once code under orttraining/orttraining/models dir is removed "onnxruntime_ENABLE_TRAINING" should be removed from + # this conditional + FetchContent_Declare( + cxxopts + URL ${DEP_URL_cxxopts} + URL_HASH SHA1=${DEP_SHA1_cxxopts} + FIND_PACKAGE_ARGS NAMES cxxopts + ) + set(CXXOPTS_BUILD_EXAMPLES OFF CACHE BOOL "" FORCE) + set(CXXOPTS_BUILD_TESTS OFF CACHE BOOL "" FORCE) + onnxruntime_fetchcontent_makeavailable(cxxopts) +endif() + +if (onnxruntime_USE_COREML) + FetchContent_Declare( + coremltools + URL ${DEP_URL_coremltools} + URL_HASH SHA1=${DEP_SHA1_coremltools} + PATCH_COMMAND ${Patch_EXECUTABLE} --binary --ignore-whitespace -p1 < ${PROJECT_SOURCE_DIR}/patches/coremltools/crossplatformbuild.patch + ) + # we don't build directly so use Populate. selected files are built from onnxruntime_providers_coreml.cmake + FetchContent_Populate(coremltools) +endif() + +message(STATUS "Finished fetching external dependencies") + + +set(onnxruntime_LINK_DIRS ) +if (onnxruntime_USE_CUDA) + #TODO: combine onnxruntime_CUDNN_HOME and onnxruntime_CUDA_HOME, assume they are the same + find_package(CUDAToolkit REQUIRED) + if (WIN32) + if(onnxruntime_CUDNN_HOME) + list(APPEND onnxruntime_LINK_DIRS ${onnxruntime_CUDNN_HOME}/lib ${onnxruntime_CUDNN_HOME}/lib/x64) + endif() + else() + if(onnxruntime_CUDNN_HOME) + list(APPEND onnxruntime_LINK_DIRS ${onnxruntime_CUDNN_HOME}/lib ${onnxruntime_CUDNN_HOME}/lib64) + endif() + endif() +endif() + +if(onnxruntime_USE_SNPE) + include(external/find_snpe.cmake) + list(APPEND onnxruntime_EXTERNAL_LIBRARIES ${SNPE_NN_LIBS}) +endif() + +FILE(TO_NATIVE_PATH ${CMAKE_BINARY_DIR} ORT_BINARY_DIR) +FILE(TO_NATIVE_PATH ${PROJECT_SOURCE_DIR} ORT_SOURCE_DIR) diff --git a/ports/onnxruntime/onnxruntime_vcpkg_deps.cmake b/ports/onnxruntime/onnxruntime_vcpkg_deps.cmake deleted file mode 100644 index f7fcd838..00000000 --- a/ports/onnxruntime/onnxruntime_vcpkg_deps.cmake +++ /dev/null @@ -1,154 +0,0 @@ -message(STATUS "Using Dependencies from vcpkg...") - -# ABSL should be included before protobuf because protobuf may use absl -find_package(absl CONFIG REQUIRED) -list(APPEND ABSEIL_LIBS - absl::base - absl::city - absl::core_headers - absl::fixed_array - absl::flags - absl::flat_hash_map - absl::flat_hash_set - absl::hash - absl::inlined_vector - absl::low_level_hash - absl::node_hash_map - absl::node_hash_set - absl::optional - absl::raw_hash_set - absl::raw_logging_internal - absl::span - absl::str_format - absl::strings - absl::synchronization - absl::throw_delegate - absl::time -) -list(APPEND onnxruntime_EXTERNAL_LIBRARIES ${ABSEIL_LIBS}) - -find_package(re2 CONFIG REQUIRED) # re2::re2 -list(APPEND onnxruntime_EXTERNAL_LIBRARIES re2::re2) - -if (onnxruntime_BUILD_UNIT_TESTS) - # gtest and gmock - find_package(GTest CONFIG REQUIRED) # GTest::gtest GTest::gtest_main GTest::gmock GTest::gmock_main -endif() - -if (onnxruntime_BUILD_BENCHMARKS) - find_package(benchmark CONFIG REQUIRED) # benchmark::benchmark benchmark::benchmark_main -endif() - -# Flatbuffers -find_package(flatbuffers CONFIG REQUIRED) # flatbuffers::flatbuffers -list(APPEND onnxruntime_EXTERNAL_DEPENDENCIES flatbuffers::flatbuffers) -list(APPEND onnxruntime_EXTERNAL_LIBRARIES flatbuffers::flatbuffers) - -find_package(Protobuf CONFIG REQUIRED) # protobuf::libprotobuf protobuf::libprotobuf-lite -if (onnxruntime_USE_FULL_PROTOBUF) - set(PROTOBUF_LIB protobuf::libprotobuf) -else() - set(PROTOBUF_LIB protobuf::libprotobuf-lite) -endif() -list(APPEND onnxruntime_EXTERNAL_LIBRARIES ${PROTOBUF_LIB}) - -if(NOT DEFINED Protobuf_PROTOC_EXECUTABLE) - find_program(Protobuf_PROTOC_EXECUTABLE NAMES protoc REQUIRED) -endif() -get_filename_component(ONNX_CUSTOM_PROTOC_EXECUTABLE "${Protobuf_PROTOC_EXECUTABLE}" ABSOLUTE) -include(external/protobuf_function.cmake) - -find_package(date CONFIG REQUIRED) -list(APPEND onnxruntime_EXTERNAL_LIBRARIES date::date) - -# see Hints of FindBoost.cmake -find_path(BOOST_INCLUDEDIR "boost/mp11.hpp" REQUIRED) -find_package(Boost REQUIRED) -add_library(Boost::mp11 ALIAS Boost::headers) -list(APPEND onnxruntime_EXTERNAL_LIBRARIES Boost::mp11) - -find_package(nlohmann_json CONFIG REQUIRED) -list(APPEND onnxruntime_EXTERNAL_LIBRARIES nlohmann_json::nlohmann_json) - -if (onnxruntime_ENABLE_CPUINFO) - find_package(cpuinfo CONFIG REQUIRED) - list(APPEND onnxruntime_EXTERNAL_LIBRARIES cpuinfo::cpuinfo) -endif() - -if (NOT WIN32) - find_library(NSYNC_CPP_LIBRARY NAMES nsync_cpp REQUIRED) - add_library(nsync_cpp INTERFACE IMPORTED GLOBAL) - set_target_properties(nsync_cpp PROPERTIES INTERFACE_LINK_LIBRARIES "${NSYNC_CPP_LIBRARY}") - add_library(nsync::nsync_cpp ALIAS nsync_cpp) - list(APPEND onnxruntime_EXTERNAL_LIBRARIES nsync::nsync_cpp) -endif() - -find_package(Microsoft.GSL CONFIG REQUIRED) -list(APPEND onnxruntime_EXTERNAL_LIBRARIES Microsoft.GSL::GSL) -set(GSL_TARGET Microsoft.GSL::GSL) # see onnxruntime_mlas - -# ONNX -find_package(ONNX CONFIG REQUIRED) -if(TARGET ONNX::onnx AND NOT TARGET onnx) - add_library(onnx ALIAS ONNX::onnx) -endif() -if(TARGET ONNX::onnx_proto AND NOT TARGET onnx_proto) - add_library(onnx_proto ALIAS ONNX::onnx_proto) -endif() -list(APPEND onnxruntime_EXTERNAL_LIBRARIES onnx onnx_proto) - -find_package(Eigen3 CONFIG REQUIRED) -list(APPEND onnxruntime_EXTERNAL_LIBRARIES Eigen3::Eigen) -get_property(eigen_INCLUDE_DIRS TARGET Eigen3::Eigen PROPERTY INTERFACE_INCLUDE_DIRECTORIES) - -find_package(wil CONFIG REQUIRED) -list(APPEND onnxruntime_EXTERNAL_LIBRARIES WIL::WIL) - -find_path(SAFEINT_INCLUDE_DIRS "SafeInt.hpp" REQUIRED) -add_library(safeint_interface IMPORTED INTERFACE GLOBAL) -set_target_properties(safeint_interface PROPERTIES - INTERFACE_INCLUDE_DIRECTORIES "${SAFEINT_INCLUDE_DIRS}" -) - -# XNNPACK EP -if (onnxruntime_USE_XNNPACK) - if (onnxruntime_DISABLE_CONTRIB_OPS) - message(FATAL_ERROR "XNNPACK EP requires the internal NHWC contrib ops to be available " - "but onnxruntime_DISABLE_CONTRIB_OPS is ON") - endif() - find_package(cpuinfo CONFIG REQUIRED) - find_library(PTHREADPOOL_LIBRARY NAMES pthreadpool REQUIRED) - find_library(XNNPACK_LIBRARY NAMES XNNPACK REQUIRED) - list(APPEND onnxruntime_EXTERNAL_LIBRARIES cpuinfo::cpuinfo ${PTHREADPOOL_LIBRARY} ${XNNPACK_LIBRARY}) -endif() - -if (onnxruntime_USE_MIMALLOC) - add_compile_definitions(USE_MIMALLOC) - find_package(mimalloc CONFIG REQUIRED) - list(APPEND onnxruntime_EXTERNAL_LIBRARIES mimalloc) -endif() - -if(onnxruntime_ENABLE_ATEN) - message(STATUS "Aten fallback is enabled.") - find_package(dlpack CONFIG REQUIRED) - list(APPEND onnxruntime_EXTERNAL_LIBRARIES dlpack::dlpack) -endif() - -if(onnxruntime_ENABLE_TRAINING OR (onnxruntime_ENABLE_TRAINING_APIS AND onnxruntime_BUILD_UNIT_TESTS)) - find_package(cxxopts CONFIG REQUIRED) - list(APPEND onnxruntime_EXTERNAL_LIBRARIES cxxopts::cxxopts) -endif() - -if (onnxruntime_USE_CUDA) - find_package(CUDAToolkit REQUIRED) - include_directories(${CUDAToolkit_INCLUDE_DIRS}) - list(APPEND onnxruntime_LINK_DIRS ${CUDAToolkit_LIBRARY_DIR}) - set(CMAKE_CUDA_FLAGS "${CMAKE_CUDA_FLAGS} -diag-suppress 2803") - find_package(NvidiaCutlass CONFIG REQUIRED) - list(APPEND onnxruntime_EXTERNAL_LIBRARIES nvidia::cutlass::cutlass) -endif() - -if (onnxruntime_USE_OPENVINO) - find_package(OpenVINO REQUIRED) - # list(APPEND onnxruntime_EXTERNAL_LIBRARIES openvino::runtime) -endif() diff --git a/ports/onnxruntime/portfile.cmake b/ports/onnxruntime/portfile.cmake index 679a8d68..8fc35b6e 100644 --- a/ports/onnxruntime/portfile.cmake +++ b/ports/onnxruntime/portfile.cmake @@ -4,15 +4,17 @@ string(COMPARE EQUAL "${VCPKG_LIBRARY_LINKAGE}" "dynamic" BUILD_SHARED) vcpkg_from_github( OUT_SOURCE_PATH SOURCE_PATH REPO microsoft/onnxruntime - REF v1.18.0 - SHA512 2e1d724eda5635fc24f93966412c197c82ee933aaea4f4ce907b5f2ee7730c1e741f2ef4d50a2d54284fc7bd05bf104bd3c56fd4466525fcd70e63c07fbb2b16 + REF v1.18.1 + SHA512 192cb95e131d7a7796f29556355d0c9055c05723e1120e21155ed21e05301d862f2ba3fd613d8f9289b61577f64cc4b406db7bb25d1bd666b75c29a0f29cc9d8 PATCHES fix-cmake.patch + fix-cmake-cuda.patch + fix-cmake-training.patch fix-sources.patch - # fix-clang-cl-simd-compile.patch - fix-llvm-rc-unicode.patch + fix-clang-cl-simd-compile.patch ) -file(COPY "${CMAKE_CURRENT_LIST_DIR}/onnxruntime_vcpkg_deps.cmake" DESTINATION "${SOURCE_PATH}/cmake/external") +# https://github.com/microsoft/onnxruntime/pull/21348 +file(COPY "${CMAKE_CURRENT_LIST_DIR}/onnxruntime_external_deps.cmake" DESTINATION "${SOURCE_PATH}/cmake/external") find_program(PROTOC NAMES protoc PATHS "${CURRENT_HOST_INSTALLED_DIR}/tools/protobuf" @@ -26,18 +28,16 @@ find_program(FLATC NAMES flatc ) message(STATUS "Using flatc: ${FLATC}") +vcpkg_find_acquire_program(PYTHON3) +get_filename_component(PYTHON_PATH "${PYTHON3}" PATH) +message(STATUS "Using python3: ${PYTHON3}") +vcpkg_add_to_path(PREPEND "${PYTHON_PATH}") + vcpkg_execute_required_process( - COMMAND "${FLATC}" --cpp --scoped-enums --filename-suffix ".fbs" ort.fbs ort_training_checkpoint.fbs - LOGNAME codegen-flatc-cpp - WORKING_DIRECTORY "${SOURCE_PATH}/onnxruntime/core/flatbuffers/schema" + COMMAND "${PYTHON3}" onnxruntime/core/flatbuffers/schema/compile_schema.py --flatc "${FLATC}" + LOGNAME compile_schema + WORKING_DIRECTORY "${SOURCE_PATH}" ) -if("test" IN_LIST FEATURES) - vcpkg_execute_required_process( - COMMAND "${FLATC}" --cpp --scoped-enums --filename-suffix ".fbs" flatbuffers_utils_test.fbs - LOGNAME codegen-flatc-test-cpp - WORKING_DIRECTORY "${SOURCE_PATH}/onnxruntime/test/flatbuffers" - ) -endif() vcpkg_check_features(OUT_FEATURE_OPTIONS FEATURE_OPTIONS FEATURES @@ -46,6 +46,7 @@ vcpkg_check_features(OUT_FEATURE_OPTIONS FEATURE_OPTIONS training onnxruntime_ENABLE_TRAINING training onnxruntime_ENABLE_TRAINING_APIS # training onnxruntime_ENABLE_TRAINING_OPS + # training onnxruntime_ENABLE_TRAINING_TORCH_INTEROP cuda onnxruntime_USE_CUDA cuda onnxruntime_USE_CUDA_NHWC_OPS openvino onnxruntime_USE_OPENVINO @@ -72,6 +73,16 @@ vcpkg_check_features(OUT_FEATURE_OPTIONS FEATURE_OPTIONS cuda onnxruntime_USE_MEMORY_EFFICIENT_ATTENTION ) +if("training" IN_LIST FEATURES) + vcpkg_from_github( + OUT_SOURCE_PATH TENSORBOARD_SOURCE_PATH + REPO tensorflow/tensorboard + REF 2.16.2 + SHA512 0dc57928d55ebd46386d0f0852b3b4e9078222bd4378655abb16f6bc0e5ed2969600071d5d2ae9a3f2aa6bb327fe567869a01a69fdda35c261dc44a1eadd18ce + ) + list(APPEND FEATURE_OPTIONS "-DTENSORBOARD_ROOT:PATH=${TENSORBOARD_SOURCE_PATH}") +endif() + if(VCPKG_TARGET_IS_WINDOWS OR VCPKG_TARGET_IS_UWP) set(GENERATOR_OPTIONS WINDOWS_USE_MSBUILD) if("cuda" IN_LIST FEATURES) @@ -81,11 +92,6 @@ elseif(VCPKG_TARGET_IS_OSX OR VCPKG_TARGET_IS_IOS) set(GENERATOR_OPTIONS GENERATOR Xcode) endif() -vcpkg_find_acquire_program(PYTHON3) -get_filename_component(PYTHON_PATH "${PYTHON3}" PATH) -message(STATUS "Using python3: ${PYTHON3}") -vcpkg_add_to_path(PREPEND "${PYTHON_PATH}") - # see tools/ci_build/build.py vcpkg_cmake_configure( SOURCE_PATH "${SOURCE_PATH}/cmake" @@ -94,14 +100,14 @@ vcpkg_cmake_configure( ${FEATURE_OPTIONS} -DPython_EXECUTABLE:FILEPATH=${PYTHON3} -DProtobuf_PROTOC_EXECUTABLE:FILEPATH=${PROTOC} - # -DProtobuf_USE_STATIC_LIBS=OFF + -DONNX_CUSTOM_PROTOC_EXECUTABLE:FILEPATH=${PROTOC} -DBUILD_PKGCONFIG_FILES=ON -Donnxruntime_BUILD_SHARED_LIB=${BUILD_SHARED} -Donnxruntime_BUILD_WEBASSEMBLY=OFF -Donnxruntime_CROSS_COMPILING=${VCPKG_CROSSCOMPILING} - -Donnxruntime_USE_FULL_PROTOBUF=ON -Donnxruntime_USE_EXTENSIONS=OFF -Donnxruntime_USE_NNAPI_BUILTIN=${VCPKG_TARGET_IS_ANDROID} + -Donnxruntime_USE_VCPKG=ON -Donnxruntime_ENABLE_CPUINFO=ON -Donnxruntime_ENABLE_MICROSOFT_INTERNAL=OFF -Donnxruntime_ENABLE_BITCODE=${VCPKG_TARGET_IS_IOS} @@ -114,8 +120,9 @@ vcpkg_cmake_configure( -Donnxruntime_USE_NEURAL_SPEED=OFF -DUSE_NEURAL_SPEED=OFF # for ORT_BUILD_INFO - -DORT_GIT_COMMIT:STRING="45737400a2f3015c11f005ed7603611eaed306a6" - -DORT_GIT_BRANCH:STRING="v1.18.0" + -DORT_GIT_COMMIT:STRING=387127404e6c1d84b3468c387d864877ed1c67fe + -DORT_GIT_BRANCH:STRING=v1.18.1 + --compile-no-warning-as-error OPTIONS_DEBUG -Donnxruntime_ENABLE_MEMLEAK_CHECKER=OFF -Donnxruntime_ENABLE_MEMORY_PROFILE=OFF @@ -129,6 +136,9 @@ vcpkg_cmake_configure( if("cuda" IN_LIST FEATURES) vcpkg_cmake_build(TARGET onnxruntime_providers_cuda LOGFILE_BASE build-cuda) endif() +if("training" IN_LIST FEATURES) + vcpkg_cmake_build(TARGET tensorboard LOGFILE_BASE build-tensorboard) +endif() vcpkg_cmake_install() vcpkg_cmake_config_fixup(CONFIG_PATH lib/cmake/onnxruntime PACKAGE_NAME onnxruntime) vcpkg_copy_pdbs() diff --git a/ports/onnxruntime/vcpkg.json b/ports/onnxruntime/vcpkg.json index 04bf962f..cb2ae64f 100644 --- a/ports/onnxruntime/vcpkg.json +++ b/ports/onnxruntime/vcpkg.json @@ -1,7 +1,6 @@ { "name": "onnxruntime", - "version-semver": "1.18.0", - "port-version": 1, + "version-semver": "1.18.1", "description": "ONNX Runtime: cross-platform, high performance ML inferencing and training accelerator", "homepage": "https://onnxruntime.ai/", "license": "MIT", @@ -60,6 +59,7 @@ }, "re2", "safeint", + "utf8-range", { "name": "vcpkg-cmake", "host": true @@ -89,6 +89,13 @@ "benchmark", "gtest" ] + }, + "training": { + "description": "Enable full training functionality. Includes ORTModule and ORT Training APIs", + "dependencies": [ + "cxxopts", + "dlpack" + ] } } } diff --git a/test/azure-port-arm64-uwp.txt b/test/azure-port-arm64-uwp.txt index 4fc5abae..96602b69 100644 --- a/test/azure-port-arm64-uwp.txt +++ b/test/azure-port-arm64-uwp.txt @@ -1,2 +1,3 @@ tensorflow-lite abseil +onnx[disable-static-registration] diff --git a/test/azure-port-arm64-windows.txt b/test/azure-port-arm64-windows.txt index c1b1301a..56c98347 100644 --- a/test/azure-port-arm64-windows.txt +++ b/test/azure-port-arm64-windows.txt @@ -1,3 +1,5 @@ libdispatch tensorflow-lite abseil +onnx[disable-static-registration] +onnxruntime[training] diff --git a/test/azure-port-linux.txt b/test/azure-port-linux.txt index 336cb593..1939b6d1 100644 --- a/test/azure-port-linux.txt +++ b/test/azure-port-linux.txt @@ -1,3 +1,4 @@ tensorflow-lite[gpu] -onnxruntime +onnx[disable-static-registration] +onnxruntime[training] abseil diff --git a/test/self-hosted.json b/test/self-hosted.json index b040438b..640aafa5 100644 --- a/test/self-hosted.json +++ b/test/self-hosted.json @@ -1,7 +1,7 @@ { "$schema": "https://raw.githubusercontent.com/microsoft/vcpkg-tool/main/docs/vcpkg.schema.json", "name": "test", - "version-date": "2024-05-25", + "version-date": "2024-08-08", "description": "vcpkg registry maintained by @luncliff", "homepage": "https://github.com/luncliff/vcpkg-registry", "supports": "windows", @@ -24,14 +24,11 @@ { "name": "onnxruntime", "features": [ - "test" + "test", + "training" ], "platform": "windows" }, - { - "name": "openjdk", - "platform": "x64 & windows" - }, { "name": "winpixeventruntime", "platform": "x64 & windows" @@ -55,7 +52,13 @@ "nvidia-tools-extension-sdk", "nvidia-triton-client", "nvidia-triton-common", - "nvidia-triton-core" + "nvidia-triton-core", + { + "name": "onnxruntime", + "features": [ + "cuda" + ] + } ] } } diff --git a/versions/baseline.json b/versions/baseline.json index 91ced106..75184e12 100644 --- a/versions/baseline.json +++ b/versions/baseline.json @@ -137,8 +137,8 @@ "port-version": 0 }, "onnxruntime": { - "baseline": "1.18.0", - "port-version": 1 + "baseline": "1.18.1", + "port-version": 0 }, "opencl": { "baseline": "v2024.05.08", diff --git a/versions/o-/onnxruntime.json b/versions/o-/onnxruntime.json index 4a653ed1..cf70f771 100644 --- a/versions/o-/onnxruntime.json +++ b/versions/o-/onnxruntime.json @@ -1,5 +1,10 @@ { "versions": [ + { + "git-tree": "afebd79a5253d8547428a61094a2a39e4b2f0a9a", + "version-semver": "1.18.1", + "port-version": 0 + }, { "git-tree": "6ff6836fc7e0eb8a5321ed62fe1b630647c21dc1", "version-semver": "1.18.0",