Skip to content

Commit 19f37d7

Browse files
adrianlizarraga, zhaoxul-qti, 1duo, HectorSVC, chenweng-quic
authored
rel-1.22.2 cherry-pick 1 (#25633)
### Description

- #24265
- #24616
- #24640
- #24707
- #24646
- #24750
- #24809
- #24895
- #24820
- #25002
- #25171
- #25283
- #24818
- #25351
- #25361
- #25388
- #25520
- #25158

### Motivation and Context

<!-- - Why is this change required? What problem does it solve?
- If it fixes an open issue, please link to the issue here. -->

---------

Co-authored-by: quic-zhaoxul <[email protected]>
Co-authored-by: Yuduo Wu <[email protected]>
Co-authored-by: Hector Li <[email protected]>
Co-authored-by: chenweng-quic <[email protected]>
Co-authored-by: qti-yuduo <[email protected]>
Co-authored-by: Akupadhye <[email protected]>
Co-authored-by: Jeff Kilpatrick <[email protected]>
Co-authored-by: Jeff Kilpatrick <[email protected]>
Co-authored-by: George Wu <[email protected]>
Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com>
Co-authored-by: quic-calvnguy <[email protected]>
Co-authored-by: Changming Sun <[email protected]>
Co-authored-by: Yulong Wang <[email protected]>
1 parent 89746dc commit 19f37d7

File tree

118 files changed

+4928
-347
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

118 files changed

+4928
-347
lines changed

.github/workflows/linux_cuda_ci.yml

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -28,7 +28,7 @@ jobs:
2828
dockerfile_path: tools/ci_build/github/linux/docker/Dockerfile.manylinux2_28_cuda
2929
docker_build_args: '--build-arg BASEIMAGE=onnxruntimebuildcache.azurecr.io/internal/azureml/onnxruntime/build/cuda12_x64_ubi8_gcc12:20250124.1'
3030
docker_image_repo: onnxruntimecuda12manylinuxbuild
31-
extra_build_flags: '--use_binskim_compliant_compile_flags --build_wheel --cuda_version=12.2 --cuda_home=/usr/local/cuda-12.2 --cudnn_home=/usr/local/cuda-12.2 --enable_cuda_profiling --build_java --cmake_extra_defines CMAKE_CUDA_ARCHITECTURES=80 onnxruntime_BUILD_UNIT_TESTS=ON onnxruntime_ENABLE_CUDA_EP_INTERNAL_TESTS=ON'
31+
extra_build_flags: '--use_binskim_compliant_compile_flags --build_wheel --cuda_version=12.2 --cuda_home=/usr/local/cuda-12.2 --cudnn_home=/usr/local/cuda-12.2 --enable_cuda_profiling --build_java --cmake_extra_defines CMAKE_CUDA_ARCHITECTURES=90 onnxruntime_BUILD_UNIT_TESTS=ON onnxruntime_ENABLE_CUDA_EP_INTERNAL_TESTS=ON'
3232
python_path_prefix: 'PATH=/opt/python/cp310-cp310/bin:$PATH'
3333
run_tests: false # <<< Do not run tests in this job
3434
upload_build_output: true # <<< Upload the build/Release directory
@@ -41,7 +41,7 @@ jobs:
4141
needs: build-linux-cuda-x64-release
4242
runs-on:
4343
- self-hosted
44-
- "1ES.Pool=Onnxruntime-github-Linux-GPU-A100-WUS3"
44+
- "1ES.Pool=Onnxruntime-github-Linux-GPU-H100"
4545
permissions:
4646
contents: read
4747
packages: read
@@ -98,5 +98,5 @@ jobs:
9898
build_config: Release
9999
mode: 'test' # Set mode to test
100100
execution_providers: 'cuda'
101-
extra_build_flags: '--use_binskim_compliant_compile_flags --cuda_version=12.2 --cuda_home=/usr/local/cuda-12.2 --cudnn_home=/usr/local/cuda-12.2 --enable_cuda_profiling --cmake_extra_defines CMAKE_CUDA_ARCHITECTURES=80 onnxruntime_BUILD_UNIT_TESTS=ON onnxruntime_ENABLE_CUDA_EP_INTERNAL_TESTS=ON'
101+
extra_build_flags: '--use_binskim_compliant_compile_flags --cuda_version=12.2 --cuda_home=/usr/local/cuda-12.2 --cudnn_home=/usr/local/cuda-12.2 --enable_cuda_profiling --cmake_extra_defines CMAKE_CUDA_ARCHITECTURES=90 onnxruntime_BUILD_UNIT_TESTS=ON onnxruntime_ENABLE_CUDA_EP_INTERNAL_TESTS=ON'
102102
python_path_prefix: 'PATH=/opt/python/cp310-cp310/bin:$PATH'

.github/workflows/linux_tensorrt_ci.yml

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -28,7 +28,7 @@ jobs:
2828
dockerfile_path: tools/ci_build/github/linux/docker/Dockerfile.manylinux2_28_cuda
2929
docker_build_args: '--build-arg BASEIMAGE=onnxruntimebuildcache.azurecr.io/internal/azureml/onnxruntime/build/cuda12_x64_ubi8_gcc12:20250124.1 --build-arg TRT_VERSION=10.9.0.34-1.cuda12.8 --network=host'
3030
docker_image_repo: onnxruntimetensorrt86gpubuild
31-
extra_build_flags: '--use_binskim_compliant_compile_flags --build_wheel --cuda_version=12.2 --cuda_home=/usr/local/cuda-12.2 --cudnn_home=/usr/local/cuda-12.2 --use_tensorrt --tensorrt_home /usr --build_java --cmake_extra_defines CMAKE_CUDA_ARCHITECTURES=80 onnxruntime_BUILD_UNIT_TESTS=ON onnxruntime_ENABLE_CUDA_EP_INTERNAL_TESTS=ON'
31+
extra_build_flags: '--use_binskim_compliant_compile_flags --build_wheel --cuda_version=12.2 --cuda_home=/usr/local/cuda-12.2 --cudnn_home=/usr/local/cuda-12.2 --use_tensorrt --tensorrt_home /usr --build_java --cmake_extra_defines CMAKE_CUDA_ARCHITECTURES=90 onnxruntime_BUILD_UNIT_TESTS=ON onnxruntime_ENABLE_CUDA_EP_INTERNAL_TESTS=ON'
3232
python_path_prefix: 'PATH=/opt/python/cp310-cp310/bin:$PATH'
3333
run_tests: false # <<< Do not run tests in this job
3434
upload_build_output: true # <<< Upload the build/Release directory
@@ -41,7 +41,7 @@ jobs:
4141
needs: build-linux-TensorRT-x64-release
4242
runs-on:
4343
- self-hosted
44-
- "1ES.Pool=Onnxruntime-github-Linux-GPU-A100-WUS3"
44+
- "1ES.Pool=Onnxruntime-github-Linux-GPU-H100"
4545
permissions:
4646
contents: read
4747
packages: read
@@ -100,5 +100,5 @@ jobs:
100100
build_config: Release
101101
mode: 'test' # Set mode to test
102102
execution_providers: 'cuda tensorrt'
103-
extra_build_flags: '--use_binskim_compliant_compile_flags --build_wheel --cuda_version=12.2 --cuda_home=/usr/local/cuda-12.2 --cudnn_home=/usr/local/cuda-12.2 --use_tensorrt --tensorrt_home /usr --build_java --cmake_extra_defines CMAKE_CUDA_ARCHITECTURES=80 onnxruntime_BUILD_UNIT_TESTS=ON onnxruntime_ENABLE_CUDA_EP_INTERNAL_TESTS=ON'
103+
extra_build_flags: '--use_binskim_compliant_compile_flags --build_wheel --cuda_version=12.2 --cuda_home=/usr/local/cuda-12.2 --cudnn_home=/usr/local/cuda-12.2 --use_tensorrt --tensorrt_home /usr --build_java --cmake_extra_defines CMAKE_CUDA_ARCHITECTURES=90 onnxruntime_BUILD_UNIT_TESTS=ON onnxruntime_ENABLE_CUDA_EP_INTERNAL_TESTS=ON'
104104
python_path_prefix: 'PATH=/opt/python/cp310-cp310/bin:$PATH'

VERSION_NUMBER

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1 +1 @@
1-
1.22.1
1+
1.22.2

cgmanifests/cgmanifest.json

Lines changed: 1 addition & 11 deletions
Original file line numberDiff line numberDiff line change
@@ -36,7 +36,7 @@
3636
"component": {
3737
"type": "git",
3838
"git": {
39-
"commitHash": "bee4d1dd8dc1ee4a1fd8fa6a96476c2f8b7492a3",
39+
"commitHash": "5c210da409e7f1e51ddf445134a4376fdbd70d7d",
4040
"repositoryUrl": "https://github.com/dmlc/dlpack.git"
4141
}
4242
}
@@ -316,16 +316,6 @@
316316
"comments": "gtest-ios-framework"
317317
}
318318
},
319-
{
320-
"component": {
321-
"type": "git",
322-
"git": {
323-
"commitHash": "277508879878e0a5b5b43599b1bea11f66eb3c6c",
324-
"repositoryUrl": "https://github.com/dmlc/dlpack.git"
325-
},
326-
"comments": "dlpack"
327-
}
328-
},
329319
{
330320
"component": {
331321
"Type": "other",

cmake/CMakeLists.txt

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -150,6 +150,7 @@ option(onnxruntime_DISABLE_SPARSE_TENSORS "Disable sparse tensors data types" OF
150150
option(onnxruntime_DISABLE_OPTIONAL_TYPE "Disable optional type" OFF)
151151
option(onnxruntime_DISABLE_FLOAT8_TYPES "Disable float 8 types" OFF)
152152
option(onnxruntime_MINIMAL_BUILD "Exclude as much as possible from the build. Support ORT format models. No support for ONNX format models." OFF)
153+
option(onnxruntime_CLIENT_PACKAGE_BUILD "Enables default settings that are more appropriate for client/on-device workloads." OFF)
153154
cmake_dependent_option(onnxruntime_DISABLE_RTTI "Disable RTTI" ON "NOT onnxruntime_ENABLE_PYTHON;NOT onnxruntime_USE_CUDA" OFF)
154155
# For now onnxruntime_DISABLE_EXCEPTIONS will only work with onnxruntime_MINIMAL_BUILD, more changes (ONNX, non-CPU EP, ...) are required to run this standalone
155156
cmake_dependent_option(onnxruntime_DISABLE_EXCEPTIONS "Disable exception handling. Requires onnxruntime_MINIMAL_BUILD currently." ON "onnxruntime_MINIMAL_BUILD;NOT onnxruntime_ENABLE_PYTHON" OFF)

cmake/adjust_global_compile_flags.cmake

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -98,6 +98,11 @@ if (onnxruntime_MINIMAL_BUILD)
9898
endif()
9999
endif()
100100

101+
# ORT build with default settings more appropriate for client/on-device workloads.
102+
if (onnxruntime_CLIENT_PACKAGE_BUILD)
103+
add_compile_definitions(ORT_CLIENT_PACKAGE_BUILD)
104+
endif()
105+
101106
if (onnxruntime_ENABLE_LTO)
102107
include(CheckIPOSupported)
103108
check_ipo_supported(RESULT ipo_enabled OUTPUT ipo_output)

cmake/deps.txt

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -16,7 +16,7 @@ abseil_cpp;https://github.com/abseil/abseil-cpp/archive/refs/tags/20240722.0.zip
1616
coremltools;https://github.com/apple/coremltools/archive/refs/tags/7.1.zip;f1bab0f30966f2e217d8e01207d518f230a1641a
1717
cxxopts;https://github.com/jarro2783/cxxopts/archive/3c73d91c0b04e2b59462f0a741be8c07024c1bc0.zip;6c6ca7f8480b26c8d00476e0e24b7184717fe4f0
1818
date;https://github.com/HowardHinnant/date/archive/refs/tags/v3.0.1.zip;2dac0c81dc54ebdd8f8d073a75c053b04b56e159
19-
dlpack;https://github.com/dmlc/dlpack/archive/refs/tags/v0.6.zip;4d565dd2e5b31321e5549591d78aa7f377173445
19+
dlpack;https://github.com/dmlc/dlpack/archive/5c210da409e7f1e51ddf445134a4376fdbd70d7d.zip;e499c86e4e5c5268a87661d7ea39c27fae10907c
2020
# This Eigen commit id matches the eigen archive being consumed from https://gitlab.com/libeigen/eigen/-/archive/3.4/eigen-3.4.zip
2121
# prior to the 3.4.1 RC changing the bits and invalidating the hash.
2222
# it contains changes on top of 3.4.0 which are required to fix build issues.

cmake/onnxruntime_mlas.cmake

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -31,6 +31,7 @@ onnxruntime_add_static_library(onnxruntime_mlas
3131
${MLAS_SRC_DIR}/eltwise.cpp
3232
${MLAS_SRC_DIR}/erf.cpp
3333
${MLAS_SRC_DIR}/compute.cpp
34+
${MLAS_SRC_DIR}/dequantize.cpp
3435
${MLAS_SRC_DIR}/quantize.cpp
3536
${MLAS_SRC_DIR}/qgemm_kernel_default.cpp
3637
${MLAS_SRC_DIR}/qladd.cpp

cmake/onnxruntime_providers_qnn.cmake

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -66,10 +66,10 @@
6666
COMMAND ${CMAKE_COMMAND} -E copy ${QNN_LIB_FILES} $<TARGET_FILE_DIR:${onnxruntime_providers_qnn_target}>
6767
)
6868
endif()
69-
if (EXISTS "${onnxruntime_QNN_HOME}/Qualcomm AI Hub Proprietary License.pdf")
69+
if (EXISTS "${onnxruntime_QNN_HOME}/LICENSE.pdf")
7070
add_custom_command(
7171
TARGET ${onnxruntime_providers_qnn_target} POST_BUILD
72-
COMMAND ${CMAKE_COMMAND} -E copy "${onnxruntime_QNN_HOME}/Qualcomm AI Hub Proprietary License.pdf" $<TARGET_FILE_DIR:${onnxruntime_providers_qnn_target}>
72+
COMMAND ${CMAKE_COMMAND} -E copy "${onnxruntime_QNN_HOME}/LICENSE.pdf" $<TARGET_FILE_DIR:${onnxruntime_providers_qnn_target}>/Qualcomm_LICENSE.pdf
7373
)
7474
endif()
7575
else()
@@ -154,10 +154,10 @@
154154
COMMAND ${CMAKE_COMMAND} -E copy ${QNN_LIB_FILES} $<TARGET_FILE_DIR:${onnxruntime_providers_qnn_target}>
155155
)
156156
endif()
157-
if (EXISTS "${onnxruntime_QNN_HOME}/Qualcomm AI Hub Proprietary License.pdf")
157+
if (EXISTS "${onnxruntime_QNN_HOME}/LICENSE.pdf")
158158
add_custom_command(
159159
TARGET ${onnxruntime_providers_qnn_target} POST_BUILD
160-
COMMAND ${CMAKE_COMMAND} -E copy "${onnxruntime_QNN_HOME}/Qualcomm AI Hub Proprietary License.pdf" $<TARGET_FILE_DIR:${onnxruntime_providers_qnn_target}>
160+
COMMAND ${CMAKE_COMMAND} -E copy "${onnxruntime_QNN_HOME}/LICENSE.pdf" $<TARGET_FILE_DIR:${onnxruntime_providers_qnn_target}>/Qualcomm_LICENSE.pdf
161161
)
162162
endif()
163163
endif()

cmake/onnxruntime_python.cmake

Lines changed: 2 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -1050,18 +1050,10 @@ if (onnxruntime_USE_QNN)
10501050
${QNN_LIB_FILES}
10511051
$<TARGET_FILE_DIR:${build_output_target}>/onnxruntime/capi/
10521052
)
1053-
add_custom_command(
1054-
TARGET onnxruntime_pybind11_state POST_BUILD
1055-
COMMAND ${CMAKE_COMMAND} -E copy
1056-
$<TARGET_FILE:ep_weight_sharing_ctx_gen>
1057-
$<TARGET_FILE_DIR:${build_output_target}>/onnxruntime/capi/
1058-
)
1059-
if (EXISTS "${onnxruntime_QNN_HOME}/Qualcomm AI Hub Proprietary License.pdf")
1053+
if (EXISTS "${onnxruntime_QNN_HOME}/LICENSE.pdf")
10601054
add_custom_command(
10611055
TARGET onnxruntime_pybind11_state POST_BUILD
1062-
COMMAND ${CMAKE_COMMAND} -E copy
1063-
"${onnxruntime_QNN_HOME}/Qualcomm AI Hub Proprietary License.pdf"
1064-
$<TARGET_FILE_DIR:${build_output_target}>/onnxruntime/
1056+
COMMAND ${CMAKE_COMMAND} -E copy "${onnxruntime_QNN_HOME}/LICENSE.pdf" $<TARGET_FILE_DIR:${build_output_target}>/onnxruntime/Qualcomm_LICENSE.pdf
10651057
)
10661058
endif()
10671059
endif()

0 commit comments

Comments
 (0)