@@ -26,17 +26,17 @@ jobs:
2626 build_config : Release
2727 architecture : x64
2828 dockerfile_path : tools/ci_build/github/linux/docker/Dockerfile.manylinux2_28_cuda
29- docker_build_args : ' --build-arg BASEIMAGE=onnxruntimebuildcache.azurecr.io/internal/azureml/onnxruntime/build/cuda12_x64_almalinux8_gcc14:20251017 .1'
30- docker_image_repo : onnxruntimecuda12manylinuxbuild
29+ docker_build_args : ' --build-arg BASEIMAGE=onnxruntimebuildcache.azurecr.io/internal/azureml/onnxruntime/build/cuda13_x64_almalinux8_gcc14:20251107 .1'
30+ docker_image_repo : onnxruntimecuda13manylinuxbuild
3131 extra_build_flags : >-
3232 --use_binskim_compliant_compile_flags
3333 --build_wheel
3434 --parallel
3535 --nvcc_threads 4
3636 --flash_nvcc_threads 4
37- --cuda_version=12.8
38- --cuda_home=/usr/local/cuda-12.8
39- --cudnn_home=/usr/local/cuda-12.8
37+ --cuda_version=13.0
38+ --cuda_home=/usr/local/cuda-13.0
39+ --cudnn_home=/usr/local/cuda-13.0
4040 --enable_cuda_profiling
4141 --cmake_extra_defines CMAKE_CUDA_ARCHITECTURES=86
4242 --cmake_extra_defines onnxruntime_QUICK_BUILD=ON
6767 id : build_docker_image_step
6868 with :
6969 dockerfile : ${{ github.workspace }}/tools/ci_build/github/linux/docker/Dockerfile.manylinux2_28_cuda
70- image-name : ghcr.io/microsoft/onnxruntime/onnxruntimecuda12manylinuxbuild
71- build-args : ' --build-arg BASEIMAGE=onnxruntimebuildcache.azurecr.io/internal/azureml/onnxruntime/build/cuda12_x64_almalinux8_gcc14:20251017 .1'
70+ image-name : ghcr.io/microsoft/onnxruntime/onnxruntimecuda13manylinuxbuild
71+ build-args : ' --build-arg BASEIMAGE=onnxruntimebuildcache.azurecr.io/internal/azureml/onnxruntime/build/cuda13_x64_almalinux8_gcc14:20251107 .1'
7272 push : true
7373 azure-container-registry-name : onnxruntimebuildcache
7474 env :
@@ -100,6 +100,15 @@ jobs:
100100 echo "Warning: perms.txt not found in artifact."
101101 fi
102102
103+ # Verify the GPU is accessible inside Docker before running the full test suite.
104+ # If the NVIDIA Container Toolkit fails to expose the /dev/nvidia* devices,
105+ # the tests fail with "CUDA failure 100" (cudaErrorNoDevice: no CUDA-capable device is detected) and waste 10+ minutes.
106+ - name : Verify GPU access in Docker
107+ run : |
108+ docker run --rm --gpus all \
109+ "${{ steps.build_docker_image_step.outputs.full-image-name }}" \
110+ nvidia-smi
111+
103112 # --- Install the ORT wheel and run CUDA plugin EP tests ---
104113 - name : Run CUDA Plugin EP Python Tests
105114 run : |
@@ -111,6 +120,11 @@ jobs:
111120 bash -c "
112121 set -ex
113122 export PATH=/opt/python/cp312-cp312/bin:\$PATH
123+ # Ensure libcudart.so.13 can be found regardless of the host runner's NVIDIA Container Toolkit configuration.
124+ # The CUDA runtime library lives in the container image at /usr/local/cuda-13.0/lib64, but
125+ # LD_LIBRARY_PATH may not include that path when the runner's NVIDIA Container Toolkit only mounts the driver
126+ # libraries at /usr/local/nvidia/lib64.
127+ export LD_LIBRARY_PATH=/usr/local/cuda-13.0/lib64:\${LD_LIBRARY_PATH:-}
114128
115129 # Install the ORT wheel
116130 python -m pip install /build/Release/Release/dist/onnxruntime*.whl
0 commit comments