Skip to content

Commit cc21215

Browse files
authored
Bump TensorRT-LLM backend dependency to v0.16.0 (#2931)
* backend(trtllm): update to 0.16.0
* backend(trtllm): do not use shallow clone
* backend(trtllm): use tag instead
* backend(trtllm): move to nvidia remote instead of hf
* backend(trtllm): reenable shallow clone
* backend(trtllm): attempt to use ADD instead of RUN for openmpi
* backend(trtllm): make sure we are using correct path for openmpi ADD in dockerfile
* backend(trtllm): add and correctly untar it
1 parent 1dd3466 commit cc21215

File tree

3 files changed

+11
-9
lines changed

3 files changed

+11
-9
lines changed

Dockerfile_trtllm

Lines changed: 7 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
ARG cuda_arch_list="75-real;80-real;86-real;89-real;90-real"
2-
ARG ompi_version="4.1.7rc1"
2+
ARG ompi_version="4.1.7"
33
ARG build_type=release
44
ARG is_gha_build=false
55

@@ -37,10 +37,12 @@ FROM cuda-builder AS mpi-builder
3737
ARG ompi_version
3838

3939
ENV OMPI_TARBALL_FILENAME="openmpi-$ompi_version.tar.bz2"
40-
RUN wget "https://download.open-mpi.org/release/open-mpi/v4.1/$OMPI_TARBALL_FILENAME" -P /opt/src && \
41-
mkdir /usr/src/mpi && \
42-
tar -xf "/opt/src/$OMPI_TARBALL_FILENAME" -C /usr/src/mpi --strip-components=1 && \
43-
cd /usr/src/mpi && \
40+
ADD --checksum=sha256:54a33cb7ad81ff0976f15a6cc8003c3922f0f3d8ceed14e1813ef3603f22cd34 \
41+
https://download.open-mpi.org/release/open-mpi/v4.1/$OMPI_TARBALL_FILENAME \
42+
/opt/src/mpi/
43+
44+
WORKDIR /opt/src/mpi
45+
RUN tar --strip-components=1 -xf $OMPI_TARBALL_FILENAME &&\
4446
./configure --prefix=/usr/local/mpi --with-cuda=/usr/local/cuda --with-slurm && \
4547
make -j all && \
4648
make install && \

backends/trtllm/cmake/trtllm.cmake

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -27,8 +27,8 @@ find_package(Python3 REQUIRED Interpreter)
2727

2828
fetchcontent_declare(
2929
trtllm
30-
GIT_REPOSITORY https://github.com/huggingface/TensorRT-LLM.git
31-
GIT_TAG 1bb9ca4688805444f203647674bac1d7219d0579
30+
GIT_REPOSITORY https://github.com/nvidia/TensorRT-LLM.git
31+
GIT_TAG v0.16.0
3232
GIT_SHALLOW ON
3333
DOWNLOAD_EXTRACT_TIMESTAMP
3434
)

backends/trtllm/scripts/install_tensorrt.sh

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -2,8 +2,8 @@
22

33
set -ex
44

5-
TRT_VER_BASE="10.6.0"
6-
TRT_VER_FULL="${TRT_VER_BASE}.26"
5+
TRT_VER_BASE="10.7.0"
6+
TRT_VER_FULL="${TRT_VER_BASE}.23"
77
CUDA_VER="12.6"
88
CUDNN_VER="9.5.0.50-1"
99
NCCL_VER="2.22.3-1+cuda12.6"

0 commit comments

Comments
 (0)