Skip to content

Commit 9f60afe

Browse files
authored
Update Dockerfile to enable CUDA 13 (#820) (#821)
* Change target commit. * Update Dockerfile * git: Update submodule. * docker: Update base container image * Update dockerfile versions * Removing line as unused * Update submodule commit reference. * Update Dockerfile
1 parent 06795f1 commit 9f60afe

File tree

2 files changed

+15
-25
lines changed

2 files changed

+15
-25
lines changed

dockerfile/Dockerfile.triton.trt_llm_backend

Lines changed: 14 additions & 24 deletions
Original file line numberDiff line numberDiff line change
@@ -1,34 +1,30 @@
1-
ARG BASE_IMAGE=nvcr.io/nvidia/tritonserver:25.06-py3-min
2-
ARG PYTORCH_IMAGE=nvcr.io/nvidia/pytorch:25.06-py3
3-
ARG NVRTC_VER=12.9.86-1
4-
ARG TRT_VER=10.11.0.33
5-
ARG NCCL_VER=2.27.5-1+cuda12.9
6-
ARG RELEASE_URL_TRT_x86=https://developer.nvidia.com/downloads/compute/machine-learning/tensorrt/10.11.0/tars/TensorRT-${TRT_VER}.Linux.x86_64-gnu.cuda-12.9.tar.gz
7-
ARG RELEASE_URL_TRT_ARM=https://developer.nvidia.com/downloads/compute/machine-learning/tensorrt/10.11.0/tars/TensorRT-${TRT_VER}.Linux.aarch64-gnu.cuda-12.9.tar.gz
1+
ARG BASE_IMAGE=nvcr.io/nvidia/tritonserver:25.10-py3-min
2+
ARG PYTORCH_IMAGE=nvcr.io/nvidia/pytorch:25.10-py3
3+
ARG NVRTC_VER=13.0.48-1
4+
ARG TRT_VER=10.13.3.9
5+
ARG NCCL_VER=2.27.7-1+cuda13.0
6+
ARG RELEASE_URL_TRT_x86=https://developer.nvidia.com/downloads/compute/machine-learning/tensorrt/10.13.3/tars/TensorRT-${TRT_VER}.Linux.x86_64-gnu.cuda-13.0.tar.gz
7+
ARG RELEASE_URL_TRT_ARM=https://developer.nvidia.com/downloads/compute/machine-learning/tensorrt/10.13.3/tars/TensorRT-${TRT_VER}.Linux.aarch64-gnu.cuda-13.0.tar.gz
88

99
# Versions of packages to copy from pytorch image
10-
ARG TORCH_VER=2.8.0a0+5228986c39.nv25.6
11-
ARG TORCHVISION_VER=0.22.0a0+95f10a4e
12-
ARG SETUPTOOLS_VER=78.1.1
13-
ARG PYTORCH_TRITON_VER=3.3.0+git96316ce52.nvinternal
14-
ARG JINJA2_VER=3.1.6
10+
ARG FLASH_ATTN_VER=2.7.4.post1+25.10
1511
ARG NETWORKX_VER=3.5
12+
ARG PACKAGING_VER=25.0
13+
ARG PYTORCH_TRITON_VER=3.4.0+gitc817b9b6
14+
ARG SETUPTOOLS_VER=79.0.1
1615
ARG SYMPY_VER=1.14.0
17-
ARG PACKAGING_VER=23.2
18-
ARG FLASH_ATTN_VER=2.7.4.post1
16+
ARG TORCH_VER=2.9.0a0+145a3a7bda.nv25.10
17+
ARG TORCHVISION_VER=0.24.0a0+094e7af5
1918

2019
ARG TENSORRTLLM_REPO=https://github.com/NVIDIA/TensorRT-LLM.git
2120
ARG TENSORRTLLM_REPO_TAG=release/1.0
22-
ARG TENSORRTLLM_VER=1.0.0
21+
ARG TENSORRTLLM_VER=1.2.0rc2
2322

2423
FROM ${PYTORCH_IMAGE} AS pytorch_image
2524
FROM ${BASE_IMAGE} AS install_dependencies
2625

2726
WORKDIR /workspace
2827

29-
# Might not need to copy cusparseLt in the future once it's included in DLFW cuda container
30-
COPY --from=pytorch_image /usr/local/cuda/lib64/libcusparseLt* /usr/local/cuda/lib64/
31-
3228
ENV PIP_BREAK_SYSTEM_PACKAGES=1
3329
RUN apt-get update -q=2 \
3430
&& apt-get install -y --no-install-recommends \
@@ -103,7 +99,6 @@ ARG TORCH_VER
10399
ARG TORCHVISION_VER
104100
ARG SETUPTOOLS_VER
105101
ARG PYTORCH_TRITON_VER
106-
ARG JINJA2_VER
107102
ARG NETWORKX_VER
108103
ARG SYMPY_VER
109104
ARG PACKAGING_VER
@@ -121,8 +116,6 @@ COPY --from=pytorch_image /usr/local/lib/python3.12/dist-packages/setuptools-${S
121116
COPY --from=pytorch_image /usr/local/lib/python3.12/dist-packages/functorch /usr/local/lib/python3.12/dist-packages/functorch
122117
COPY --from=pytorch_image /usr/local/lib/python3.12/dist-packages/pytorch_triton-${PYTORCH_TRITON_VER}.dist-info /usr/local/lib/python3.12/dist-packages/pytorch_triton-${PYTORCH_TRITON_VER}.dist-info
123118
COPY --from=pytorch_image /usr/local/lib/python3.12/dist-packages/triton /usr/local/lib/python3.12/dist-packages/triton
124-
COPY --from=pytorch_image /usr/local/lib/python3.12/dist-packages/jinja2 /usr/local/lib/python3.12/dist-packages/jinja2
125-
COPY --from=pytorch_image /usr/local/lib/python3.12/dist-packages/jinja2-${JINJA2_VER}.dist-info /usr/local/lib/python3.12/dist-packages/jinja2-${JINJA2_VER}.dist-info
126119
COPY --from=pytorch_image /usr/local/lib/python3.12/dist-packages/networkx /usr/local/lib/python3.12/dist-packages/networkx
127120
COPY --from=pytorch_image /usr/local/lib/python3.12/dist-packages/networkx-${NETWORKX_VER}.dist-info /usr/local/lib/python3.12/dist-packages/networkx-${NETWORKX_VER}.dist-info
128121
COPY --from=pytorch_image /usr/local/lib/python3.12/dist-packages/sympy /usr/local/lib/python3.12/dist-packages/sympy
@@ -133,9 +126,6 @@ COPY --from=pytorch_image /usr/local/lib/python3.12/dist-packages/flash_attn /us
133126
COPY --from=pytorch_image /usr/local/lib/python3.12/dist-packages/flash_attn-${FLASH_ATTN_VER}.dist-info /usr/local/lib/python3.12/dist-packages/flash_attn-${FLASH_ATTN_VER}.dist-info
134127
COPY --from=pytorch_image /usr/local/lib/python3.12/dist-packages/flash_attn_2_cuda.cpython-312-*-linux-gnu.so /usr/local/lib/python3.12/dist-packages/
135128

136-
# Might not need to copy cusparseLt in the future once it's included in DLFW cuda container
137-
COPY --from=pytorch_image /usr/local/cuda/lib64/libcusparseLt* /usr/local/cuda/lib64/
138-
139129
ARG NVRTC_VER
140130
ARG NCCL_VER
141131
ENV CUDA_VER=$CUDA_VERSION \

tensorrt_llm

Submodule tensorrt_llm updated 6387 files

0 commit comments

Comments
 (0)