Skip to content

Commit a4940e9

Browse files
yuanjingx87Fridah-nvyiqingy0
authored
[None] infra:Update dependencies for DLFW 25.06 (#5967)
Signed-off-by: Yuanjing Xue <[email protected]> Signed-off-by: Frida Hou <[email protected]> Signed-off-by: yuanjingx87 <[email protected]> Co-authored-by: Fridah-nv <[email protected]> Co-authored-by: Yiqing Yan <[email protected]>
1 parent 714f82b commit a4940e9

File tree

19 files changed

+58
-58
lines changed

19 files changed

+58
-58
lines changed

.devcontainer/docker-compose.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
version: "3.9"
22
services:
33
tensorrt_llm-dev:
4-
image: urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:pytorch-25.05-py3-x86_64-ubuntu24.04-trt10.11.0.33-skip-tritondevel-202506271620-5539
4+
image: urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:pytorch-25.06-py3-x86_64-ubuntu24.04-trt10.11.0.33-skip-tritondevel-202507101256-9530
55
network_mode: host
66
ipc: host
77

README.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -7,7 +7,7 @@ TensorRT-LLM
77
[![Documentation](https://img.shields.io/badge/docs-latest-brightgreen.svg?style=flat)](https://nvidia.github.io/TensorRT-LLM/)
88
[![python](https://img.shields.io/badge/python-3.12-green)](https://www.python.org/downloads/release/python-3123/)
99
[![python](https://img.shields.io/badge/python-3.10-green)](https://www.python.org/downloads/release/python-31012/)
10-
[![cuda](https://img.shields.io/badge/cuda-12.9.0-green)](https://developer.nvidia.com/cuda-downloads)
10+
[![cuda](https://img.shields.io/badge/cuda-12.9.1-green)](https://developer.nvidia.com/cuda-downloads)
1111
[![trt](https://img.shields.io/badge/TRT-10.11.0-green)](https://developer.nvidia.com/tensorrt)
1212
[![version](https://img.shields.io/badge/release-0.21.0-green)](./tensorrt_llm/version.py)
1313
[![license](https://img.shields.io/badge/license-Apache%202-blue)](./LICENSE)

constraints.txt

Lines changed: 0 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -1,9 +0,0 @@
1-
# These vulnerabilities were inherited from the base image (pytorch:25.05-py3) and should be removed when the base image
2-
# is updated.
3-
4-
# WAR against https://github.com/advisories/GHSA-vqfr-h8mv-ghfj
5-
h11>=0.16.0
6-
# WAR against https://github.com/advisories/GHSA-7cx3-6m66-7c5m
7-
tornado>=6.5.0
8-
# WAR against https://github.com/advisories/GHSA-5rjg-fvgr-3xxf
9-
setuptools>=78.1.1

docker/Dockerfile.multi

Lines changed: 2 additions & 11 deletions
Original file line numberDiff line numberDiff line change
@@ -1,8 +1,8 @@
11
# Multi-stage Dockerfile
22
ARG BASE_IMAGE=nvcr.io/nvidia/pytorch
33
ARG TRITON_IMAGE=nvcr.io/nvidia/tritonserver
4-
ARG BASE_TAG=25.05-py3
5-
ARG TRITON_BASE_TAG=25.05-py3
4+
ARG BASE_TAG=25.06-py3
5+
ARG TRITON_BASE_TAG=25.06-py3
66
ARG DEVEL_IMAGE=devel
77

88
FROM ${BASE_IMAGE}:${BASE_TAG} AS base
@@ -76,15 +76,6 @@ RUN pip3 install opencv-python-headless --force-reinstall --no-deps --no-cache-d
7676
COPY docker/common/install_deep_ep.sh install_deep_ep.sh
7777
RUN bash ./install_deep_ep.sh && rm install_deep_ep.sh
7878

79-
# WARs against security issues inherited from pytorch:25.04
80-
# * https://github.com/advisories/GHSA-vqfr-h8mv-ghfj
81-
# * https://github.com/advisories/GHSA-7cx3-6m66-7c5m
82-
# * https://github.com/advisories/GHSA-5rjg-fvgr-3xxf
83-
RUN pip3 install --upgrade --no-cache-dir \
84-
"h11>=0.16" \
85-
"tornado>=6.5.0" \
86-
"setuptools>=78.1.1,<80"
87-
8879
FROM ${TRITON_IMAGE}:${TRITON_BASE_TAG} AS triton
8980

9081
FROM devel AS tritondevel

docker/Makefile

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -183,16 +183,16 @@ jenkins-aarch64_%: STAGE = tritondevel
183183
jenkins-rockylinux8_%: IMAGE_WITH_TAG = $(shell grep '^[[:space:]]*LLM_ROCKYLINUX8_PY312_DOCKER_IMAGE = ' ../jenkins/L0_MergeRequest.groovy | grep -o '".*"' | tr -d '"')
184184
jenkins-rockylinux8_%: STAGE = tritondevel
185185
jenkins-rockylinux8_%: BASE_IMAGE = nvidia/cuda
186-
jenkins-rockylinux8_%: BASE_TAG = 12.9.0-devel-rockylinux8
186+
jenkins-rockylinux8_%: BASE_TAG = 12.9.1-devel-rockylinux8
187187

188188
rockylinux8_%: STAGE = tritondevel
189189
rockylinux8_%: BASE_IMAGE = nvidia/cuda
190-
rockylinux8_%: BASE_TAG = 12.9.0-devel-rockylinux8
190+
rockylinux8_%: BASE_TAG = 12.9.1-devel-rockylinux8
191191

192192
# For x86_64 and aarch64
193193
ubuntu22_%: STAGE = tritondevel
194194
ubuntu22_%: BASE_IMAGE = nvidia/cuda
195-
ubuntu22_%: BASE_TAG = 12.9.0-devel-ubuntu22.04
195+
ubuntu22_%: BASE_TAG = 12.9.1-devel-ubuntu22.04
196196

197197
trtllm_%: STAGE = release
198198
trtllm_%: PUSH_TO_STAGING := 0

docker/common/install_cuda_toolkit.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,7 @@ set -ex
55
# This script is used for reinstalling CUDA on Rocky Linux 8 with the run file.
66
# CUDA version is usually aligned with the latest NGC CUDA image tag.
77
# Only use when public CUDA image is not ready.
8-
CUDA_VER="12.9.0_575.51.03"
8+
CUDA_VER="12.9.1_575.57.08"
99
CUDA_VER_SHORT="${CUDA_VER%_*}"
1010

1111
NVCC_VERSION_OUTPUT=$(nvcc --version)

docker/common/install_pytorch.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,7 @@ set -ex
44

55
# Use latest stable version from https://pypi.org/project/torch/#history
66
# and closest to the version specified in
7-
# https://docs.nvidia.com/deeplearning/frameworks/pytorch-release-notes/rel-25-05.html#rel-25-05
7+
# https://docs.nvidia.com/deeplearning/frameworks/pytorch-release-notes/rel-25-06.html#rel-25-06
88
TORCH_VERSION="2.7.1"
99
SYSTEM_ID=$(grep -oP '(?<=^ID=).+' /etc/os-release | tr -d '"')
1010

docker/common/install_tensorrt.sh

Lines changed: 8 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -5,20 +5,19 @@ set -ex
55
TRT_VER="10.11.0.33"
66
# Align with the pre-installed cuDNN / cuBLAS / NCCL versions from
77
# https://docs.nvidia.com/deeplearning/frameworks/pytorch-release-notes/rel-25-06.html#rel-25-06
8-
CUDA_VER="12.9" # 12.9.0
8+
CUDA_VER="12.9" # 12.9.1
99
# Keep the installation for cuDNN if users want to install PyTorch with source codes.
1010
# PyTorch 2.x can compile with cuDNN v9.
11-
CUDNN_VER="9.10.1.4-1"
12-
# NCCL version 2.26.x used in the NGC PyTorch 25.05 image but has a performance regression issue.
13-
# Use NCCL version 2.27.5 which has the fixes.
11+
CUDNN_VER="9.10.2.21-1"
12+
# PyTorch 25.06 uses NCCL 2.27.3. NCCL 2.27.5 resolves a perf regression issue.
13+
# Use NCCL version 2.27.5 instead.
1414
NCCL_VER="2.27.5-1+cuda12.9"
15-
# Use cuBLAS version 12.9.0.13 instead.
16-
CUBLAS_VER="12.9.0.13-1"
15+
CUBLAS_VER="12.9.1.4-1"
1716
# Align with the pre-installed CUDA / NVCC / NVRTC versions from
1817
# https://docs.nvidia.com/cuda/cuda-toolkit-release-notes/index.html
19-
NVRTC_VER="12.9.41-1"
20-
CUDA_RUNTIME="12.9.37-1"
21-
CUDA_DRIVER_VERSION="575.51.03-1.el8"
18+
NVRTC_VER="12.9.86-1"
19+
CUDA_RUNTIME="12.9.79-1"
20+
CUDA_DRIVER_VERSION="575.57.08-1.el8"
2221

2322
for i in "$@"; do
2423
case $i in

docs/source/reference/support-matrix.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -143,7 +143,7 @@ The following table shows the supported software for TensorRT-LLM.
143143
* -
144144
- Software Compatibility
145145
* - Container
146-
- [25.05](https://docs.nvidia.com/deeplearning/frameworks/support-matrix/index.html)
146+
- [25.06](https://docs.nvidia.com/deeplearning/frameworks/support-matrix/index.html)
147147
* - TensorRT
148148
- [10.11](https://docs.nvidia.com/deeplearning/tensorrt/release-notes/index.html)
149149
* - Precision

jenkins/L0_MergeRequest.groovy

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -28,10 +28,10 @@ UPLOAD_PATH = env.uploadPath ? env.uploadPath : "sw-tensorrt-generic/llm-artifac
2828
// Container configuration
2929
// available tags can be found in: https://urm.nvidia.com/artifactory/sw-tensorrt-docker/tensorrt-llm/
3030
// [base_image_name]-[arch]-[os](-[python_version])-[trt_version]-[torch_install_type]-[stage]-[date]-[mr_id]
31-
LLM_DOCKER_IMAGE = "urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:pytorch-25.05-py3-x86_64-ubuntu24.04-trt10.11.0.33-skip-tritondevel-202506271620-5539"
32-
LLM_SBSA_DOCKER_IMAGE = "urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:pytorch-25.05-py3-aarch64-ubuntu24.04-trt10.11.0.33-skip-tritondevel-202506271620-5539"
33-
LLM_ROCKYLINUX8_PY310_DOCKER_IMAGE = "urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:cuda-12.9.0-devel-rocky8-x86_64-rocky8-py310-trt10.11.0.33-skip-tritondevel-202506271620-5539"
34-
LLM_ROCKYLINUX8_PY312_DOCKER_IMAGE = "urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:cuda-12.9.0-devel-rocky8-x86_64-rocky8-py312-trt10.11.0.33-skip-tritondevel-202506271620-5539"
31+
LLM_DOCKER_IMAGE = "urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:pytorch-25.06-py3-x86_64-ubuntu24.04-trt10.11.0.33-skip-tritondevel-202507101256-9530"
32+
LLM_SBSA_DOCKER_IMAGE = "urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:pytorch-25.06-py3-aarch64-ubuntu24.04-trt10.11.0.33-skip-tritondevel-202507101256-9530"
33+
LLM_ROCKYLINUX8_PY310_DOCKER_IMAGE = "urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:cuda-12.9.1-devel-rocky8-x86_64-rocky8-py310-trt10.11.0.33-skip-tritondevel-202507101256-9530"
34+
LLM_ROCKYLINUX8_PY312_DOCKER_IMAGE = "urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:cuda-12.9.1-devel-rocky8-x86_64-rocky8-py312-trt10.11.0.33-skip-tritondevel-202507101256-9530"
3535

3636
// TODO: Move common variables to a unified location
3737
BUILD_CORES_REQUEST = "8"

0 commit comments

Comments
 (0)