Skip to content

Commit 0c55200

Browse files
committed
[Infra][TRTLLM-6224] - Upgrade dependencies to DLFW 25.06 and CUDA 12.9.1
Signed-off-by: Yiqing Yan <[email protected]>
1 parent 04fa6c0 commit 0c55200

File tree

10 files changed

+20
-30
lines changed

10 files changed

+20
-30
lines changed

README.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -7,7 +7,7 @@ TensorRT-LLM
77
[![Documentation](https://img.shields.io/badge/docs-latest-brightgreen.svg?style=flat)](https://nvidia.github.io/TensorRT-LLM/)
88
[![python](https://img.shields.io/badge/python-3.12-green)](https://www.python.org/downloads/release/python-3123/)
99
[![python](https://img.shields.io/badge/python-3.10-green)](https://www.python.org/downloads/release/python-31012/)
10-
[![cuda](https://img.shields.io/badge/cuda-12.9.0-green)](https://developer.nvidia.com/cuda-downloads)
10+
[![cuda](https://img.shields.io/badge/cuda-12.9.1-green)](https://developer.nvidia.com/cuda-downloads)
1111
[![trt](https://img.shields.io/badge/TRT-10.11.0-green)](https://developer.nvidia.com/tensorrt)
1212
[![version](https://img.shields.io/badge/release-1.0.0rc1-green)](./tensorrt_llm/version.py)
1313
[![license](https://img.shields.io/badge/license-Apache%202-blue)](./LICENSE)

constraints.txt

Lines changed: 0 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -1,9 +0,0 @@
1-
# These vulnerabilities were inherited from the base image (pytorch:25.05-py3) and should be removed when the base image
2-
# is updated.
3-
4-
# WAR against https://github.com/advisories/GHSA-vqfr-h8mv-ghfj
5-
h11>=0.16.0
6-
# WAR against https://github.com/advisories/GHSA-7cx3-6m66-7c5m
7-
tornado>=6.5.0
8-
# WAR against https://github.com/advisories/GHSA-5rjg-fvgr-3xxf
9-
setuptools>=78.1.1

docker/Dockerfile.multi

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,8 +1,8 @@
11
# Multi-stage Dockerfile
22
ARG BASE_IMAGE=nvcr.io/nvidia/pytorch
33
ARG TRITON_IMAGE=nvcr.io/nvidia/tritonserver
4-
ARG BASE_TAG=25.05-py3
5-
ARG TRITON_BASE_TAG=25.05-py3
4+
ARG BASE_TAG=25.06-py3
5+
ARG TRITON_BASE_TAG=25.06-py3
66
ARG DEVEL_IMAGE=devel
77

88
FROM ${BASE_IMAGE}:${BASE_TAG} AS base

docker/Makefile

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -182,16 +182,16 @@ jenkins-aarch64_%: STAGE = tritondevel
182182
jenkins-rockylinux8_%: IMAGE_WITH_TAG = $(shell . ../jenkins/current_image_tags.properties && echo $$LLM_ROCKYLINUX8_PY312_DOCKER_IMAGE)
183183
jenkins-rockylinux8_%: STAGE = tritondevel
184184
jenkins-rockylinux8_%: BASE_IMAGE = nvidia/cuda
185-
jenkins-rockylinux8_%: BASE_TAG = 12.9.0-devel-rockylinux8
185+
jenkins-rockylinux8_%: BASE_TAG = 12.9.1-devel-rockylinux8
186186

187187
rockylinux8_%: STAGE = tritondevel
188188
rockylinux8_%: BASE_IMAGE = nvidia/cuda
189-
rockylinux8_%: BASE_TAG = 12.9.0-devel-rockylinux8
189+
rockylinux8_%: BASE_TAG = 12.9.1-devel-rockylinux8
190190

191191
# For x86_64 and aarch64
192192
ubuntu22_%: STAGE = tritondevel
193193
ubuntu22_%: BASE_IMAGE = nvidia/cuda
194-
ubuntu22_%: BASE_TAG = 12.9.0-devel-ubuntu22.04
194+
ubuntu22_%: BASE_TAG = 12.9.1-devel-ubuntu22.04
195195

196196
trtllm_%: STAGE = release
197197
trtllm_%: PUSH_TO_STAGING := 0

docker/common/install_cuda_toolkit.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,7 @@ set -ex
55
# This script is used for reinstalling CUDA on Rocky Linux 8 with the run file.
66
# CUDA version is usually aligned with the latest NGC CUDA image tag.
77
# Only use this script when the public CUDA image is not ready yet.
8-
CUDA_VER="12.9.0_575.51.03"
8+
CUDA_VER="12.9.1_575.57.08"
99
CUDA_VER_SHORT="${CUDA_VER%_*}"
1010

1111
NVCC_VERSION_OUTPUT=$(nvcc --version)

docker/common/install_pytorch.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,7 @@ set -ex
44

55
# Use latest stable version from https://pypi.org/project/torch/#history
66
# and closest to the version specified in
7-
# https://docs.nvidia.com/deeplearning/frameworks/pytorch-release-notes/rel-25-05.html#rel-25-05
7+
# https://docs.nvidia.com/deeplearning/frameworks/pytorch-release-notes/rel-25-06.html#rel-25-06
88
TORCH_VERSION="2.7.1"
99
SYSTEM_ID=$(grep -oP '(?<=^ID=).+' /etc/os-release | tr -d '"')
1010

docker/common/install_tensorrt.sh

Lines changed: 9 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -4,21 +4,20 @@ set -ex
44

55
TRT_VER="10.11.0.33"
66
# Align with the pre-installed cuDNN / cuBLAS / NCCL versions from
7-
# https://docs.nvidia.com/deeplearning/frameworks/pytorch-release-notes/rel-25-05.html#rel-25-05
8-
CUDA_VER="12.9" # 12.9.0
7+
# https://docs.nvidia.com/deeplearning/frameworks/pytorch-release-notes/rel-25-06.html#rel-25-06
8+
CUDA_VER="12.9" # 12.9.1
99
# Keep the cuDNN installation in case users want to build PyTorch from source.
1010
# PyTorch 2.x can compile with cuDNN v9.
11-
CUDNN_VER="9.10.1.4-1"
12-
# NCCL version 2.26.x used in the NGC PyTorch 25.05 image but has a performance regression issue.
13-
# Use NCCL version 2.27.5 which has the fixes.
11+
CUDNN_VER="9.10.2.21-1"
12+
# The NGC PyTorch 25.06 image uses NCCL 2.27.3, but NCCL 2.27.5 resolves a performance regression.
13+
# Use NCCL version 2.27.5 instead.
1414
NCCL_VER="2.27.5-1+cuda12.9"
15-
# Use cuBLAS version 12.9.0.13 instead.
16-
CUBLAS_VER="12.9.0.13-1"
15+
CUBLAS_VER="12.9.1.4-1"
1716
# Align with the pre-installed CUDA / NVCC / NVRTC versions from
1817
# https://docs.nvidia.com/cuda/cuda-toolkit-release-notes/index.html
19-
NVRTC_VER="12.9.41-1"
20-
CUDA_RUNTIME="12.9.37-1"
21-
CUDA_DRIVER_VERSION="575.51.03-1.el8"
18+
NVRTC_VER="12.9.86-1"
19+
CUDA_RUNTIME="12.9.79-1"
20+
CUDA_DRIVER_VERSION="575.57.08-1.el8"
2221

2322
for i in "$@"; do
2423
case $i in

docs/source/reference/support-matrix.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -142,7 +142,7 @@ The following table shows the supported software for TensorRT-LLM.
142142
* -
143143
- Software Compatibility
144144
* - Container
145-
- [25.05](https://docs.nvidia.com/deeplearning/frameworks/support-matrix/index.html)
145+
- [25.06](https://docs.nvidia.com/deeplearning/frameworks/support-matrix/index.html)
146146
* - TensorRT
147147
- [10.11](https://docs.nvidia.com/deeplearning/tensorrt/release-notes/index.html)
148148
* - Precision

jenkins/L0_Test.groovy

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -39,7 +39,7 @@ LLM_ROCKYLINUX8_PY310_DOCKER_IMAGE = env.wheelDockerImagePy310
3939
LLM_ROCKYLINUX8_PY312_DOCKER_IMAGE = env.wheelDockerImagePy312
4040

4141
// DLFW torch image
42-
DLFW_IMAGE = "nvcr.io/nvidia/pytorch:25.05-py3"
42+
DLFW_IMAGE = "nvcr.io/nvidia/pytorch:25.06-py3"
4343

4444
//Ubuntu base image
4545
UBUNTU_22_04_IMAGE = "urm.nvidia.com/docker/ubuntu:22.04"

requirements.txt

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -22,7 +22,7 @@ h5py==3.12.1
2222
StrEnum
2323
sentencepiece>=0.1.99
2424
tensorrt~=10.11.0
25-
# https://docs.nvidia.com/deeplearning/frameworks/pytorch-release-notes/rel-25-05.html#rel-25-05 uses 2.8.0a0.
25+
# https://docs.nvidia.com/deeplearning/frameworks/pytorch-release-notes/rel-25-06.html#rel-25-06 uses 2.8.0a0.
2626
torch>=2.7.1,<=2.8.0a0
2727
torchvision
2828
nvidia-modelopt[torch]~=0.31.0

0 commit comments

Comments
 (0)