File tree Expand file tree Collapse file tree 4 files changed +8
-8
lines changed Expand file tree Collapse file tree 4 files changed +8
-8
lines changed Original file line number Diff line number Diff line change 1
1
version : " 3.9"
2
2
services :
3
3
tensorrt_llm-dev :
4
- image : urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:pytorch-25.05-py3-x86_64-ubuntu24.04-trt10.11.0.33-skip-tritondevel-202506051650-4885
4
+ image : urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:pytorch-25.05-py3-x86_64-ubuntu24.04-trt10.11.0.33-skip-tritondevel-202506271620-5539
5
5
network_mode : host
6
6
ipc : host
7
7
Original file line number Diff line number Diff line change @@ -10,8 +10,8 @@ CUDA_VER="12.9" # 12.9.0
10
10
# PyTorch 2.x can compile with cuDNN v9.
11
11
CUDNN_VER=" 9.10.1.4-1"
12
12
# NCCL version 2.26.x is used in the NGC PyTorch 25.05 image but has a performance regression issue.
13
- # Use NCCL version 2.25.1 instead .
14
- NCCL_VER=" 2.25.1 -1+cuda12.8 "
13
+ # Use NCCL version 2.27.5, which has the fixes.
14
+ NCCL_VER=" 2.27.5 -1+cuda12.9 "
15
15
# Use cuBLAS version 12.9.0.13 instead.
16
16
CUBLAS_VER=" 12.9.0.13-1"
17
17
# Align with the pre-installed CUDA / NVCC / NVRTC versions from
Original file line number Diff line number Diff line change @@ -28,10 +28,10 @@ UPLOAD_PATH = env.uploadPath ? env.uploadPath : "sw-tensorrt-generic/llm-artifac
28
28
// Container configuration
29
29
// available tags can be found in: https://urm.nvidia.com/artifactory/sw-tensorrt-docker/tensorrt-llm/
30
30
// [base_image_name]-[arch]-[os](-[python_version])-[trt_version]-[torch_install_type]-[stage]-[date]-[mr_id]
31
- LLM_DOCKER_IMAGE = " urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:pytorch-25.05-py3-x86_64-ubuntu24.04-trt10.11.0.33-skip-tritondevel-202506051650-4885 "
32
- LLM_SBSA_DOCKER_IMAGE = " urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:pytorch-25.05-py3-aarch64-ubuntu24.04-trt10.11.0.33-skip-tritondevel-202506051650-4885 "
33
- LLM_ROCKYLINUX8_PY310_DOCKER_IMAGE = " urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:cuda-12.9.0-devel-rocky8-x86_64-rocky8-py310-trt10.11.0.33-skip-tritondevel-202506051650-4885 "
34
- LLM_ROCKYLINUX8_PY312_DOCKER_IMAGE = " urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:cuda-12.9.0-devel-rocky8-x86_64-rocky8-py312-trt10.11.0.33-skip-tritondevel-202506051650-4885 "
31
+ LLM_DOCKER_IMAGE = " urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:pytorch-25.05-py3-x86_64-ubuntu24.04-trt10.11.0.33-skip-tritondevel-202506271620-5539 "
32
+ LLM_SBSA_DOCKER_IMAGE = " urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:pytorch-25.05-py3-aarch64-ubuntu24.04-trt10.11.0.33-skip-tritondevel-202506271620-5539 "
33
+ LLM_ROCKYLINUX8_PY310_DOCKER_IMAGE = " urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:cuda-12.9.0-devel-rocky8-x86_64-rocky8-py310-trt10.11.0.33-skip-tritondevel-202506271620-5539 "
34
+ LLM_ROCKYLINUX8_PY312_DOCKER_IMAGE = " urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:cuda-12.9.0-devel-rocky8-x86_64-rocky8-py312-trt10.11.0.33-skip-tritondevel-202506271620-5539 "
35
35
36
36
// TODO: Move common variables to a unified location
37
37
BUILD_CORES_REQUEST = " 8"
Original file line number Diff line number Diff line change 1
1
2
2
import java.lang.InterruptedException
3
3
4
- DOCKER_IMAGE = " urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:pytorch-25.05-py3-x86_64-ubuntu24.04-trt10.11.0.33-skip-tritondevel-202506051650-4885 "
4
+ DOCKER_IMAGE = " urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:pytorch-25.05-py3-x86_64-ubuntu24.04-trt10.11.0.33-skip-tritondevel-202506271620-5539 "
5
5
6
6
def createKubernetesPodConfig (image , arch = " amd64" )
7
7
{
You can’t perform that action at this time.
0 commit comments