# SPDX-FileCopyrightText: Copyright (c) 2024-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# SPDX-License-Identifier: Apache-2.0
#
# This file holds the default ARG values of the Dockerfiles generated
# by render.py. These are the recommended default values for users and
# are the source of truth for the values used in our delivered images.
#
# Some ARGs have multiple valid values and can be changed for local testing.
# To do so, either edit this file locally or pass --build-arg to
# `docker build`.

# Default ARG values for the `dynamo` section.
dynamo:
  # Base image and tag, keyed by CUDA version.
  cuda12.9:
    base_image: nvcr.io/nvidia/cuda-dl-base
    base_image_tag: 25.06-cuda12.9-devel-ubuntu24.04
  cuda13.0:
    base_image: nvcr.io/nvidia/cuda-dl-base
    base_image_tag: 25.11-cuda13.0-devel-ubuntu24.04
  epp_image: us-central1-docker.pkg.dev/k8s-staging-images/gateway-api-inference-extension/epp:v0.5.1
  frontend_image: nvcr.io/nvidia/base/ubuntu:noble-20250619
  planner_build_image: python
  planner_build_image_tag: 3.12-slim
  planner_runtime_image: nvcr.io/nvidia/distroless/python
  planner_runtime_image_tag: 3.12-v4.0.3
  python_version: "3.12"

  nats_version: v2.10.28
  etcd_version: v3.5.21

  # Digit-leading refs are quoted so a YAML loader always yields a string,
  # even if a future value happens to look like a number (e.g. "1.20").
  nixl_ref: "0.10.1"
  nixl_ucx_ref: v1.20.x
  nixl_gdrcopy_ref: v2.5.1
  nixl_ucx_efa_ref: "9d2b88a1f67faf9876f267658bd077b379b8bb76"
  nixl_libfabric_ref: v2.3.0
  # Feature toggles are strings ("true"/"false"), not YAML booleans.
  enable_kvbm: "true"
  enable_media_ffmpeg: "false"
  enable_gpu_memory_service: "true"
  ffmpeg_version: "7.1"
  efa_version: "1.45.1"

# Default ARG values for the `vllm` section.
vllm:
  # Per-target images, tags and vLLM ref (two CUDA versions, XPU, CPU).
  cuda12.9:
    base_image: nvcr.io/nvidia/cuda-dl-base
    runtime_image: nvcr.io/nvidia/cuda
    base_image_tag: 25.06-cuda12.9-devel-ubuntu24.04
    runtime_image_tag: 12.9.1-runtime-ubuntu24.04
    vllm_ref: v0.19.0
  cuda13.0:
    base_image: nvcr.io/nvidia/cuda-dl-base
    runtime_image: nvcr.io/nvidia/cuda
    base_image_tag: 25.11-cuda13.0-devel-ubuntu24.04
    runtime_image_tag: 13.0.2-runtime-ubuntu24.04
    vllm_ref: v0.19.0
  xpu:
    base_image: intel/deep-learning-essentials
    runtime_image: intel/deep-learning-essentials
    base_image_tag: 2025.3.2-0-devel-ubuntu24.04
    runtime_image_tag: 2025.3.2-0-devel-ubuntu24.04
    vllm_ref: v0.17.1
  cpu:
    base_image: ubuntu
    runtime_image: ubuntu
    # Quoted: an unquoted 24.04 is resolved by YAML as a float, not a tag
    # string (and a tag such as 24.10 would silently collapse to 24.1).
    base_image_tag: "24.04"
    runtime_image_tag: "24.04"
    vllm_ref: v0.16.0
  flashinf_ref: v0.6.6
  lmcache_ref: "0.4.2"
  vllm_omni_ref: "release/v0.19.0rc1"
  nixl_ref: "0.10.1"
  max_jobs: "10"
  # Feature toggles are strings ("true"/"false"), not YAML booleans.
  enable_media_ffmpeg: "false"
  enable_gpu_memory_service: "true"
  enable_kvbm: "true"
  enable_modelexpress_p2p: "false"
  modelexpress_ref: "3d73992ce6c10e52ddc54f7f12af35d27e173f15"

# Default ARG values for the `sglang` section.
sglang:
  # Base/runtime images and tags, keyed by CUDA version.
  cuda12.9:
    base_image: nvcr.io/nvidia/cuda-dl-base
    runtime_image: lmsysorg/sglang
    base_image_tag: 25.06-cuda12.9-devel-ubuntu24.04
    runtime_image_tag: v0.5.9-runtime
  cuda13.0:
    base_image: nvcr.io/nvidia/cuda-dl-base
    runtime_image: lmsysorg/sglang
    base_image_tag: 25.11-cuda13.0-devel-ubuntu24.04
    runtime_image_tag: v0.5.9-cu130-runtime
  # NOTE(review): the dynamo, vllm and trtllm sections of this file pin
  # nixl_ref 0.10.1 - confirm that 0.10.0 is intentional here.
  nixl_ref: "0.10.0"
  # Feature toggles are strings ("true"/"false"), not YAML booleans.
  enable_media_ffmpeg: "false"
  enable_gpu_memory_service: "true"
  enable_kvbm: "false"

# Default ARG values for the `trtllm` section.
trtllm:
  # Base/runtime images and tags, keyed by CUDA version.
  cuda13.1:
    base_image: nvcr.io/nvidia/pytorch
    runtime_image: nvcr.io/nvidia/cuda-dl-base
    base_image_tag: 25.12-py3
    runtime_image_tag: 25.12-cuda13.1-runtime-ubuntu24.04
  nixl_ref: "0.10.1"
  # Feature toggles are strings ("true"/"false"), not YAML booleans.
  enable_media_ffmpeg: "false"
  enable_gpu_memory_service: "false"
  enable_kvbm: "true"
  python_version: "3.12"
  index_url: https://pypi.nvidia.com/
  pip_wheel_dir: /tmp/trtllm_wheel/
  pip_wheel: tensorrt-llm==1.3.0rc9
  # Quoted because the value contains YAML indicator characters (#, {, *).
  # The ${VAR#*==} form looks like a shell parameter expansion that strips
  # everything up to "==" - presumably resolved at build time; confirm
  # against the consuming Dockerfile template.
  trtllm_wheel_image: "nvcr.io/nvidia/tensorrt-llm/release:${TENSORRTLLM_PIP_WHEEL#*==}"

  github_trtllm_commit: v1.3.0rc9
  # Pinned package versions; quoted so every value loads as a string.
  torch_version: "2.10.0a0+b4e4ee81d3.nv25.12"
  torch_tensorrt_version: "2.10.0a0"
  torchvision_version: "0.25.0a0+ca221243"
  torchao_ver: "0.15.0+git01374eb5"
  torchdata_ver: "0.11.0"
  torchtitan_ver: "0.2.0"
  jinja2_version: "3.1.6"
  sympy_version: "1.14.0"
  pytorch_triton_ver: "3.5.1+gitbfeb0668.nv25.12"
  flash_attn_version: "2.7.4.post1+25.12"
  flashinfer_python_ver: "0.6.1"
  has_trtllm_context: "0"