Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
dynamo
Commits
a2bc6d5c
Unverified
Commit
a2bc6d5c
authored
Apr 10, 2026
by
Richard Huo
Committed by
GitHub
Apr 10, 2026
Browse files
chore: update trtllm version to v1.3.0rc11 (#8048)
parent
adae833e
Changes
6
Hide whitespace changes
Inline
Side-by-side
Showing
6 changed files
with
22 additions
and
21 deletions
+22
-21
benchmarks/pyproject.toml
benchmarks/pyproject.toml
+1
-1
container/context.yaml
container/context.yaml
+12
-12
container/deps/requirements.common.txt
container/deps/requirements.common.txt
+1
-1
container/templates/trtllm_framework.Dockerfile
container/templates/trtllm_framework.Dockerfile
+4
-5
docs/reference/support-matrix.md
docs/reference/support-matrix.md
+1
-1
pyproject.toml
pyproject.toml
+3
-1
No files found.
benchmarks/pyproject.toml
View file @
a2bc6d5c
...
...
@@ -48,7 +48,7 @@ dependencies = [
"pandas"
,
"pydantic>=2"
,
"tabulate"
,
# Satisfies vLLM 0.11.0 (>=4.55.2), vLLM 0.11.2 (>=4.56.0,<5), TRT-LLM 1.3.0rc
9
(==4.57.
1
), SGLang 0.5.8 (==4.57.1)
# Satisfies vLLM 0.11.0 (>=4.55.2), vLLM 0.11.2 (>=4.56.0,<5), TRT-LLM 1.3.0rc
11
(==4.57.
3
), SGLang 0.5.8 (==4.57.1)
"transformers>=4.56.0"
,
]
...
...
container/context.yaml
View file @
a2bc6d5c
...
...
@@ -94,8 +94,8 @@ trtllm:
cuda13.1
:
base_image
:
nvcr.io/nvidia/pytorch
runtime_image
:
nvcr.io/nvidia/cuda-dl-base
base_image_tag
:
2
5.1
2-py3
runtime_image_tag
:
2
5.1
2-cuda13.1-runtime-ubuntu24.04
base_image_tag
:
2
6.0
2-py3
runtime_image_tag
:
2
6.0
2-cuda13.1-runtime-ubuntu24.04
nixl_ref
:
0.10.1
enable_media_ffmpeg
:
"
false"
enable_gpu_memory_service
:
"
false"
...
...
@@ -103,19 +103,19 @@ trtllm:
python_version
:
"
3.12"
index_url
:
https://pypi.nvidia.com/
pip_wheel_dir
:
/tmp/trtllm_wheel/
pip_wheel
:
tensorrt-llm==1.3.0rc
9
pip_wheel
:
tensorrt-llm==1.3.0rc
11
trtllm_wheel_image
:
nvcr.io/nvidia/tensorrt-llm/release:${TENSORRTLLM_PIP_WHEEL#*==}
github_trtllm_commit
:
v1.3.0rc
9
torch_version
:
2.1
0
.0a0+
b4e4ee81d3
.nv2
5.1
2
torch_tensorrt_version
:
2.1
0
.0a0
torchvision_version
:
0.25.0a0+
ca221243
torchao_ver
:
0.1
5
.0+git
01374eb5
github_trtllm_commit
:
v1.3.0rc
11
torch_version
:
2.1
1
.0a0+
eb65b36914
.nv2
6.
2
torch_tensorrt_version
:
2.1
1
.0a0
torchvision_version
:
0.25.0a0+
1e53952f.nv26.2.44259020
torchao_ver
:
0.1
6
.0+git
a89eaab2
torchdata_ver
:
0.11.0
torchtitan_ver
:
0.2.
0
torchtitan_ver
:
0.2.
1+git9f211ec1
jinja2_version
:
3.1.6
sympy_version
:
1.14.0
pytorch_triton_ver
:
3.
5.1
+git
bfeb0668
.nv2
5.1
2
flash_attn_version
:
2.7.4.post1+
25.12
flashinfer_python_ver
:
0.6.
1
pytorch_triton_ver
:
3.
6.0
+git
9844da95
.nv2
6.
2
flash_attn_version
:
2.7.4.post1+
nv26.2.44259020
flashinfer_python_ver
:
0.6.
6
has_trtllm_context
:
"
0"
container/deps/requirements.common.txt
View file @
a2bc6d5c
...
...
@@ -28,7 +28,7 @@ tensorboard>=2.19.0,<2.21.0
tensorboardX==2.6.2.2
# Transformers version constraint for container builds
# - vLLM 0.11.0: >=4.55.2, vLLM 0.11.2: >=4.56.0,<5
# - TensorRT-LLM 1.3.0rc
9
: ==4.57.
1
# - TensorRT-LLM 1.3.0rc
11
: ==4.57.
3
# - SGLang 0.5.8: ==4.57.1
# Using >=4.56.0 to satisfy all frameworks
transformers>=4.56.0
...
...
container/templates/trtllm_framework.Dockerfile
View file @
a2bc6d5c
...
...
@@ -133,7 +133,7 @@ RUN --mount=type=cache,target=/root/.cache/uv \
# Install from local wheel directory in build context
WHEEL_FILE="$(find /trtllm_wheel -name "*.whl" | head -n 1)"; \
if [ -n "$WHEEL_FILE" ]; then \
uv pip install "$WHEEL_FILE"
triton==3.5.1
; \
uv pip install "$WHEEL_FILE"; \
else \
echo "No wheel file found in /trtllm_wheel directory."; \
exit 1; \
...
...
@@ -141,19 +141,18 @@ RUN --mount=type=cache,target=/root/.cache/uv \
elif [ -n "$(find /trtllm_wheel_image -name "*.whl" | head -n 1)" ]; then \
# Install from wheel embedded in the TRTLLM release image
WHEEL_FILE="$(find /trtllm_wheel_image -name "*.whl" | head -n 1)"; \
uv pip install "$WHEEL_FILE"
triton==3.5.1
; \
uv pip install "$WHEEL_FILE"; \
else \
# Install TensorRT-LLM wheel from the provided index URL, allow dependencies from PyPI
# TRTLLM 1.2.0rc6.post2 has issues installing from PyPI with uv; installing from the direct wheel link works best
# explicitly installing triton 3.5.1 as trtllm only lists triton as dependency on x64_64 for some reason
if echo "${TENSORRTLLM_PIP_WHEEL}" | grep -q '^tensorrt-llm=='; then \
TRTLLM_VERSION=$(echo "${TENSORRTLLM_PIP_WHEEL}" | sed -E 's/tensorrt-llm==([0-9a-zA-Z.+-]+).*/\1/'); \
PYTHON_TAG="cp$(echo ${PYTHON_VERSION} | tr -d '.')"; \
ARCH_ALT=$([ "${TARGETARCH}" = "amd64" ] && echo "x86_64" || echo "aarch64"); \
DIRECT_URL="https://pypi.nvidia.com/tensorrt-llm/tensorrt_llm-${TRTLLM_VERSION}-${PYTHON_TAG}-${PYTHON_TAG}-linux_${ARCH_ALT}.whl"; \
uv pip install --index-strategy=unsafe-best-match --extra-index-url "${TENSORRTLLM_INDEX_URL}" "${DIRECT_URL}"
triton==3.5.1
; \
uv pip install --index-strategy=unsafe-best-match --extra-index-url "${TENSORRTLLM_INDEX_URL}" "${DIRECT_URL}"; \
else \
uv pip install --index-strategy=unsafe-best-match --extra-index-url "${TENSORRTLLM_INDEX_URL}" "${TENSORRTLLM_PIP_WHEEL}"
triton==3.5.1
; \
uv pip install --index-strategy=unsafe-best-match --extra-index-url "${TENSORRTLLM_INDEX_URL}" "${TENSORRTLLM_PIP_WHEEL}"; \
fi; \
fi && \
# Run TensorRT installer that ships with the TRTLLM wheel
...
...
docs/reference/support-matrix.md
View file @
a2bc6d5c
...
...
@@ -29,7 +29,7 @@ The following table shows the backend framework versions included with each Dyna
|
**Dynamo**
|
**SGLang**
|
**TensorRT-LLM**
|
**vLLM**
|
**NIXL**
|
| :--- | :--- | :--- | :--- | :--- |
|
**main (ToT)**
|
`0.5.9`
|
`1.3.0rc
9
`
|
`0.19.0`
|
`0.10.1`
|
|
**main (ToT)**
|
`0.5.9`
|
`1.3.0rc
11
`
|
`0.19.0`
|
`0.10.1`
|
|
**v1.1.0-dev.1**
*(experimental)*
|
`0.5.9`
|
`1.3.0rc5.post1`
|
`0.17.1`
|
`0.10.1`
|
|
**v1.0.1**
|
`0.5.9`
|
`1.3.0rc5.post1`
|
`0.16.0`
|
`0.10.1`
|
|
**v1.0.0**
|
`0.5.9`
|
`1.3.0rc5.post1`
|
`0.16.0`
|
`0.10.1`
|
...
...
pyproject.toml
View file @
a2bc6d5c
...
...
@@ -44,7 +44,7 @@ Repository = "https://github.com/ai-dynamo/dynamo.git"
[project.optional-dependencies]
trtllm
=[
"uvloop"
,
"tensorrt-llm==1.3.0rc
9
"
,
"tensorrt-llm==1.3.0rc
11
"
,
]
vllm
=
[
...
...
@@ -210,6 +210,8 @@ filterwarnings = [
"ignore:Triton is not supported on current platform.*:UserWarning"
,
# torch.jit.script_method deprecation from torch.utils.mkldnn
"ignore:.*torch
\\
.jit
\\
.script_method.*is deprecated.*:DeprecationWarning"
,
# torch.jit.script deprecation from modelopt.torch.quantization
"ignore:`torch.jit.script` is deprecated:DeprecationWarning"
,
# nvidia-modelopt warning about transformers version (transitive dep from TRT-LLM)
"ignore:transformers version .* is incompatible with nvidia-modelopt.*:UserWarning"
,
# SGLang quantization warnings on CPU-only runners
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment