Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
dynamo
Commits
abd4b5d9
Unverified
Commit
abd4b5d9
authored
Jan 12, 2026
by
Tanmay Verma
Committed by
GitHub
Jan 12, 2026
Browse files
chore: Upgrade to tensorrt_llm==1.2.0rc6.post1 (#5356)
parent
9e6c9ae9
Changes
6
Show whitespace changes
Inline
Side-by-side
Showing
6 changed files
with
7 additions
and
7 deletions
+7
-7
benchmarks/pyproject.toml
benchmarks/pyproject.toml
+1
-1
container/Dockerfile.trtllm
container/Dockerfile.trtllm
+1
-1
container/build.sh
container/build.sh
+2
-2
container/deps/requirements.txt
container/deps/requirements.txt
+1
-1
docs/reference/support-matrix.md
docs/reference/support-matrix.md
+1
-1
pyproject.toml
pyproject.toml
+1
-1
No files found.
benchmarks/pyproject.toml
View file @
abd4b5d9
...
@@ -46,7 +46,7 @@ dependencies = [
...
@@ -46,7 +46,7 @@ dependencies = [
"pydantic>=2"
,
"pydantic>=2"
,
"tabulate"
,
"tabulate"
,
"types-tabulate"
,
"types-tabulate"
,
# Satisfies vLLM 0.11.0 (>=4.55.2), vLLM 0.11.2 (>=4.56.0,<5), TRT-LLM 1.2.0rc6 (==4.56.0), SGLang 0.5.7 (==4.57.1)
# Satisfies vLLM 0.11.0 (>=4.55.2), vLLM 0.11.2 (>=4.56.0,<5), TRT-LLM 1.2.0rc6.post1 (==4.57.1), SGLang 0.5.7 (==4.57.1)
"transformers>=4.56.0,<=4.57.1"
,
"transformers>=4.56.0,<=4.57.1"
,
"pytest-mypy"
,
"pytest-mypy"
,
]
]
...
...
container/Dockerfile.trtllm
View file @
abd4b5d9
...
@@ -561,7 +561,7 @@ RUN if [ "$HAS_TRTLLM_CONTEXT" = "1" ]; then \
...
@@ -561,7 +561,7 @@ RUN if [ "$HAS_TRTLLM_CONTEXT" = "1" ]; then \
sed -i 's/pip3 install/uv pip install/g' /tmp/install_tensorrt.sh && \
sed -i 's/pip3 install/uv pip install/g' /tmp/install_tensorrt.sh && \
bash /tmp/install_tensorrt.sh && \
bash /tmp/install_tensorrt.sh && \
# Install TensorRT-LLM wheel from the provided index URL, allow dependencies from PyPI
# Install TensorRT-LLM wheel from the provided index URL, allow dependencies from PyPI
# TRTLLM 1.2.0rc6 has issues installing from pypi with uv, installing from direct wheel link works best
# TRTLLM 1.2.0rc6.post1 has issues installing from pypi with uv, installing from direct wheel link works best
# explicitly installing triton 3.5.0 as trtllm only lists triton as dependency on x86_64 for some reason
# explicitly installing triton 3.5.0 as trtllm only lists triton as dependency on x86_64 for some reason
if echo "${TENSORRTLLM_PIP_WHEEL}" | grep -q '^tensorrt-llm=='; then \
if echo "${TENSORRTLLM_PIP_WHEEL}" | grep -q '^tensorrt-llm=='; then \
TRTLLM_VERSION=$(echo "${TENSORRTLLM_PIP_WHEEL}" | sed -E 's/tensorrt-llm==([0-9a-zA-Z.+-]+).*/\1/'); \
TRTLLM_VERSION=$(echo "${TENSORRTLLM_PIP_WHEEL}" | sed -E 's/tensorrt-llm==([0-9a-zA-Z.+-]+).*/\1/'); \
...
...
container/build.sh
View file @
abd4b5d9
...
@@ -89,7 +89,7 @@ DEFAULT_TENSORRTLLM_PIP_WHEEL_DIR="/tmp/trtllm_wheel/"
...
@@ -89,7 +89,7 @@ DEFAULT_TENSORRTLLM_PIP_WHEEL_DIR="/tmp/trtllm_wheel/"
# TensorRT-LLM commit to use for building the trtllm wheel if not provided.
# TensorRT-LLM commit to use for building the trtllm wheel if not provided.
# Important Note: This commit is not used in our CI pipeline. See the CI
# Important Note: This commit is not used in our CI pipeline. See the CI
# variables to learn how to run a pipeline with a specific commit.
# variables to learn how to run a pipeline with a specific commit.
DEFAULT_EXPERIMENTAL_TRTLLM_COMMIT
=
"
9ba14263db0045ed3fa0860f949b5ce320107eb3
"
# 1.2.0rc6
DEFAULT_EXPERIMENTAL_TRTLLM_COMMIT
=
"
e4a6c9995dacf66bab4410475a6774152f95a0a6
"
# 1.2.0rc6
.post1
TRTLLM_COMMIT
=
""
TRTLLM_COMMIT
=
""
TRTLLM_USE_NIXL_KVCACHE_EXPERIMENTAL
=
"0"
TRTLLM_USE_NIXL_KVCACHE_EXPERIMENTAL
=
"0"
TRTLLM_GIT_URL
=
""
TRTLLM_GIT_URL
=
""
...
@@ -98,7 +98,7 @@ TRTLLM_GIT_URL=""
...
@@ -98,7 +98,7 @@ TRTLLM_GIT_URL=""
DEFAULT_TENSORRTLLM_INDEX_URL
=
"https://pypi.nvidia.com/"
DEFAULT_TENSORRTLLM_INDEX_URL
=
"https://pypi.nvidia.com/"
# TODO: Remove the version specification from here and use the ai-dynamo[trtllm] package.
# TODO: Remove the version specification from here and use the ai-dynamo[trtllm] package.
# Need to update the Dockerfile.trtllm to use the ai-dynamo[trtllm] package.
# Need to update the Dockerfile.trtllm to use the ai-dynamo[trtllm] package.
DEFAULT_TENSORRTLLM_PIP_WHEEL
=
"tensorrt-llm==1.2.0rc6"
DEFAULT_TENSORRTLLM_PIP_WHEEL
=
"tensorrt-llm==1.2.0rc6
.post1
"
TENSORRTLLM_PIP_WHEEL
=
""
TENSORRTLLM_PIP_WHEEL
=
""
VLLM_BASE_IMAGE
=
"nvcr.io/nvidia/cuda-dl-base"
VLLM_BASE_IMAGE
=
"nvcr.io/nvidia/cuda-dl-base"
...
...
container/deps/requirements.txt
View file @
abd4b5d9
...
@@ -52,7 +52,7 @@ tensorboard>=2.19.0,<2.21.0
...
@@ -52,7 +52,7 @@ tensorboard>=2.19.0,<2.21.0
tensorboardX==2.6.2.2
tensorboardX==2.6.2.2
# Transformers version constraint for container builds
# Transformers version constraint for container builds
# - vLLM 0.11.0: >=4.55.2, vLLM 0.11.2: >=4.56.0,<5
# - vLLM 0.11.0: >=4.55.2, vLLM 0.11.2: >=4.56.0,<5
# - TensorRT-LLM 1.2.0rc6: ==4.56.0
# - TensorRT-LLM 1.2.0rc6.post1: ==4.57.1
# - SGLang 0.5.7: ==4.57.1
# - SGLang 0.5.7: ==4.57.1
# Using >=4.56.0 and <=4.57.1 to satisfy all frameworks
# Using >=4.56.0 and <=4.57.1 to satisfy all frameworks
transformers>=4.56.0,<=4.57.1
transformers>=4.56.0,<=4.57.1
...
...
docs/reference/support-matrix.md
View file @
abd4b5d9
...
@@ -63,7 +63,7 @@ The following table shows the dependency versions included with each Dynamo rele
...
@@ -63,7 +63,7 @@ The following table shows the dependency versions included with each Dynamo rele
|
**Dependency**
|
**main (ToT)**
|
**v0.8.0 (unreleased)**
|
**v0.7.1**
|
**v0.7.0.post1**
|
**v0.7.0**
|
|
**Dependency**
|
**main (ToT)**
|
**v0.8.0 (unreleased)**
|
**v0.7.1**
|
**v0.7.0.post1**
|
**v0.7.0**
|
| :------------- | :------------- | :---------------------- | :--------- | :--------------- | :--------- |
| :------------- | :------------- | :---------------------- | :--------- | :--------------- | :--------- |
| SGLang | 0.5.7 | 0.5.7 | 0.5.3.post4| 0.5.3.post4 | 0.5.3.post4|
| SGLang | 0.5.7 | 0.5.7 | 0.5.3.post4| 0.5.3.post4 | 0.5.3.post4|
| TensorRT-LLM | 1.2.0rc6 | 1.2.0rc6 | 1.2.0rc3 | 1.2.0rc3 | 1.2.0rc2 |
| TensorRT-LLM | 1.2.0rc6.post1 | 1.2.0rc6 | 1.2.0rc3 | 1.2.0rc3 | 1.2.0rc2 |
| vLLM | 0.13.0 | 0.12.0 | 0.11.0 | 0.11.0 | 0.11.0 |
| vLLM | 0.13.0 | 0.12.0 | 0.11.0 | 0.11.0 | 0.11.0 |
| NIXL | 0.8.0 | 0.8.0 | 0.8.0 | 0.8.0 | 0.8.0 |
| NIXL | 0.8.0 | 0.8.0 | 0.8.0 | 0.8.0 | 0.8.0 |
...
...
pyproject.toml
View file @
abd4b5d9
...
@@ -50,7 +50,7 @@ Repository = "https://github.com/ai-dynamo/dynamo.git"
...
@@ -50,7 +50,7 @@ Repository = "https://github.com/ai-dynamo/dynamo.git"
[project.optional-dependencies]
[project.optional-dependencies]
trtllm
=[
trtllm
=[
"uvloop"
,
"uvloop"
,
"tensorrt-llm==1.2.0rc6"
,
"tensorrt-llm==1.2.0rc6
.post1
"
,
]
]
vllm
=
[
vllm
=
[
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment