"...git@developer.sourcefind.cn:2222/OpenDAS/vllm_cscc.git" did not exist on "73f48ce559e230fd0d738c52cb2e99bd0dd08754"
Unverified commit 25393fb3, authored by Harrison Saturley-Hall, committed by GitHub
Browse files

chore: bump trtllm to 1.3.0rc5.post1 (#7040)


Signed-off-by: Harrison King Saturley-Hall <hsaturleyhal@nvidia.com>
parent e14be96a
...@@ -90,10 +90,10 @@ trtllm: ...@@ -90,10 +90,10 @@ trtllm:
python_version: "3.12" python_version: "3.12"
index_url: https://pypi.nvidia.com/ index_url: https://pypi.nvidia.com/
pip_wheel_dir: /tmp/trtllm_wheel/ pip_wheel_dir: /tmp/trtllm_wheel/
pip_wheel: tensorrt-llm==1.3.0rc5 pip_wheel: tensorrt-llm==1.3.0rc5.post1
trtllm_wheel_image: nvcr.io/nvidia/tensorrt-llm/release:${TENSORRTLLM_PIP_WHEEL#*==} trtllm_wheel_image: nvcr.io/nvidia/tensorrt-llm/release:${TENSORRTLLM_PIP_WHEEL#*==}
github_trtllm_commit: v1.3.0rc5 github_trtllm_commit: v1.3.0rc5.post1
torch_version: 2.10.0a0+b4e4ee81d3.nv25.12 torch_version: 2.10.0a0+b4e4ee81d3.nv25.12
torch_tensorrt_version: 2.10.0a0 torch_tensorrt_version: 2.10.0a0
torchvision_version: 0.25.0a0+ca221243 torchvision_version: 0.25.0a0+ca221243
......
...@@ -27,9 +27,9 @@ The following table shows the backend framework versions included with each Dyna ...@@ -27,9 +27,9 @@ The following table shows the backend framework versions included with each Dyna
| **Dynamo** | **SGLang** | **TensorRT-LLM** | **vLLM** | **NIXL** | | **Dynamo** | **SGLang** | **TensorRT-LLM** | **vLLM** | **NIXL** |
| :--- | :--- | :--- | :--- | :--- | | :--- | :--- | :--- | :--- | :--- |
| **main (ToT)** | `0.5.9` | `1.3.0rc5` | `0.16.0` | `0.10.1` | | **main (ToT)** | `0.5.9` | `1.3.0rc5.post1` | `0.16.0` | `0.10.1` |
| **v1.0.0** *(in progress)* | `0.5.9` | `1.3.0rc5.post1` | `0.16.0` | `0.10.1` | | **v1.0.0** *(in progress)* | `0.5.9` | `1.3.0rc5.post1` | `0.16.0` | `0.10.1` |
| **v0.9.1** *(in progress)* | `0.5.8` | `1.3.0rc3` | `0.14.1` | `0.9.0` | | **v0.9.1** | `0.5.8` | `1.3.0rc3` | `0.14.1` | `0.9.0` |
| **v0.9.0** | `0.5.8` | `1.3.0rc1` | `0.14.1` | `0.9.0` | | **v0.9.0** | `0.5.8` | `1.3.0rc1` | `0.14.1` | `0.9.0` |
| **v0.8.1.post3** | `0.5.6.post2` | `1.2.0rc6.post3` | `0.12.0` | `0.8.0` | | **v0.8.1.post3** | `0.5.6.post2` | `1.2.0rc6.post3` | `0.12.0` | `0.8.0` |
| **v0.8.1.post2** | `0.5.6.post2` | `1.2.0rc6.post2` | `0.12.0` | `0.8.0` | | **v0.8.1.post2** | `0.5.6.post2` | `1.2.0rc6.post2` | `0.12.0` | `0.8.0` |
...@@ -64,7 +64,7 @@ Dynamo container images include CUDA toolkit libraries. The host machine must ha ...@@ -64,7 +64,7 @@ Dynamo container images include CUDA toolkit libraries. The host machine must ha
| | **TensorRT-LLM** | 13.1 | 580.xx+ | | | | **TensorRT-LLM** | 13.1 | 580.xx+ | |
| | **vLLM** | 12.9 | 575.xx+ | | | | **vLLM** | 12.9 | 575.xx+ | |
| | | 13.0 | 580.xx+ | | | | | 13.0 | 580.xx+ | |
| **0.9.1** *(in progress)* | **SGLang** | 12.9 | 575.xx+ | | | **0.9.1** | **SGLang** | 12.9 | 575.xx+ | |
| | **TensorRT-LLM** | 13.0 | 580.xx+ | | | | **TensorRT-LLM** | 13.0 | 580.xx+ | |
| | **vLLM** | 12.9 | 575.xx+ | | | | **vLLM** | 12.9 | 575.xx+ | |
| **0.9.0** | **SGLang** | 12.9 | 575.xx+ | | | **0.9.0** | **SGLang** | 12.9 | 575.xx+ | |
......
...@@ -53,7 +53,7 @@ Repository = "https://github.com/ai-dynamo/dynamo.git" ...@@ -53,7 +53,7 @@ Repository = "https://github.com/ai-dynamo/dynamo.git"
trtllm =[ trtllm =[
"uvloop", "uvloop",
"msgpack==1.1.2", "msgpack==1.1.2",
"tensorrt-llm==1.3.0rc5", "tensorrt-llm==1.3.0rc5.post1",
] ]
vllm = [ vllm = [
......
...@@ -123,9 +123,6 @@ trtllm_configs = { ...@@ -123,9 +123,6 @@ trtllm_configs = {
pytest.mark.gpu_2, pytest.mark.gpu_2,
pytest.mark.post_merge, pytest.mark.post_merge,
pytest.mark.trtllm, pytest.mark.trtllm,
pytest.mark.skip(
reason="DYN-2265 https://github.com/ai-dynamo/dynamo/pull/6704/changes#r2866554157 TODO enable this test when upgrading from trtllm 1.3.0rc5 to 1.3.0rc5.post1"
),
], ],
model="Qwen/Qwen3-0.6B", model="Qwen/Qwen3-0.6B",
frontend_port=DefaultPort.FRONTEND.value, frontend_port=DefaultPort.FRONTEND.value,
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment