Unverified commit 2c6e6d22, authored by Alec, committed by GitHub
Browse files

chore(deps): bump vLLM to 0.15.1 (#6102)


Signed-off-by: alec-flowers <aflowers@nvidia.com>
Signed-off-by: Alec <35311602+alec-flowers@users.noreply.github.com>
Co-authored-by: Claude Sonnet 4.5 <noreply@anthropic.com>
parent 45bc1b79
...@@ -38,9 +38,9 @@ vllm: ...@@ -38,9 +38,9 @@ vllm:
base_image_tag: 25.06-cuda12.9-devel-ubuntu24.04 base_image_tag: 25.06-cuda12.9-devel-ubuntu24.04
cuda13.0: cuda13.0:
base_image_tag: 25.11-cuda13.0-devel-ubuntu24.04 base_image_tag: 25.11-cuda13.0-devel-ubuntu24.04
vllm_ref: v0.14.1 vllm_ref: v0.15.1
flashinf_ref: v0.5.3 flashinf_ref: v0.6.1
lmcache_ref: 0.3.12 lmcache_ref: 0.3.13
max_jobs: "10" max_jobs: "10"
enable_media_ffmpeg: "true" enable_media_ffmpeg: "true"
enable_gpu_memory_service: "true" enable_gpu_memory_service: "true"
......
...@@ -11,7 +11,7 @@ ...@@ -11,7 +11,7 @@
set -euo pipefail set -euo pipefail
VLLM_VER="0.14.1" VLLM_VER="0.15.1"
VLLM_REF="v${VLLM_VER}" VLLM_REF="v${VLLM_VER}"
# Basic Configurations # Basic Configurations
...@@ -23,8 +23,8 @@ INSTALLATION_DIR=/tmp ...@@ -23,8 +23,8 @@ INSTALLATION_DIR=/tmp
TORCH_CUDA_ARCH_LIST="9.0;10.0" # For EP Kernels -- TODO: check if we need to add 12.0+PTX TORCH_CUDA_ARCH_LIST="9.0;10.0" # For EP Kernels -- TODO: check if we need to add 12.0+PTX
DEEPGEMM_REF="" DEEPGEMM_REF=""
CUDA_VERSION="12.9" CUDA_VERSION="12.9"
FLASHINF_REF="v0.5.3" FLASHINF_REF="v0.6.1"
LMCACHE_REF="0.3.12" LMCACHE_REF="0.3.13"
while [[ $# -gt 0 ]]; do while [[ $# -gt 0 ]]; do
case $1 in case $1 in
......
...@@ -16,7 +16,7 @@ The following table shows the backend framework versions included with each Dyna ...@@ -16,7 +16,7 @@ The following table shows the backend framework versions included with each Dyna
| **Dynamo** | **vLLM** | **SGLang** | **TensorRT-LLM** | **NIXL** | | **Dynamo** | **vLLM** | **SGLang** | **TensorRT-LLM** | **NIXL** |
| :--- | :--- | :--- | :--- | :--- | | :--- | :--- | :--- | :--- | :--- |
| **main (ToT)** | `0.14.1` | `0.5.8` | `1.3.0rc1` | `0.9.0` | | **main (ToT)** | `0.15.1` | `0.5.8` | `1.3.0rc1` | `0.9.0` |
| **v1.0.0** *(planned)* | `0.15.0` | *Latest as of 2/17* | *Latest as of 2/17* | `0.10.0` | | **v1.0.0** *(planned)* | `0.15.0` | *Latest as of 2/17* | *Latest as of 2/17* | `0.10.0` |
| **v0.9.0** *(in progress)* | `0.14.1` | `0.5.8` | `1.3.0rc1` | `0.9.0` | | **v0.9.0** *(in progress)* | `0.14.1` | `0.5.8` | `1.3.0rc1` | `0.9.0` |
| **v0.8.1.post3** *(in progress)* | `0.12.0` | `0.5.6.post2` | `1.2.0rc6.post3` | `0.8.0` | | **v0.8.1.post3** *(in progress)* | `0.12.0` | `0.5.6.post2` | `1.2.0rc6.post3` | `0.8.0` |
......
...@@ -57,7 +57,7 @@ trtllm =[ ...@@ -57,7 +57,7 @@ trtllm =[
vllm = [ vllm = [
"uvloop", "uvloop",
"nixl[cu12]<=0.9.0", "nixl[cu12]<=0.9.0",
"vllm[flashinfer,runai]==0.14.1", "vllm[flashinfer,runai]==0.15.1",
"vllm-omni==0.14.0", "vllm-omni==0.14.0",
] ]
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment