feat: install Run:ai model streamer for vllm (#4848)

Signed-off-by: Guangtong Bai <guangtong.bai@gmail.com>

feat: install Run:ai model streamer for vllm (#4848)
Signed-off-by: Guangtong Bai <guangtong.bai@gmail.com>
53cec4ac · Guangtong Bai · GitHub · 2ef0f5fb · 53cec4ac · 53cec4ac
Unverified commit 53cec4ac, authored Dec 11, 2025 by Guangtong Bai; committed by GitHub on Dec 11, 2025
Hide whitespace changes
Inline Side-by-side

Showing 2 changed files with 2 additions and 2 deletions

container/deps/vllm/install_vllm.sh container/deps/vllm/install_vllm.sh +1 -1

pyproject.toml pyproject.toml +1 -1

No files found.
--- a/container/deps/vllm/install_vllm.sh
+++ b/container/deps/vllm/install_vllm.sh
@@ -126,7 +126,7 @@ git checkout $VLLM_REF
 echo "\n=== Installing vLLM & FlashInfer ==="
 echo "Installing vLLM $VLLM_REF from PyPI..."

-uv pip install vllm[flashinfer]==$VLLM_REF --torch-backend=${TORCH_BACKEND}
+uv pip install vllm[flashinfer,runai]==$VLLM_REF --torch-backend=${TORCH_BACKEND}
 uv pip install flashinfer-cubin==$FLASHINF_REF
 uv pip install flashinfer-jit-cache==$FLASHINF_REF --extra-index-url https://flashinfer.ai/whl/${TORCH_BACKEND}


--- a/pyproject.toml
+++ b/pyproject.toml
@@ -56,7 +56,7 @@ trtllm =[
 vllm = [
    "uvloop",
    "nixl[cu12]<=0.7.1",
-    "vllm[flashinfer]==0.12.0",
+    "vllm[flashinfer,runai]==0.12.0",
 ]

 sglang = [