Commit 12600c73 authored by Anant Sharma, committed by GitHub
Browse files

build: add vllm optional dependency (#201)

parent 3ba2d427
@@ -323,11 +323,9 @@ RUN uv venv $VIRTUAL_ENV --python 3.12 && \
 echo "source $VIRTUAL_ENV/bin/activate" >> ~/.bashrc
 # Install the wheels
-COPY --from=dev /workspace/dist/*.whl whls/
-RUN uv pip install $(find whls -name ai_dynamo_runtime-*.whl) && \
-uv pip install $(find whls -name ai_dynamo-*.whl) && \
-uv pip install $(find whls -name vllm-*.whl) && \
-rm -r whls
+COPY --from=dev /workspace/dist/*.whl wheelhouse/
+RUN uv pip install ai-dynamo[vllm] --find-links wheelhouse && \
+rm -r wheelhouse
 # Tell vllm to use the Dynamo LLM C API for KV Cache Routing
 ENV VLLM_KV_CAPI_PATH="/opt/dynamo/bindings/lib/libdynamo_llm_capi.so"
......
@@ -30,6 +30,7 @@ dependencies = [
 "types-psutil==7.0.0.20250218",
 "ai-dynamo-runtime==0.1.0",
 ]
 classifiers = [
 "Development Status :: 4 - Beta",
 "Intended Audience :: Developers",
@@ -46,6 +47,11 @@ classifiers = [
 ]
 keywords = ["llm", "genai", "inference", "nvidia", "distributed", "dynamo"]
+[project.optional-dependencies]
+vllm = [
+"vllm==0.7.2+dynamo"
+]
 [project.scripts]
 dynamo = "dynamo.sdk.cli.cli:cli"
 dynamo-run = "dynamo.sdk.cli.run_executable:dynamo_run"
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment