"components/backends/vscode:/vscode.git/clone" did not exist on "13a5d61b549919bb6b766f7bc60eecdad282a11a"
Unverified Commit 9f3cc6e9 authored by ptarasiewiczNV, committed by GitHub
Browse files

fix: Use fixed vLLM DSR1 checkpoint path (#5721)


Signed-off-by: Piotr Tarasiewicz <ptarasiewicz@nvidia.com>
parent 584020f4
......@@ -7,9 +7,6 @@ metadata:
name: vllm-dsr1
spec:
backendFramework: vllm
envs:
- name: HF_HOME
value: /model-cache
pvcs:
- name: model-cache
create: false
......@@ -17,6 +14,9 @@ spec:
Frontend:
componentType: frontend
replicas: 1
volumeMounts:
- name: model-cache
mountPoint: /model-cache
extraPodSpec:
mainContainer:
startupProbe:
......@@ -73,7 +73,7 @@ spec:
args:
- |
exec python3 -m dynamo.vllm \
- --model deepseek-ai/DeepSeek-R1 \
+ --model /model-cache/deepseek-r1 \
--served-model-name deepseek-ai/DeepSeek-R1 \
--all2all-backend deepep_low_latency \
--data-parallel-hybrid-lb \
......@@ -132,7 +132,7 @@ spec:
args:
- |
exec python3 -m dynamo.vllm \
- --model deepseek-ai/DeepSeek-R1 \
+ --model /model-cache/deepseek-r1 \
--is-prefill-worker \
--served-model-name deepseek-ai/DeepSeek-R1 \
--all2all-backend deepep_high_throughput \
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment