Unverified Commit d187a14c authored by atchernych's avatar atchernych Committed by GitHub
Browse files

fix: Fix Disag Examples (#8070)


Signed-off-by: default avatarAnna Tchernych <atchernych@nvidia.com>
parent 3b410226
...@@ -144,7 +144,7 @@ spec: ...@@ -144,7 +144,7 @@ spec:
- name: MODEL_PATH - name: MODEL_PATH
value: "Qwen/Qwen3-0.6B" value: "Qwen/Qwen3-0.6B"
args: args:
- "python3 -m dynamo.vllm --model $MODEL_PATH --served-model-name $SERVED_MODEL_NAME --tensor-parallel-size 1 --data-parallel-size 1 --kv-transfer-config '{\"kv_connector\":\"NixlConnector\",\"kv_role\":\"kv_both\"}' --gpu-memory-utilization 0.90 --enable-prefix-caching --block-size 16 --kv-events-config '{\"enable_kv_cache_events\":true}'" - "python3 -m dynamo.vllm --model $MODEL_PATH --served-model-name $SERVED_MODEL_NAME --tensor-parallel-size 1 --data-parallel-size 1 --disaggregation-mode decode --kv-transfer-config '{\"kv_connector\":\"NixlConnector\",\"kv_role\":\"kv_both\"}' --gpu-memory-utilization 0.90 --block-size 16"
command: command:
- /bin/sh - /bin/sh
- -c - -c
......
...@@ -163,7 +163,7 @@ spec: ...@@ -163,7 +163,7 @@ spec:
- name: HF_HOME - name: HF_HOME
value: /opt/models value: /opt/models
args: args:
- "python3 -m dynamo.vllm --model $MODEL_PATH --served-model-name $SERVED_MODEL_NAME --tensor-parallel-size 4 --data-parallel-size 1 --kv-transfer-config '{\"kv_connector\":\"NixlConnector\",\"kv_role\":\"kv_both\"}' --gpu-memory-utilization 0.90 --enable-prefix-caching --block-size 128 --kv-events-config '{\"enable_kv_cache_events\":true}'" - "python3 -m dynamo.vllm --model $MODEL_PATH --served-model-name $SERVED_MODEL_NAME --tensor-parallel-size 4 --data-parallel-size 1 --disaggregation-mode decode --kv-transfer-config '{\"kv_connector\":\"NixlConnector\",\"kv_role\":\"kv_both\"}' --gpu-memory-utilization 0.90 --block-size 128"
command: command:
- /bin/sh - /bin/sh
- -c - -c
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment