Commit 8a0657cb (unverified), authored by Hongkuan Zhou, committed by GitHub
Browse files

fix: correct planner entrypoint in profiler's planner config gen (#7095)


Signed-off-by: hongkuanz <hongkuanz@nvidia.com>
parent 9df36b38
......@@ -103,7 +103,7 @@ class DgdPlannerServiceConfig(BaseModel):
mainContainer=Container(
image="my-registry/dynamo-runtime:my-tag", # placeholder
workingDir=f"{get_workspace_dir()}/components/src/dynamo/planner",
command=["python3", "-m", "dynamo.planner.planner_sla"],
command=["python3", "-m", "dynamo.planner"],
args=[],
)
)
......
......@@ -73,24 +73,16 @@ spec:
extraPodSpec:
mainContainer:
image: my-registry/vllm-runtime:my-tag
workingDir: /workspace/components/src/dynamo/planner
ports:
- name: metrics
containerPort: 9085
command:
- /bin/sh
- -c
- python3
- -m
- dynamo.planner
args:
- >-
python3 -m planner_sla
--environment=kubernetes
--backend=vllm
--ttft 200
--itl 10
--profile-results-dir /workspace/tests/planner/profiling_results/H200_TP1P_TP1D/
--adjustment-interval=60
--prometheus-port=9085
--no-correction
- --config
- '{"environment": "kubernetes", "backend": "vllm", "ttft": 200, "itl": 10, "profile_results_dir": "/workspace/tests/planner/profiling_results/H200_TP1P_TP1D/", "throughput_adjustment_interval": 60, "metric_reporting_prometheus_port": 9085, "no_correction": true}'
VllmDecodeWorker:
envFromSecret: hf-token-secret
componentType: worker
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment