"vscode:/vscode.git/clone" did not exist on "cf269dba88b42b0d04b83308a9b9aa94dba378cc"
Unverified Commit 8a0657cb authored by Hongkuan Zhou, committed by GitHub
Browse files

fix: correct planner entrypoint in profiler's planner config gen (#7095)


Signed-off-by: hongkuanz <hongkuanz@nvidia.com>
parent 9df36b38
...@@ -103,7 +103,7 @@ class DgdPlannerServiceConfig(BaseModel): ...@@ -103,7 +103,7 @@ class DgdPlannerServiceConfig(BaseModel):
mainContainer=Container( mainContainer=Container(
image="my-registry/dynamo-runtime:my-tag", # placeholder image="my-registry/dynamo-runtime:my-tag", # placeholder
workingDir=f"{get_workspace_dir()}/components/src/dynamo/planner", workingDir=f"{get_workspace_dir()}/components/src/dynamo/planner",
command=["python3", "-m", "dynamo.planner.planner_sla"], command=["python3", "-m", "dynamo.planner"],
args=[], args=[],
) )
) )
......
...@@ -73,24 +73,16 @@ spec: ...@@ -73,24 +73,16 @@ spec:
extraPodSpec: extraPodSpec:
mainContainer: mainContainer:
image: my-registry/vllm-runtime:my-tag image: my-registry/vllm-runtime:my-tag
workingDir: /workspace/components/src/dynamo/planner
ports: ports:
- name: metrics - name: metrics
containerPort: 9085 containerPort: 9085
command: command:
- /bin/sh - python3
- -c - -m
- dynamo.planner
args: args:
- >- - --config
python3 -m planner_sla - '{"environment": "kubernetes", "backend": "vllm", "ttft": 200, "itl": 10, "profile_results_dir": "/workspace/tests/planner/profiling_results/H200_TP1P_TP1D/", "throughput_adjustment_interval": 60, "metric_reporting_prometheus_port": 9085, "no_correction": true}'
--environment=kubernetes
--backend=vllm
--ttft 200
--itl 10
--profile-results-dir /workspace/tests/planner/profiling_results/H200_TP1P_TP1D/
--adjustment-interval=60
--prometheus-port=9085
--no-correction
VllmDecodeWorker: VllmDecodeWorker:
envFromSecret: hf-token-secret envFromSecret: hf-token-secret
componentType: worker componentType: worker
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment