"vllm/vscode:/vscode.git/clone" did not exist on "77f7bb4532af0e4d92641c5402453ef395a287c4"
Unverified Commit 3a418254 authored by Karen Chung's avatar Karen Chung Committed by GitHub
Browse files

fix: Correctly pass DP rank from Dynamo router into vLLM engine (#6014)

parent 5035447f
......@@ -1350,8 +1350,7 @@ class DecodeWorkerHandler(BaseWorkerHandler):
logger.debug(
f"Decode request {request_id} has no LoRA specified (model: {model_name})"
)
dp_rank = request.get("dp_rank", None)
dp_rank = request.get("routing", {}).get("dp_rank")
trace_headers = build_trace_headers(context)
......@@ -1395,7 +1394,7 @@ class DecodeWorkerHandler(BaseWorkerHandler):
request, self.default_sampling_params
)
dp_rank = request.get("dp_rank", None)
dp_rank = request.get("routing", {}).get("dp_rank")
openai_request_id = request.get("id") or request.get("request_id", request_id)
previous_text = ""
......@@ -1565,7 +1564,7 @@ class PrefillWorkerHandler(BaseWorkerHandler):
f"Prefill request {request_id} has no LoRA specified (model: {model_name})"
)
dp_rank = request.get("dp_rank", None)
dp_rank = request.get("routing", {}).get("dp_rank")
trace_headers = build_trace_headers(context)
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment