"vscode:/vscode.git/clone" did not exist on "ece76a62018f91f149c60f82590fc7e7e7ff5df4"
Unverified commit 3a418254, authored by Karen Chung, committed by GitHub
Browse files

fix: Correctly pass DP rank from Dynamo router into vLLM engine (#6014)

parent 5035447f
...@@ -1350,8 +1350,7 @@ class DecodeWorkerHandler(BaseWorkerHandler): ...@@ -1350,8 +1350,7 @@ class DecodeWorkerHandler(BaseWorkerHandler):
logger.debug( logger.debug(
f"Decode request {request_id} has no LoRA specified (model: {model_name})" f"Decode request {request_id} has no LoRA specified (model: {model_name})"
) )
dp_rank = request.get("routing", {}).get("dp_rank")
dp_rank = request.get("dp_rank", None)
trace_headers = build_trace_headers(context) trace_headers = build_trace_headers(context)
...@@ -1395,7 +1394,7 @@ class DecodeWorkerHandler(BaseWorkerHandler): ...@@ -1395,7 +1394,7 @@ class DecodeWorkerHandler(BaseWorkerHandler):
request, self.default_sampling_params request, self.default_sampling_params
) )
dp_rank = request.get("dp_rank", None) dp_rank = request.get("routing", {}).get("dp_rank")
openai_request_id = request.get("id") or request.get("request_id", request_id) openai_request_id = request.get("id") or request.get("request_id", request_id)
previous_text = "" previous_text = ""
...@@ -1565,7 +1564,7 @@ class PrefillWorkerHandler(BaseWorkerHandler): ...@@ -1565,7 +1564,7 @@ class PrefillWorkerHandler(BaseWorkerHandler):
f"Prefill request {request_id} has no LoRA specified (model: {model_name})" f"Prefill request {request_id} has no LoRA specified (model: {model_name})"
) )
dp_rank = request.get("dp_rank", None) dp_rank = request.get("routing", {}).get("dp_rank")
trace_headers = build_trace_headers(context) trace_headers = build_trace_headers(context)
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment