fix: inherit tool_call_parser and reasoning_parser in LoRA model registration (#7559)

Signed-off-by: AmeenP <ameenp360@gmail.com>

fix: inherit tool_call_parser and reasoning_parser in LoRA model registration (#7559)
Signed-off-by: AmeenP <ameenp360@gmail.com>
d2d97f18 · Ameen Patel · GitHub · de6e4f30 · d2d97f18
Unverified commit d2d97f18, authored Mar 22, 2026 by Ameen Patel; committed by GitHub on Mar 22, 2026
Hide whitespace changes
Inline Side-by-side

Showing with 10 additions and 0 deletions

components/src/dynamo/vllm/handlers.py +10 -0

No files found.
--- a/components/src/dynamo/vllm/handlers.py
+++ b/components/src/dynamo/vllm/handlers.py
@@ -40,6 +40,7 @@ from dynamo.common.utils.time_section import time_and_log_code_section
 from dynamo.llm import (
    KvEventPublisher,
    ModelInput,
+    ModelRuntimeConfig,
    ModelType,
    lora_name_to_id,
    register_model,
@@ -776,6 +777,14 @@ class BaseWorkerHandler(ABC, Generic[RequestT, ResponseT]):
                                "lora_id": lora_id,
                            }
+                            runtime_config = ModelRuntimeConfig()
+                            runtime_config.tool_call_parser = (
+                                self.config.dyn_tool_call_parser
+                            )
+                            runtime_config.reasoning_parser = (
+                                self.config.dyn_reasoning_parser
+                            )
                            # Publish with format: v1/mdc/dynamo/backend/generate/{instance_id}/{lora_slug}
                            await register_model(
                                model_input=ModelInput.Tokens,
@@ -783,6 +792,7 @@ class BaseWorkerHandler(ABC, Generic[RequestT, ResponseT]):
                                endpoint=self.generate_endpoint,
                                model_path=self.config.model,
                                kv_cache_block_size=self.config.engine_args.block_size,
+                                runtime_config=runtime_config,
                                user_data=user_data,
                                lora_name=lora_name,
                                base_model_path=self.config.model,