Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
dynamo
Commits
f9ba6f5c
"vscode:/vscode.git/clone" did not exist on "fcc42624a36ab2aaa71c0a8ddf3ec09e5cd12987"
Unverified
Commit
f9ba6f5c
authored
May 29, 2025
by
Tanmay Verma
Committed by
GitHub
May 29, 2025
Browse files
feat: Publish events and metrics when using kv routing (#1262)
parent
4e47903b
Changes
2
Show whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
12 additions
and
1 deletion
+12
-1
launch/dynamo-run/src/subprocess.rs
launch/dynamo-run/src/subprocess.rs
+7
-0
launch/dynamo-run/src/subprocess/trtllm_inc.py
launch/dynamo-run/src/subprocess/trtllm_inc.py
+5
-1
No files found.
launch/dynamo-run/src/subprocess.rs
View file @
f9ba6f5c
...
...
@@ -10,6 +10,7 @@ use anyhow::Context;
use
regex
::
Regex
;
use
tokio
::
io
::
AsyncBufReadExt
;
use
crate
::
flags
::
RouterMode
;
use
dynamo_llm
::
engines
::
MultiNodeConfig
;
use
dynamo_llm
::
local_model
::
LocalModel
;
use
dynamo_runtime
::
protocols
::
Endpoint
as
EndpointId
;
...
...
@@ -51,6 +52,12 @@ pub async fn start(
"--context-length"
.to_string
(),
card
.context_length
.to_string
(),
];
// TRTLLM only
// The worker node will only publish events and metrics if the router mode is KV
if
flags
.router_mode
==
RouterMode
::
KV
{
args
.push
(
"--publish-events-and-metrics"
.to_string
());
}
// sglang only
// vllm uses CUDA_VISIBLE_DEVICES
if
flags
.base_gpu_id
!=
0
{
...
...
launch/dynamo-run/src/subprocess/trtllm_inc.py
View file @
f9ba6f5c
...
...
@@ -178,7 +178,11 @@ async def init(runtime: DistributedRuntime, config: Config):
async
with
get_tensorrtllm_engine
(
engine_args
)
as
engine
:
endpoint
=
component
.
endpoint
(
config
.
endpoint
)
await
register_llm
(
ModelType
.
Backend
,
endpoint
,
config
.
model_path
,
config
.
model_name
ModelType
.
Backend
,
endpoint
,
config
.
model_path
,
config
.
model_name
,
kv_cache_block_size
=
config
.
kv_block_size
,
)
if
config
.
publish_events_and_metrics
:
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment