Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
7a8a48d5
Unverified
Commit
7a8a48d5
authored
Jan 18, 2025
by
Simon Mo
Committed by
GitHub
Jan 19, 2025
Browse files
[V1] Collect env var for usage stats (#12115)
parent
32eb0da8
Changes
1
Show whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
18 additions
and
0 deletions
+18
-0
vllm/usage/usage_lib.py
vllm/usage/usage_lib.py
+18
-0
No files found.
vllm/usage/usage_lib.py
View file @
7a8a48d5
...
@@ -27,6 +27,17 @@ _USAGE_STATS_SERVER = envs.VLLM_USAGE_STATS_SERVER
...
@@ -27,6 +27,17 @@ _USAGE_STATS_SERVER = envs.VLLM_USAGE_STATS_SERVER
_GLOBAL_RUNTIME_DATA
:
Dict
[
str
,
Union
[
str
,
int
,
bool
]]
=
{}
_GLOBAL_RUNTIME_DATA
:
Dict
[
str
,
Union
[
str
,
int
,
bool
]]
=
{}
_USAGE_ENV_VARS_TO_COLLECT
=
[
"VLLM_USE_MODELSCOPE"
,
"VLLM_USE_TRITON_FLASH_ATTN"
,
"VLLM_ATTENTION_BACKEND"
,
"VLLM_USE_FLASHINFER_SAMPLER"
,
"VLLM_PP_LAYER_PARTITION"
,
"VLLM_USE_TRITON_AWQ"
,
"VLLM_USE_V1"
,
"VLLM_ENABLE_V1_MULTIPROCESSING"
,
]
def
set_runtime_usage_data
(
key
:
str
,
value
:
Union
[
str
,
int
,
bool
])
->
None
:
def
set_runtime_usage_data
(
key
:
str
,
value
:
Union
[
str
,
int
,
bool
])
->
None
:
"""Set global usage data that will be sent with every usage heartbeat."""
"""Set global usage data that will be sent with every usage heartbeat."""
...
@@ -122,6 +133,7 @@ class UsageMessage:
...
@@ -122,6 +133,7 @@ class UsageMessage:
self
.
gpu_count
:
Optional
[
int
]
=
None
self
.
gpu_count
:
Optional
[
int
]
=
None
self
.
gpu_type
:
Optional
[
str
]
=
None
self
.
gpu_type
:
Optional
[
str
]
=
None
self
.
gpu_memory_per_device
:
Optional
[
int
]
=
None
self
.
gpu_memory_per_device
:
Optional
[
int
]
=
None
self
.
env_var_json
:
Optional
[
str
]
=
None
# vLLM Information
# vLLM Information
self
.
model_architecture
:
Optional
[
str
]
=
None
self
.
model_architecture
:
Optional
[
str
]
=
None
...
@@ -176,6 +188,12 @@ class UsageMessage:
...
@@ -176,6 +188,12 @@ class UsageMessage:
self
.
vllm_version
=
VLLM_VERSION
self
.
vllm_version
=
VLLM_VERSION
self
.
model_architecture
=
model_architecture
self
.
model_architecture
=
model_architecture
# Environment variables
self
.
env_var_json
=
json
.
dumps
({
env_var
:
getattr
(
envs
,
env_var
)
for
env_var
in
_USAGE_ENV_VARS_TO_COLLECT
})
# Metadata
# Metadata
self
.
log_time
=
_get_current_timestamp_ns
()
self
.
log_time
=
_get_current_timestamp_ns
()
self
.
source
=
envs
.
VLLM_USAGE_SOURCE
self
.
source
=
envs
.
VLLM_USAGE_SOURCE
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment