Unverified commit bd4366d0, authored by jthomson04 and committed by GitHub
Browse files

fix: Fix warning messages with healthcheck (#4793)


Signed-off-by: jthomson04 <jwillthomson19@gmail.com>
parent 3e4b480b
...@@ -67,15 +67,14 @@ class VllmHealthCheckPayload(HealthCheckPayload): ...@@ -67,15 +67,14 @@ class VllmHealthCheckPayload(HealthCheckPayload):
self.default_payload = { self.default_payload = {
"token_ids": [bos_token_id], "token_ids": [bos_token_id],
"sampling_options": { "sampling_options": {
"max_tokens": 1,
"temperature": 0.0, "temperature": 0.0,
}, },
"stop_conditions": { "stop_conditions": {
"max_tokens": 1,
"stop": None, "stop": None,
"stop_token_ids": None, "stop_token_ids": None,
"include_stop_str_in_output": False, "include_stop_str_in_output": False,
"ignore_eos": False, "ignore_eos": False,
"min_tokens": 0,
}, },
} }
super().__init__() super().__init__()
......
...@@ -303,6 +303,11 @@ impl HealthCheckManager { ...@@ -303,6 +303,11 @@ impl HealthCheckManager {
false false
}; };
tokio::spawn(async move {
// We need to consume the rest of the stream to avoid warnings on the frontend.
response_stream.for_each(|_| async {}).await;
});
// Update health status based on response // Update health status based on response
system_health.lock().set_endpoint_health_status( system_health.lock().set_endpoint_health_status(
&endpoint_subject_owned, &endpoint_subject_owned,
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment