Unverified commit 3577b5c1, authored by Neelay Shah, committed by GitHub
Browse files

chore: Improve prefill router error reporting and fix typo (#4220)


Co-authored-by: Claude <noreply@anthropic.com>
parent 7802f969
...@@ -249,7 +249,10 @@ impl ...@@ -249,7 +249,10 @@ impl
next.generate(decode_request).await next.generate(decode_request).await
} }
Err(e) => { Err(e) => {
tracing::debug!(error = %e, "Remote prefill failed, falling back to decode-only"); tracing::warn!(
error = %e,
"Remote prefill failed, falling back to decode-only. This may impact performance in disaggregated deployments. Verify prefill workers are healthy and accessible."
);
next.generate(context.map(|_| req)).await next.generate(context.map(|_| req)).await
} }
} }
......
...@@ -42,7 +42,7 @@ pub struct PotentialLoad { ...@@ -42,7 +42,7 @@ pub struct PotentialLoad {
#[derive(Debug, thiserror::Error)] #[derive(Debug, thiserror::Error)]
pub enum KvSchedulerError { pub enum KvSchedulerError {
#[error("no endpoints aviailable to route work")] #[error("no endpoints available to route work")]
NoEndpoints, NoEndpoints,
#[error("all workers busy")] #[error("all workers busy")]
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment