Unverified commit 0e4fffbc, authored by Piotr Marcinkiewicz, committed by GitHub
Browse files

fix: Change default vLLM router to round-robin (#597)

parent 12f72a42
......@@ -28,7 +28,7 @@ def parse_vllm_args(service_name, prefix) -> AsyncEngineArgs:
"--router",
type=str,
choices=["random", "round-robin", "kv"],
-default="random",
+default="round-robin",
help="Router type to use for scheduling requests to workers",
)
parser.add_argument(
......
......@@ -102,8 +102,8 @@ pub struct Flags {
/// If using `out=dyn://..` with multiple backends, this says how to route the requests.
///
/// Mostly interesting for KV-aware routing.
-/// Defaults to RouterMode::Random
-#[arg(long, default_value = "random")]
+/// Defaults to RouterMode::RoundRobin
+#[arg(long, default_value = "round-robin")]
pub router_mode: RouterMode,
/// Internal use only.
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment