Unverified commit 0e4fffbc, authored by Piotr Marcinkiewicz, committed by GitHub
Browse files

fix: Change default vLLM router to round-robin (#597)

parent 12f72a42
...@@ -28,7 +28,7 @@ def parse_vllm_args(service_name, prefix) -> AsyncEngineArgs: ...@@ -28,7 +28,7 @@ def parse_vllm_args(service_name, prefix) -> AsyncEngineArgs:
"--router", "--router",
type=str, type=str,
choices=["random", "round-robin", "kv"], choices=["random", "round-robin", "kv"],
default="random", default="round-robin",
help="Router type to use for scheduling requests to workers", help="Router type to use for scheduling requests to workers",
) )
parser.add_argument( parser.add_argument(
......
...@@ -102,8 +102,8 @@ pub struct Flags { ...@@ -102,8 +102,8 @@ pub struct Flags {
/// If using `out=dyn://..` with multiple backends, this says how to route the requests. /// If using `out=dyn://..` with multiple backends, this says how to route the requests.
/// ///
/// Mostly interesting for KV-aware routing. /// Mostly interesting for KV-aware routing.
/// Defaults to RouterMode::Random /// Defaults to RouterMode::RoundRobin
#[arg(long, default_value = "random")] #[arg(long, default_value = "round-robin")]
pub router_mode: RouterMode, pub router_mode: RouterMode,
/// Internal use only. /// Internal use only.
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment