Unverified commit f7ac3949, authored by Nick Hill, committed by GitHub
Browse files

fix(router): Obey max batch size (#23)

parent e6d3eb5d
...@@ -127,7 +127,7 @@ async fn batching_task( ...@@ -127,7 +127,7 @@ async fn batching_task(
// Try to get a new batch // Try to get a new batch
if let Some((new_request_ids, new_batch)) = if let Some((new_request_ids, new_batch)) =
db.next_batch(min_size, max_batch_size) db.next_batch(min_size, max_batch_size - batch_size as usize)
{ {
// Generate one token for this new batch to have the attention past in cache // Generate one token for this new batch to have the attention past in cache
let new_cached_batch = let new_cached_batch =
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment