"git@developer.sourcefind.cn:renzhc/diffusers_dcu.git" did not exist on "df55f0535829e2a1348062f85c7483fb51197102"
Unverified Commit 718c391f authored by Wenxuan Tan's avatar Wenxuan Tan Committed by GitHub
Browse files

[Hoxfix] Fix incomplete token_to_kv_pool refactor (#4121)

parent fc671f66
...@@ -484,7 +484,7 @@ class Scheduler: ...@@ -484,7 +484,7 @@ class Scheduler:
logger.error( logger.error(
f"{self.cur_batch.batch_size()=}, " f"{self.cur_batch.batch_size()=}, "
f"{self.cur_batch.reqs=}, " f"{self.cur_batch.reqs=}, "
f"{self.token_to_kv_pool.available_size()=}, " f"{self.token_to_kv_pool_allocator.available_size()=}, "
f"{self.tree_cache.evictable_size()=}, " f"{self.tree_cache.evictable_size()=}, "
) )
# Wait for some time so that the parent process can print the error. # Wait for some time so that the parent process can print the error.
...@@ -932,7 +932,7 @@ class Scheduler: ...@@ -932,7 +932,7 @@ class Scheduler:
): ):
# During idle time, also collect metrics every 30 seconds. # During idle time, also collect metrics every 30 seconds.
num_used = self.max_total_num_tokens - ( num_used = self.max_total_num_tokens - (
self.token_to_kv_pool.available_size() self.token_to_kv_pool_allocator.available_size()
+ self.tree_cache.evictable_size() + self.tree_cache.evictable_size()
) )
num_running_reqs = len(self.running_batch.reqs) if self.running_batch else 0 num_running_reqs = len(self.running_batch.reqs) if self.running_batch else 0
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment