Unverified commit 7c162fa9, authored by Liangsheng Yin, committed by GitHub
Browse files

Fix schedule bug (#1451)

parent 36078fb2
......@@ -229,6 +229,7 @@ class PrefillAdder:
else:
add_req_state(req, insert_sort=True)
cur_rem_tokens = self.cur_rem_tokens - len(req.origin_input_ids)
tokens_freed = 0
for i, (tokens_left, tokens_occupied) in enumerate(self.req_states):
decode_steps = (
......@@ -237,7 +238,7 @@ class PrefillAdder:
else tokens_left
)
bs = len(self.req_states) - i
if self.cur_rem_tokens + tokens_freed - decode_steps * bs <= 0:
if cur_rem_tokens + tokens_freed - decode_steps * bs <= 0:
return False
tokens_freed += tokens_occupied
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment