Commit 2b1be0e8 authored by jujl1
Browse files

fix: 解决原版0消耗chunk-prefill崩溃问题

parent 9f68733a
...@@ -796,6 +796,7 @@ class V1ZeroModelRunner(GPUModelRunner): ...@@ -796,6 +796,7 @@ class V1ZeroModelRunner(GPUModelRunner):
req_state = self.requests[req_id] req_state = self.requests[req_id]
token_idx = self.last_sampled_token_lens[req_idx] token_idx = self.last_sampled_token_lens[req_idx]
if token_idx == -1: if token_idx == -1:
self.fix_sampled_token_ids[req_idx].clear()
continue continue
fix_len = len(self.fix_sampled_token_ids[req_idx]) fix_len = len(self.fix_sampled_token_ids[req_idx])
req_state.output_token_ids[token_idx:token_idx + fix_len] = self.fix_sampled_token_ids[req_idx] req_state.output_token_ids[token_idx:token_idx + fix_len] = self.fix_sampled_token_ids[req_idx]
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment