Commit 5208b291 authored by jujl1
Browse files

fix: 解决列表访问越界

parent bc945a5a
...@@ -72,6 +72,8 @@ def zero_overhead_update_from_output(scheduler:Scheduler, ...@@ -72,6 +72,8 @@ def zero_overhead_update_from_output(scheduler:Scheduler,
continue continue
request = scheduler.requests[req_id] request = scheduler.requests[req_id]
generated_token_ids = model_runner_output.fix_sampled_token_ids[req_idx] generated_token_ids = model_runner_output.fix_sampled_token_ids[req_idx]
if not generated_token_ids:
continue
if req_id not in requsets_valid_token_len: if req_id not in requsets_valid_token_len:
requsets_valid_token_len[req_id] = 0 requsets_valid_token_len[req_id] = 0
valid_output_len = requsets_valid_token_len[req_id] valid_output_len = requsets_valid_token_len[req_id]
......
...@@ -705,6 +705,7 @@ class V1ZeroModelRunner(GPUModelRunner): ...@@ -705,6 +705,7 @@ class V1ZeroModelRunner(GPUModelRunner):
self.fix_sampled_token_ids = self.last_sampler_host_tokens.tolist() self.fix_sampled_token_ids = self.last_sampler_host_tokens.tolist()
for req_idx, start_idx, end_idx in self.token_ids_cpu_fix_record: for req_idx, start_idx, end_idx in self.token_ids_cpu_fix_record:
if start_idx == -1: if start_idx == -1:
self.fix_sampled_token_ids[req_idx].clear()
continue continue
req_id = self.fix_req_ids[req_idx] req_id = self.fix_req_ids[req_idx]
if req_id in self.input_batch.req_ids: if req_id in self.input_batch.req_ids:
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment