"vscode:/vscode.git/clone" did not exist on "b7e62d3454afc807ddcc2fe3a56ce075461f1bc4"
Commit 639a11d2 authored by 王敏
Browse files

[fix]解决EP开启pd_padding大输入卡住问题

parent 82cd3c88
......@@ -226,8 +226,8 @@ class EagleProposer:
with set_forward_context(per_layer_attn_metadata,
self.vllm_config,
num_tokens=num_input_tokens,
skip_cuda_graphs=not decoding):
num_tokens=num_input_tokens):
#skip_cuda_graphs=not decoding):
ret_hidden_states = self.model(
self.input_ids[:num_input_tokens],
self.positions[:num_input_tokens],
......
......@@ -150,8 +150,8 @@ class V1ZeroEagleProposer(EagleProposer):
with set_forward_context(per_layer_attn_metadata,
self.vllm_config,
num_tokens=num_input_tokens,
skip_cuda_graphs=not decoding):
num_tokens=num_input_tokens,):
#skip_cuda_graphs=not decoding):
ret_hidden_states = self.model(
self.input_ids[:num_input_tokens],
self.positions[:num_input_tokens],
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment