Unverified commit ced35a06, authored by Thysrael, committed by GitHub
Browse files

fix(typo): fix `reply` to `replay` in `base_attn_backend.py` (#4784)

parent 26f07294
...@@ -47,7 +47,7 @@ class AttentionBackend(ABC): ...@@ -47,7 +47,7 @@ class AttentionBackend(ABC):
spec_info: Optional[Union[EagleDraftInput, EagleVerifyInput]], spec_info: Optional[Union[EagleDraftInput, EagleVerifyInput]],
seq_lens_cpu: Optional[torch.Tensor], seq_lens_cpu: Optional[torch.Tensor],
): ):
"""Init the metadata for a forward pass for replying a cuda graph.""" """Init the metadata for a forward pass for replaying a cuda graph."""
raise NotImplementedError() raise NotImplementedError()
def get_cuda_graph_seq_len_fill_value(self): def get_cuda_graph_seq_len_fill_value(self):
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment