"vllm/vscode:/vscode.git/clone" did not exist on "7090c27bb2cb0d9c4e0acd644e484291df3aff2a"
Unverified commit 006aea17, authored by Woosuk Kwon, committed by GitHub
Browse files

[BugFix] Remove incorrect assert in split_decodes_and_prefills (#36553)


Signed-off-by: Woosuk Kwon <woosuk@inferact.ai>
parent 0836be3b
...@@ -528,7 +528,6 @@ def split_decodes_and_prefills( ...@@ -528,7 +528,6 @@ def split_decodes_and_prefills(
# requests may have a query length of 0 but since they are padding its fine # requests may have a query length of 0 but since they are padding its fine
# to treat them as decodes (ensures num_decodes matches the captured size) # to treat them as decodes (ensures num_decodes matches the captured size)
if torch.all((query_lens == query_lens[0]) | (query_lens == 0)): if torch.all((query_lens == query_lens[0]) | (query_lens == 0)):
assert num_reqs * query_lens[0] == num_tokens, "tokens not padded correctly"
return num_reqs, 0, num_tokens, 0 # all decodes return num_reqs, 0, num_tokens, 0 # all decodes
is_prefill = query_lens != query_lens[0] is_prefill = query_lens != query_lens[0]
else: else:
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment