Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
552cac95
Unverified
Commit
552cac95
authored
Nov 17, 2025
by
Zhuohan Li
Committed by
GitHub
Nov 17, 2025
Browse files
[Misc] Fix wrong comment in scheduler (#28880)
Signed-off-by: Zhuohan Li <zhuohan123@gmail.com>
parent
61485844
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing 1 changed file with 4 additions and 4 deletions
+4
-4
vllm/v1/core/sched/scheduler.py
vllm/v1/core/sched/scheduler.py
+4
-4
No files found.
vllm/v1/core/sched/scheduler.py
View file @
552cac95
...
@@ -472,9 +472,9 @@ class Scheduler(SchedulerInterface):
         num_computed_tokens = (
             num_new_local_computed_tokens + num_external_computed_tokens
         )
-    # KVTransfer: WAITING reqs have num_computed_tokens > 0
-    # after async KV recvs are completed.
     else:
+        # KVTransfer: WAITING reqs have num_computed_tokens > 0
+        # after async KV recvs are completed.
         new_computed_blocks = self.kv_cache_manager.empty_kv_cache_blocks
         num_new_local_computed_tokens = 0
         num_computed_tokens = request.num_computed_tokens
...
@@ -483,12 +483,12 @@ class Scheduler(SchedulerInterface):
     external_load_encoder_input = []
     new_encoder_compute_budget = encoder_compute_budget
-    # KVTransfer: loading remote KV, do not allocate for new work.
     if load_kv_async:
+        # KVTransfer: loading remote KV, do not allocate for new work.
         assert num_external_computed_tokens > 0
         num_new_tokens = 0
-    # Number of tokens to be scheduled.
     else:
+        # Number of tokens to be scheduled.
         # We use `request.num_tokens` instead of
         # `request.num_prompt_tokens` to consider the resumed
         # requests, which have output tokens.
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please register or sign in to comment