Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
bf790acd
Commit
bf790acd
authored
May 26, 2025
by
lizhigong
Browse files
Debug and fix TBO (two-batch overlap) error in MTP
parent
385eeae9
Changes
2
Show whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
5 additions
and
5 deletions
+5
-5
vllm/two_batch_overlap/model_input_split.py
vllm/two_batch_overlap/model_input_split.py
+1
-1
vllm/two_batch_overlap/two_batch_overlap.py
vllm/two_batch_overlap/two_batch_overlap.py
+4
-4
No files found.
vllm/two_batch_overlap/model_input_split.py
View file @
bf790acd
...
...
@@ -102,7 +102,7 @@ def split_model_input(model_input, self_device, batch_size_left, batch_size_righ
     previous_hidden_states_left = None
     previous_hidden_states_right = None
     if model_input.previous_hidden_states != None:
-        split_previous_hidden_states = torch.split(model_input.previous_hidden_states, batch_size_split, dim=0)
+        split_previous_hidden_states = torch.split(model_input.previous_hidden_states, query_tokens_split, dim=0)
         previous_hidden_states_left = split_previous_hidden_states[0]
         previous_hidden_states_right = split_previous_hidden_states[1]
...
...
vllm/two_batch_overlap/two_batch_overlap.py
View file @
bf790acd
...
...
@@ -250,12 +250,12 @@ def tbo_model_executable(
     model_input_left, model_input_right = split_model_input(model_input, self_device, batch_size_left, batch_size_right)
-    model_kwargs_left = model_kwargs
-    model_kwargs_right = model_kwargs
+    model_kwargs_left = model_kwargs.copy()
+    model_kwargs_right = model_kwargs.copy()
     if "previous_hidden_states" in model_kwargs:
         previous_hidden_states = model_kwargs["previous_hidden_states"]
-        batch_size_split = [batch_size_left, batch_size_right]
-        split_previous_hidden_states = torch.split(previous_hidden_states, batch_size_split, dim=0)
+        query_tokens_split = [sum(model_input.query_lens[0:batch_size_left]), sum(model_input.query_lens[batch_size_left:])]
+        split_previous_hidden_states = torch.split(previous_hidden_states, query_tokens_split, dim=0)
         model_kwargs_left["previous_hidden_states"] = split_previous_hidden_states[0]
         model_kwargs_right["previous_hidden_states"] = split_previous_hidden_states[1]
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment