Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
8c3e1999
Unverified
Commit
8c3e1999
authored
Aug 29, 2025
by
Yong Hoon Shin
Committed by
GitHub
Aug 29, 2025
Browse files
Revert gemma3n fast prefill changes (#23897)
Signed-off-by:
Yong Hoon Shin
<
yhshin@meta.com
>
parent
1c26b422
Changes
3
Expand all
Show whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
67 additions
and
355 deletions
+67
-355
tests/v1/e2e/test_kv_sharing_fast_prefill.py
tests/v1/e2e/test_kv_sharing_fast_prefill.py
+1
-0
vllm/model_executor/models/gemma3n.py
vllm/model_executor/models/gemma3n.py
+65
-354
vllm/model_executor/models/gemma3n_mm.py
vllm/model_executor/models/gemma3n_mm.py
+1
-1
No files found.
tests/v1/e2e/test_kv_sharing_fast_prefill.py
View file @
8c3e1999
...
...
@@ -64,6 +64,7 @@ def cleanup(llm: LLM, compilation_config: CompilationConfig):
@
fork_new_process_for_each_test
@
pytest
.
mark
.
parametrize
(
"enforce_eager"
,
[
True
])
@
pytest
.
mark
.
skip
(
reason
=
"Disable until Gemma3n supports fast prefill"
)
def
test_kv_sharing_fast_prefill
(
monkeypatch
:
pytest
.
MonkeyPatch
,
enforce_eager
:
bool
,
...
...
vllm/model_executor/models/gemma3n.py
View file @
8c3e1999
This diff is collapsed.
Click to expand it.
vllm/model_executor/models/gemma3n_mm.py
View file @
8c3e1999
...
...
@@ -620,7 +620,7 @@ class Gemma3nForConditionalGeneration(nn.Module, SupportsMultiModal):
# NOTE (NickLucche) Each pass needs tokens to compute PLE so we cache
# them here, as the model forward has only access to the input_embeds.
if
input_ids
is
not
None
:
per_layer_inputs
=
self
.
language_model
.
model
.
self_decoder
.
get_per_layer_input_embeddings
(
per_layer_inputs
=
self
.
language_model
.
model
.
get_per_layer_input_embeddings
(
input_ids
)
per_layer_inputs
=
per_layer_inputs
.
reshape
(
-
1
,
self
.
config
.
text_config
.
num_hidden_layers
,
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment