Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
eefa41c1
Commit
eefa41c1
authored
Mar 24, 2026
by
zhuwenwen
Browse files
sync v0.18.0
parent
82155c76
Changes
253
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
39 additions
and
40 deletions
+39
-40
vllm/model_executor/models/mixtral.py
vllm/model_executor/models/mixtral.py
+2
-2
vllm/model_executor/models/mllama4.py
vllm/model_executor/models/mllama4.py
+2
-2
vllm/model_executor/models/modernbert.py
vllm/model_executor/models/modernbert.py
+4
-5
vllm/model_executor/models/molmo.py
vllm/model_executor/models/molmo.py
+1
-1
vllm/model_executor/models/molmo2.py
vllm/model_executor/models/molmo2.py
+1
-1
vllm/model_executor/models/mpt.py
vllm/model_executor/models/mpt.py
+2
-2
vllm/model_executor/models/nano_nemotron_vl.py
vllm/model_executor/models/nano_nemotron_vl.py
+3
-3
vllm/model_executor/models/nemotron.py
vllm/model_executor/models/nemotron.py
+1
-1
vllm/model_executor/models/nemotron_h.py
vllm/model_executor/models/nemotron_h.py
+2
-2
vllm/model_executor/models/nemotron_nas.py
vllm/model_executor/models/nemotron_nas.py
+1
-1
vllm/model_executor/models/nemotron_parse.py
vllm/model_executor/models/nemotron_parse.py
+2
-2
vllm/model_executor/models/nemotron_vl.py
vllm/model_executor/models/nemotron_vl.py
+2
-2
vllm/model_executor/models/olmo.py
vllm/model_executor/models/olmo.py
+2
-2
vllm/model_executor/models/olmo2.py
vllm/model_executor/models/olmo2.py
+2
-2
vllm/model_executor/models/olmoe.py
vllm/model_executor/models/olmoe.py
+2
-2
vllm/model_executor/models/openpangu.py
vllm/model_executor/models/openpangu.py
+2
-2
vllm/model_executor/models/openpangu_mtp.py
vllm/model_executor/models/openpangu_mtp.py
+1
-1
vllm/model_executor/models/opt.py
vllm/model_executor/models/opt.py
+3
-3
vllm/model_executor/models/orion.py
vllm/model_executor/models/orion.py
+2
-2
vllm/model_executor/models/ouro.py
vllm/model_executor/models/ouro.py
+2
-2
No files found.
vllm/model_executor/models/mixtral.py
View file @
eefa41c1
...
...
@@ -338,7 +338,7 @@ class MixtralModel(nn.Module):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
,
input_ids
:
torch
.
Tensor
|
None
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -574,7 +574,7 @@ class MixtralForCausalLM(nn.Module, SupportsLoRA, SupportsPP, MixtureOfExperts):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
,
input_ids
:
torch
.
Tensor
|
None
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
vllm/model_executor/models/mllama4.py
View file @
eefa41c1
...
...
@@ -875,7 +875,7 @@ class Llama4ForConditionalGeneration(
def
forward
(
self
,
input_ids
:
torch
.
Tensor
,
input_ids
:
torch
.
Tensor
|
None
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -1157,4 +1157,4 @@ class Llama4ForConditionalGeneration(
return
0
num_chunks
=
num_vision_tokens
//
(
raw_patches
+
1
)
patches_per_chunk
=
Mllama4ProcessingInfo
.
get_patch_per_chunk
(
vision_config
)
return
num_chunks
*
patches_per_chunk
return
num_chunks
*
patches_per_chunk
\ No newline at end of file
vllm/model_executor/models/modernbert.py
View file @
eefa41c1
...
...
@@ -54,12 +54,11 @@ class ModernBertEmbeddings(nn.Module):
input_ids
:
torch
.
Tensor
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
)
->
torch
.
Tensor
:
if
inputs_embeds
is
not
None
:
return
self
.
norm
(
inputs_embeds
)
else
:
if
inputs_embeds
is
None
:
inputs_embeds
=
self
.
tok_embeddings
(
input_ids
)
embeddings
=
self
.
norm
(
inputs_embeds
)
return
embeddings
embeddings
=
self
.
norm
(
inputs_embeds
)
return
embeddings
class
ModernBertAttention
(
nn
.
Module
):
...
...
vllm/model_executor/models/molmo.py
View file @
eefa41c1
...
...
@@ -876,7 +876,7 @@ class MolmoModel(nn.Module, SupportsQuant):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
,
input_ids
:
torch
.
Tensor
|
None
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
vllm/model_executor/models/molmo2.py
View file @
eefa41c1
...
...
@@ -1206,7 +1206,7 @@ class Molmo2TextModel(nn.Module, SupportsQuant):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
,
input_ids
:
torch
.
Tensor
|
None
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
vllm/model_executor/models/mpt.py
View file @
eefa41c1
...
...
@@ -253,7 +253,7 @@ class MPTModel(nn.Module):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
,
input_ids
:
torch
.
Tensor
|
None
,
position_ids
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -313,7 +313,7 @@ class MPTForCausalLM(nn.Module, SupportsPP):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
,
input_ids
:
torch
.
Tensor
|
None
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
vllm/model_executor/models/nano_nemotron_vl.py
View file @
eefa41c1
...
...
@@ -2293,7 +2293,7 @@ class NemotronH_Nano_VL_V2(
def
forward
(
self
,
input_ids
:
torch
.
Tensor
,
input_ids
:
torch
.
Tensor
|
None
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -2359,7 +2359,7 @@ class NemotronH_Nano_VL_V2(
with
torch
.
no_grad
():
default_weight_loader
(
param
,
w
)
elif
is_vision_weights
(
name
):
# Convert: vision_model.radio_model.*
→
radio_model.*
# Convert: vision_model.radio_model.*
→
radio_model.*
hf_key
=
name
[
len
(
"vision_model."
)
:]
# Remove "vision_model." prefix
vision_weights
.
append
((
hf_key
,
w
))
elif
is_sound_weights
(
name
):
...
...
@@ -2419,4 +2419,4 @@ class NemotronH_Nano_VL_V2(
@
classmethod
def
get_mamba_state_copy_func
(
cls
):
return
NemotronHForCausalLM
.
get_mamba_state_copy_func
()
return
NemotronHForCausalLM
.
get_mamba_state_copy_func
()
\ No newline at end of file
vllm/model_executor/models/nemotron.py
View file @
eefa41c1
...
...
@@ -477,7 +477,7 @@ class NemotronForCausalLM(nn.Module, SupportsLoRA, SupportsPP):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
,
input_ids
:
torch
.
Tensor
|
None
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
vllm/model_executor/models/nemotron_h.py
View file @
eefa41c1
...
...
@@ -608,7 +608,7 @@ class NemotronHModel(nn.Module):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
,
input_ids
:
torch
.
Tensor
|
None
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -933,7 +933,7 @@ class NemotronHForCausalLM(
def
forward
(
self
,
input_ids
:
torch
.
Tensor
,
input_ids
:
torch
.
Tensor
|
None
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
vllm/model_executor/models/nemotron_nas.py
View file @
eefa41c1
...
...
@@ -453,7 +453,7 @@ class DeciLMForCausalLM(nn.Module, SupportsLoRA, SupportsPP, HasNoOps):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
,
input_ids
:
torch
.
Tensor
|
None
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
vllm/model_executor/models/nemotron_parse.py
View file @
eefa41c1
...
...
@@ -290,7 +290,7 @@ class MBartDecoderNoPos(nn.Module):
def
forward
(
self
,
decoder_input_ids
:
torch
.
Tensor
,
decoder_input_ids
:
torch
.
Tensor
|
None
,
*
,
encoder_hidden_states
:
torch
.
Tensor
|
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -901,7 +901,7 @@ class NemotronParseForConditionalGeneration(nn.Module, SupportsMultiModal):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
,
input_ids
:
torch
.
Tensor
|
None
,
positions
:
torch
.
Tensor
,
encoder_outputs
:
list
[
torch
.
Tensor
]
|
None
=
None
,
**
kwargs
,
...
...
vllm/model_executor/models/nemotron_vl.py
View file @
eefa41c1
...
...
@@ -644,7 +644,7 @@ class LlamaNemotronVLChatModel(nn.Module, SupportsMultiModal, SupportsPP, Suppor
def
forward
(
self
,
input_ids
:
torch
.
Tensor
,
input_ids
:
torch
.
Tensor
|
None
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -941,4 +941,4 @@ class LlamaNemotronVLForSequenceClassification(
loaded_weights
.
add
(
name
)
return
loaded_weights
return
loaded_weights
\ No newline at end of file
vllm/model_executor/models/olmo.py
View file @
eefa41c1
...
...
@@ -271,7 +271,7 @@ class OlmoModel(nn.Module):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
,
input_ids
:
torch
.
Tensor
|
None
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -382,7 +382,7 @@ class OlmoForCausalLM(nn.Module, SupportsPP, SupportsLoRA):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
,
input_ids
:
torch
.
Tensor
|
None
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
vllm/model_executor/models/olmo2.py
View file @
eefa41c1
...
...
@@ -309,7 +309,7 @@ class Olmo2Model(nn.Module):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
,
input_ids
:
torch
.
Tensor
|
None
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -424,7 +424,7 @@ class Olmo2ForCausalLM(nn.Module, SupportsPP, SupportsLoRA):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
,
input_ids
:
torch
.
Tensor
|
None
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
vllm/model_executor/models/olmoe.py
View file @
eefa41c1
...
...
@@ -300,7 +300,7 @@ class OlmoeModel(nn.Module):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
,
input_ids
:
torch
.
Tensor
|
None
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -476,7 +476,7 @@ class OlmoeForCausalLM(nn.Module, SupportsPP, SupportsLoRA):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
,
input_ids
:
torch
.
Tensor
|
None
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
vllm/model_executor/models/openpangu.py
View file @
eefa41c1
...
...
@@ -1062,7 +1062,7 @@ class OpenPanguModel(nn.Module):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
,
input_ids
:
torch
.
Tensor
|
None
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -1292,7 +1292,7 @@ class OpenPanguModelBase(nn.Module, SupportsPP, SupportsLoRA):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
,
input_ids
:
torch
.
Tensor
|
None
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
vllm/model_executor/models/openpangu_mtp.py
View file @
eefa41c1
...
...
@@ -104,7 +104,7 @@ class OpenPanguMTP(nn.Module):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
,
input_ids
:
torch
.
Tensor
|
None
,
positions
:
torch
.
Tensor
,
hidden_states
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
...
...
vllm/model_executor/models/opt.py
View file @
eefa41c1
...
...
@@ -267,7 +267,7 @@ class OPTDecoder(nn.Module):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
,
input_ids
:
torch
.
Tensor
|
None
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -316,7 +316,7 @@ class OPTModel(nn.Module):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
,
input_ids
:
torch
.
Tensor
|
None
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -399,7 +399,7 @@ class OPTForCausalLM(nn.Module, SupportsPP, SupportsLoRA):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
,
input_ids
:
torch
.
Tensor
|
None
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
vllm/model_executor/models/orion.py
View file @
eefa41c1
...
...
@@ -253,7 +253,7 @@ class OrionModel(nn.Module):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
,
input_ids
:
torch
.
Tensor
|
None
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -343,7 +343,7 @@ class OrionForCausalLM(nn.Module, SupportsPP):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
,
input_ids
:
torch
.
Tensor
|
None
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
vllm/model_executor/models/ouro.py
View file @
eefa41c1
...
...
@@ -357,7 +357,7 @@ class OuroModel(nn.Module):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
,
input_ids
:
torch
.
Tensor
|
None
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -482,7 +482,7 @@ class OuroForCausalLM(nn.Module, SupportsLoRA):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
,
input_ids
:
torch
.
Tensor
|
None
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
Prev
1
…
6
7
8
9
10
11
12
13
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment