Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
c721b814
Commit
c721b814
authored
Feb 05, 2026
by
zhuwenwen
Browse files
sync v0.15.1
parent
d53fe7e5
Changes
328
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
41 additions
and
45 deletions
+41
-45
vllm/model_executor/models/granitemoe.py
vllm/model_executor/models/granitemoe.py
+2
-2
vllm/model_executor/models/granitemoehybrid.py
vllm/model_executor/models/granitemoehybrid.py
+2
-2
vllm/model_executor/models/granitemoeshared.py
vllm/model_executor/models/granitemoeshared.py
+2
-2
vllm/model_executor/models/grok1.py
vllm/model_executor/models/grok1.py
+2
-2
vllm/model_executor/models/hunyuan_v1.py
vllm/model_executor/models/hunyuan_v1.py
+1
-1
vllm/model_executor/models/hunyuan_vision.py
vllm/model_executor/models/hunyuan_vision.py
+1
-1
vllm/model_executor/models/hyperclovax_vision.py
vllm/model_executor/models/hyperclovax_vision.py
+1
-1
vllm/model_executor/models/idefics3.py
vllm/model_executor/models/idefics3.py
+2
-2
vllm/model_executor/models/interfaces.py
vllm/model_executor/models/interfaces.py
+1
-5
vllm/model_executor/models/internlm2.py
vllm/model_executor/models/internlm2.py
+4
-4
vllm/model_executor/models/internlm2_ve.py
vllm/model_executor/models/internlm2_ve.py
+2
-2
vllm/model_executor/models/interns1.py
vllm/model_executor/models/interns1.py
+2
-2
vllm/model_executor/models/internvl.py
vllm/model_executor/models/internvl.py
+2
-2
vllm/model_executor/models/iquest_loopcoder.py
vllm/model_executor/models/iquest_loopcoder.py
+3
-3
vllm/model_executor/models/isaac.py
vllm/model_executor/models/isaac.py
+2
-2
vllm/model_executor/models/jais.py
vllm/model_executor/models/jais.py
+3
-3
vllm/model_executor/models/jais2.py
vllm/model_executor/models/jais2.py
+2
-2
vllm/model_executor/models/jamba.py
vllm/model_executor/models/jamba.py
+3
-3
vllm/model_executor/models/jina_vl.py
vllm/model_executor/models/jina_vl.py
+2
-2
vllm/model_executor/models/kanana_v.py
vllm/model_executor/models/kanana_v.py
+2
-2
No files found.
vllm/model_executor/models/granitemoe.py
View file @
c721b814
...
...
@@ -312,7 +312,7 @@ class GraniteMoeModel(nn.Module):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -528,7 +528,7 @@ class GraniteMoeForCausalLM(nn.Module, SupportsLoRA, SupportsPP):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
vllm/model_executor/models/granitemoehybrid.py
View file @
c721b814
...
...
@@ -368,7 +368,7 @@ class GraniteMoeHybridModel(nn.Module):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -685,7 +685,7 @@ class GraniteMoeHybridForCausalLM(
def
forward
(
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
vllm/model_executor/models/granitemoeshared.py
View file @
c721b814
...
...
@@ -183,7 +183,7 @@ class GraniteMoeSharedModel(nn.Module):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -295,7 +295,7 @@ class GraniteMoeSharedForCausalLM(nn.Module, SupportsLoRA, SupportsPP):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
vllm/model_executor/models/grok1.py
View file @
c721b814
...
...
@@ -491,7 +491,7 @@ class Grok1Model(nn.Module):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -705,7 +705,7 @@ class GrokBaseForCausalLM(nn.Module, SupportsLoRA, SupportsPP):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
vllm/model_executor/models/hunyuan_v1.py
View file @
c721b814
...
...
@@ -938,7 +938,7 @@ class HunyuanV1ModelBase(nn.Module, SupportsLoRA, SupportsPP):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
vllm/model_executor/models/hunyuan_vision.py
View file @
c721b814
...
...
@@ -968,7 +968,7 @@ class HunYuanVLForConditionalGeneration(
def
forward
(
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
,
inputs_embeds
:
torch
.
Tensor
|
None
,
...
...
vllm/model_executor/models/hyperclovax_vision.py
View file @
c721b814
...
...
@@ -747,7 +747,7 @@ class HCXVisionForCausalLM(nn.Module, SupportsMultiModal, SupportsPP):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
vllm/model_executor/models/idefics3.py
View file @
c721b814
...
...
@@ -559,7 +559,7 @@ class Idefics3Model(nn.Module):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -689,7 +689,7 @@ class Idefics3ForConditionalGeneration(nn.Module, SupportsMultiModal, SupportsLo
def
forward
(
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
vllm/model_executor/models/interfaces.py
View file @
c721b814
...
...
@@ -603,8 +603,6 @@ class SupportsPP(Protocol):
def
forward
(
self
,
input_ids
:
Tensor
|
None
,
positions
:
Tensor
,
*
,
intermediate_tensors
:
IntermediateTensors
|
None
,
)
->
IntermediateTensors
|
None
:
...
...
@@ -633,8 +631,6 @@ class _SupportsPPType(Protocol):
def
forward
(
self
,
input_ids
:
Tensor
|
None
,
positions
:
Tensor
,
*
,
intermediate_tensors
:
IntermediateTensors
|
None
,
)
->
Tensor
|
IntermediateTensors
:
...
...
...
@@ -1335,4 +1331,4 @@ def supports_xdrope(model: object) -> TypeIs[SupportsXDRoPE]: ...
def
supports_xdrope
(
model
:
type
[
object
]
|
object
,
)
->
TypeIs
[
type
[
SupportsXDRoPE
]]
|
TypeIs
[
SupportsXDRoPE
]:
return
isinstance
(
model
,
SupportsXDRoPE
)
return
isinstance
(
model
,
SupportsXDRoPE
)
\ No newline at end of file
vllm/model_executor/models/internlm2.py
View file @
c721b814
...
...
@@ -284,7 +284,7 @@ class InternLM2Model(nn.Module):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -350,7 +350,7 @@ class InternLM2ForCausalLM(nn.Module, SupportsPP, SupportsLoRA):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -446,7 +446,7 @@ class InternLM2ForRewardModel(InternLM2ForCausalLM):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -456,4 +456,4 @@ class InternLM2ForRewardModel(InternLM2ForCausalLM):
)
hidden_states
=
hidden_states
.
to
(
self
.
head_dtype
)
logits
=
self
.
v_head
(
hidden_states
)
return
logits
return
logits
\ No newline at end of file
vllm/model_executor/models/internlm2_ve.py
View file @
c721b814
...
...
@@ -101,7 +101,7 @@ class InternLM2VEModel(InternLM2Model):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -136,4 +136,4 @@ class InternLM2VEForCausalLM(InternLM2ForCausalLM):
def
__init__
(
self
,
*
,
vllm_config
:
VllmConfig
,
prefix
:
str
=
""
):
super
().
__init__
(
vllm_config
=
vllm_config
,
prefix
=
prefix
,
model_type
=
InternLM2VEModel
)
)
\ No newline at end of file
vllm/model_executor/models/interns1.py
View file @
c721b814
...
...
@@ -782,7 +782,7 @@ class InternS1ForConditionalGeneration(
def
forward
(
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -819,4 +819,4 @@ class InternS1ForConditionalGeneration(
language_model
=
"language_model"
,
connector
=
"multi_modal_projector"
,
tower_model
=
"vision_tower"
,
)
)
\ No newline at end of file
vllm/model_executor/models/internvl.py
View file @
c721b814
...
...
@@ -1371,7 +1371,7 @@ class InternVLChatModel(nn.Module, SupportsMultiModal, SupportsPP, SupportsLoRA)
def
forward
(
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -1442,4 +1442,4 @@ class InternVLChatModel(nn.Module, SupportsMultiModal, SupportsPP, SupportsLoRA)
return
0
num_patches
=
num_vision_tokens
//
(
self
.
patch_tokens
+
1
)
return
num_patches
*
self
.
num_image_token
return
num_patches
*
self
.
num_image_token
\ No newline at end of file
vllm/model_executor/models/iquest_loopcoder.py
View file @
c721b814
...
...
@@ -438,7 +438,7 @@ class IQuestLoopCoderModel(nn.Module):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -570,7 +570,7 @@ class IQuestLoopCoderForCausalLM(nn.Module):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -592,4 +592,4 @@ class IQuestLoopCoderForCausalLM(nn.Module):
self
,
skip_prefixes
=
([
"lm_head."
]
if
self
.
config
.
tie_word_embeddings
else
None
),
)
return
loader
.
load_weights
(
weights
)
return
loader
.
load_weights
(
weights
)
\ No newline at end of file
vllm/model_executor/models/isaac.py
View file @
c721b814
...
...
@@ -1450,7 +1450,7 @@ class IsaacForConditionalGeneration(
def
forward
(
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -1479,4 +1479,4 @@ class IsaacForConditionalGeneration(
language_model
=
"language_model"
,
connector
=
"vision_embedding.linear_fc2"
,
# The final linear layer
tower_model
=
"vision_embedding"
,
)
)
\ No newline at end of file
vllm/model_executor/models/jais.py
View file @
c721b814
...
...
@@ -280,7 +280,7 @@ class JAISModel(nn.Module):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
position_ids
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -344,7 +344,7 @@ class JAISLMHeadModel(nn.Module, SupportsPP):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -394,4 +394,4 @@ class JAISLMHeadModel(nn.Module, SupportsPP):
weight_loader
=
getattr
(
param
,
"weight_loader"
,
default_weight_loader
)
weight_loader
(
param
,
loaded_weight
)
loaded_params
.
add
(
name
)
return
loaded_params
return
loaded_params
\ No newline at end of file
vllm/model_executor/models/jais2.py
View file @
c721b814
...
...
@@ -483,7 +483,7 @@ class Jais2ForCausalLM(nn.Module, SupportsLoRA, SupportsPP):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -505,4 +505,4 @@ class Jais2ForCausalLM(nn.Module, SupportsLoRA, SupportsPP):
self
,
skip_prefixes
=
([
"lm_head."
]
if
self
.
config
.
tie_word_embeddings
else
None
),
)
return
loader
.
load_weights
(
weights
)
return
loader
.
load_weights
(
weights
)
\ No newline at end of file
vllm/model_executor/models/jamba.py
View file @
c721b814
...
...
@@ -348,7 +348,7 @@ class JambaModel(nn.Module):
def
forward
(
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -516,7 +516,7 @@ class JambaForCausalLM(
def
forward
(
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -602,4 +602,4 @@ class JambaForSequenceClassification(JambaForCausalLM):
pooler_config
=
vllm_config
.
model_config
.
pooler_config
assert
pooler_config
is
not
None
self
.
pooler
=
DispatchPooler
.
for_seq_cls
(
pooler_config
,
classifier
=
self
.
score
)
self
.
pooler
=
DispatchPooler
.
for_seq_cls
(
pooler_config
,
classifier
=
self
.
score
)
\ No newline at end of file
vllm/model_executor/models/jina_vl.py
View file @
c721b814
...
...
@@ -125,7 +125,7 @@ class JinaVLForSequenceClassification(
def
forward
(
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -142,4 +142,4 @@ class JinaVLForSequenceClassification(
def
load_weights
(
self
,
weights
:
Iterable
[
tuple
[
str
,
torch
.
Tensor
]]):
loader
=
AutoWeightsLoader
(
self
)
return
loader
.
load_weights
(
weights
,
mapper
=
self
.
weight_mapper
)
return
loader
.
load_weights
(
weights
,
mapper
=
self
.
weight_mapper
)
\ No newline at end of file
vllm/model_executor/models/kanana_v.py
View file @
c721b814
...
...
@@ -732,7 +732,7 @@ class KananaVForConditionalGeneration(nn.Module, SupportsMultiModal, SupportsPP)
def
forward
(
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
...
@@ -755,4 +755,4 @@ class KananaVForConditionalGeneration(nn.Module, SupportsMultiModal, SupportsPP)
def
load_weights
(
self
,
weights
:
Iterable
[
tuple
[
str
,
torch
.
Tensor
]])
->
set
[
str
]:
loader
=
AutoWeightsLoader
(
self
)
return
loader
.
load_weights
(
weights
)
return
loader
.
load_weights
(
weights
)
\ No newline at end of file
Prev
1
…
7
8
9
10
11
12
13
14
15
…
17
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment