Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
df704163
Commit
df704163
authored
Feb 06, 2026
by
zhuwenwen
Browse files
sync v0.15.1 (models)
parent
d7db129a
Changes
169
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
48 additions
and
58 deletions
+48
-58
vllm/model_executor/models/granitemoe.py
vllm/model_executor/models/granitemoe.py
+3
-3
vllm/model_executor/models/granitemoehybrid.py
vllm/model_executor/models/granitemoehybrid.py
+3
-3
vllm/model_executor/models/granitemoeshared.py
vllm/model_executor/models/granitemoeshared.py
+3
-3
vllm/model_executor/models/grok1.py
vllm/model_executor/models/grok1.py
+3
-3
vllm/model_executor/models/hunyuan_v1.py
vllm/model_executor/models/hunyuan_v1.py
+2
-2
vllm/model_executor/models/hunyuan_vision.py
vllm/model_executor/models/hunyuan_vision.py
+2
-2
vllm/model_executor/models/hyperclovax_vision.py
vllm/model_executor/models/hyperclovax_vision.py
+2
-2
vllm/model_executor/models/idefics3.py
vllm/model_executor/models/idefics3.py
+3
-3
vllm/model_executor/models/interfaces.py
vllm/model_executor/models/interfaces.py
+1
-9
vllm/model_executor/models/intern_vit.py
vllm/model_executor/models/intern_vit.py
+1
-3
vllm/model_executor/models/internlm2.py
vllm/model_executor/models/internlm2.py
+4
-4
vllm/model_executor/models/internlm2_ve.py
vllm/model_executor/models/internlm2_ve.py
+2
-2
vllm/model_executor/models/interns1.py
vllm/model_executor/models/interns1.py
+2
-2
vllm/model_executor/models/internvl.py
vllm/model_executor/models/internvl.py
+2
-2
vllm/model_executor/models/iquest_loopcoder.py
vllm/model_executor/models/iquest_loopcoder.py
+3
-3
vllm/model_executor/models/isaac.py
vllm/model_executor/models/isaac.py
+2
-2
vllm/model_executor/models/jais.py
vllm/model_executor/models/jais.py
+3
-3
vllm/model_executor/models/jais2.py
vllm/model_executor/models/jais2.py
+2
-2
vllm/model_executor/models/jamba.py
vllm/model_executor/models/jamba.py
+3
-3
vllm/model_executor/models/jina_vl.py
vllm/model_executor/models/jina_vl.py
+2
-2
No files found.
vllm/model_executor/models/granitemoe.py
View file @
df704163
...
@@ -312,7 +312,7 @@ class GraniteMoeModel(nn.Module):
...
@@ -312,7 +312,7 @@ class GraniteMoeModel(nn.Module):
def
forward
(
def
forward
(
self
,
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
,
intermediate_tensors
:
IntermediateTensors
|
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
@@ -528,7 +528,7 @@ class GraniteMoeForCausalLM(nn.Module, SupportsLoRA, SupportsPP):
...
@@ -528,7 +528,7 @@ class GraniteMoeForCausalLM(nn.Module, SupportsLoRA, SupportsPP):
def
forward
(
def
forward
(
self
,
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
@@ -558,4 +558,4 @@ class GraniteMoeForCausalLM(nn.Module, SupportsLoRA, SupportsPP):
...
@@ -558,4 +558,4 @@ class GraniteMoeForCausalLM(nn.Module, SupportsLoRA, SupportsPP):
self
,
self
,
skip_prefixes
=
([
"lm_head."
]
if
self
.
config
.
tie_word_embeddings
else
None
),
skip_prefixes
=
([
"lm_head."
]
if
self
.
config
.
tie_word_embeddings
else
None
),
)
)
return
loader
.
load_weights
(
weights
)
return
loader
.
load_weights
(
weights
)
\ No newline at end of file
vllm/model_executor/models/granitemoehybrid.py
View file @
df704163
...
@@ -368,7 +368,7 @@ class GraniteMoeHybridModel(nn.Module):
...
@@ -368,7 +368,7 @@ class GraniteMoeHybridModel(nn.Module):
def
forward
(
def
forward
(
self
,
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
@@ -685,7 +685,7 @@ class GraniteMoeHybridForCausalLM(
...
@@ -685,7 +685,7 @@ class GraniteMoeHybridForCausalLM(
def
forward
(
def
forward
(
self
,
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
@@ -706,4 +706,4 @@ class GraniteMoeHybridForCausalLM(
...
@@ -706,4 +706,4 @@ class GraniteMoeHybridForCausalLM(
def
load_weights
(
self
,
weights
:
Iterable
[
tuple
[
str
,
torch
.
Tensor
]])
->
set
[
str
]:
def
load_weights
(
self
,
weights
:
Iterable
[
tuple
[
str
,
torch
.
Tensor
]])
->
set
[
str
]:
loader
=
AutoWeightsLoader
(
self
)
loader
=
AutoWeightsLoader
(
self
)
return
loader
.
load_weights
(
weights
)
return
loader
.
load_weights
(
weights
)
\ No newline at end of file
vllm/model_executor/models/granitemoeshared.py
View file @
df704163
...
@@ -183,7 +183,7 @@ class GraniteMoeSharedModel(nn.Module):
...
@@ -183,7 +183,7 @@ class GraniteMoeSharedModel(nn.Module):
def
forward
(
def
forward
(
self
,
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
,
intermediate_tensors
:
IntermediateTensors
|
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
@@ -295,7 +295,7 @@ class GraniteMoeSharedForCausalLM(nn.Module, SupportsLoRA, SupportsPP):
...
@@ -295,7 +295,7 @@ class GraniteMoeSharedForCausalLM(nn.Module, SupportsLoRA, SupportsPP):
def
forward
(
def
forward
(
self
,
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
@@ -325,4 +325,4 @@ class GraniteMoeSharedForCausalLM(nn.Module, SupportsLoRA, SupportsPP):
...
@@ -325,4 +325,4 @@ class GraniteMoeSharedForCausalLM(nn.Module, SupportsLoRA, SupportsPP):
self
,
self
,
skip_prefixes
=
([
"lm_head."
]
if
self
.
config
.
tie_word_embeddings
else
None
),
skip_prefixes
=
([
"lm_head."
]
if
self
.
config
.
tie_word_embeddings
else
None
),
)
)
return
loader
.
load_weights
(
weights
)
return
loader
.
load_weights
(
weights
)
\ No newline at end of file
vllm/model_executor/models/grok1.py
View file @
df704163
...
@@ -491,7 +491,7 @@ class Grok1Model(nn.Module):
...
@@ -491,7 +491,7 @@ class Grok1Model(nn.Module):
def
forward
(
def
forward
(
self
,
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
,
intermediate_tensors
:
IntermediateTensors
|
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
@@ -705,7 +705,7 @@ class GrokBaseForCausalLM(nn.Module, SupportsLoRA, SupportsPP):
...
@@ -705,7 +705,7 @@ class GrokBaseForCausalLM(nn.Module, SupportsLoRA, SupportsPP):
def
forward
(
def
forward
(
self
,
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
@@ -800,4 +800,4 @@ class GrokForCausalLM(GrokBaseForCausalLM):
...
@@ -800,4 +800,4 @@ class GrokForCausalLM(GrokBaseForCausalLM):
cls
.
packed_modules_mapping
=
dict
(
cls
.
packed_modules_mapping
)
cls
.
packed_modules_mapping
=
dict
(
cls
.
packed_modules_mapping
)
cls
.
packed_modules_mapping
.
update
(
instance_cls
.
packed_modules_mapping
)
cls
.
packed_modules_mapping
.
update
(
instance_cls
.
packed_modules_mapping
)
return
instance_cls
(
vllm_config
=
vllm_config
,
prefix
=
prefix
)
return
instance_cls
(
vllm_config
=
vllm_config
,
prefix
=
prefix
)
\ No newline at end of file
vllm/model_executor/models/hunyuan_v1.py
View file @
df704163
...
@@ -938,7 +938,7 @@ class HunyuanV1ModelBase(nn.Module, SupportsLoRA, SupportsPP):
...
@@ -938,7 +938,7 @@ class HunyuanV1ModelBase(nn.Module, SupportsLoRA, SupportsPP):
def
forward
(
def
forward
(
self
,
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
@@ -1039,4 +1039,4 @@ class HunYuanDenseV1ForCausalLM(HunYuanDenseV1Base):
...
@@ -1039,4 +1039,4 @@ class HunYuanDenseV1ForCausalLM(HunYuanDenseV1Base):
class
HunYuanMoEV1ForCausalLM
(
HunYuanMoEV1Base
):
class
HunYuanMoEV1ForCausalLM
(
HunYuanMoEV1Base
):
pass
pass
\ No newline at end of file
vllm/model_executor/models/hunyuan_vision.py
View file @
df704163
...
@@ -968,7 +968,7 @@ class HunYuanVLForConditionalGeneration(
...
@@ -968,7 +968,7 @@ class HunYuanVLForConditionalGeneration(
def
forward
(
def
forward
(
self
,
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
,
intermediate_tensors
:
IntermediateTensors
|
None
,
inputs_embeds
:
torch
.
Tensor
|
None
,
inputs_embeds
:
torch
.
Tensor
|
None
,
...
@@ -1006,4 +1006,4 @@ class HunYuanVLForConditionalGeneration(
...
@@ -1006,4 +1006,4 @@ class HunYuanVLForConditionalGeneration(
language_model
=
"language_model.model"
,
language_model
=
"language_model.model"
,
connector
=
"visual.perceive"
,
connector
=
"visual.perceive"
,
tower_model
=
"visual"
,
tower_model
=
"visual"
,
)
)
\ No newline at end of file
vllm/model_executor/models/hyperclovax_vision.py
View file @
df704163
...
@@ -747,7 +747,7 @@ class HCXVisionForCausalLM(nn.Module, SupportsMultiModal, SupportsPP):
...
@@ -747,7 +747,7 @@ class HCXVisionForCausalLM(nn.Module, SupportsMultiModal, SupportsPP):
def
forward
(
def
forward
(
self
,
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
@@ -1150,4 +1150,4 @@ def anyres_postprocessing(
...
@@ -1150,4 +1150,4 @@ def anyres_postprocessing(
)
)
new_image_features
.
append
(
image_feature
)
new_image_features
.
append
(
image_feature
)
return
new_image_features
return
new_image_features
\ No newline at end of file
vllm/model_executor/models/idefics3.py
View file @
df704163
...
@@ -559,7 +559,7 @@ class Idefics3Model(nn.Module):
...
@@ -559,7 +559,7 @@ class Idefics3Model(nn.Module):
def
forward
(
def
forward
(
self
,
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
@@ -689,7 +689,7 @@ class Idefics3ForConditionalGeneration(nn.Module, SupportsMultiModal, SupportsLo
...
@@ -689,7 +689,7 @@ class Idefics3ForConditionalGeneration(nn.Module, SupportsMultiModal, SupportsLo
def
forward
(
def
forward
(
self
,
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
@@ -738,4 +738,4 @@ class Idefics3ForConditionalGeneration(nn.Module, SupportsMultiModal, SupportsLo
...
@@ -738,4 +738,4 @@ class Idefics3ForConditionalGeneration(nn.Module, SupportsMultiModal, SupportsLo
hf_config
=
self
.
config
hf_config
=
self
.
config
scale_factor
=
hf_config
.
scale_factor
scale_factor
=
hf_config
.
scale_factor
return
num_vision_tokens
//
scale_factor
**
2
return
num_vision_tokens
//
scale_factor
**
2
\ No newline at end of file
vllm/model_executor/models/interfaces.py
View file @
df704163
...
@@ -44,10 +44,6 @@ else:
...
@@ -44,10 +44,6 @@ else:
_ProcessorFactories
=
object
_ProcessorFactories
=
object
IntermediateTensors
=
object
IntermediateTensors
=
object
if
TYPE_CHECKING
:
from
vllm.config
import
LoRAConfig
,
MultiModalConfig
,
SchedulerConfig
from
vllm.sequence
import
IntermediateTensors
logger
=
init_logger
(
__name__
)
logger
=
init_logger
(
__name__
)
MultiModalEmbeddings
:
TypeAlias
=
list
[
Tensor
]
|
Tensor
|
tuple
[
Tensor
,
...]
MultiModalEmbeddings
:
TypeAlias
=
list
[
Tensor
]
|
Tensor
|
tuple
[
Tensor
,
...]
...
@@ -607,8 +603,6 @@ class SupportsPP(Protocol):
...
@@ -607,8 +603,6 @@ class SupportsPP(Protocol):
def
forward
(
def
forward
(
self
,
self
,
input_ids
:
Tensor
|
None
,
positions
:
Tensor
,
*
,
*
,
intermediate_tensors
:
IntermediateTensors
|
None
,
intermediate_tensors
:
IntermediateTensors
|
None
,
)
->
IntermediateTensors
|
None
:
)
->
IntermediateTensors
|
None
:
...
@@ -637,8 +631,6 @@ class _SupportsPPType(Protocol):
...
@@ -637,8 +631,6 @@ class _SupportsPPType(Protocol):
def
forward
(
def
forward
(
self
,
self
,
input_ids
:
Tensor
|
None
,
positions
:
Tensor
,
*
,
*
,
intermediate_tensors
:
IntermediateTensors
|
None
,
intermediate_tensors
:
IntermediateTensors
|
None
,
)
->
Tensor
|
IntermediateTensors
:
...
)
->
Tensor
|
IntermediateTensors
:
...
...
@@ -1339,4 +1331,4 @@ def supports_xdrope(model: object) -> TypeIs[SupportsXDRoPE]: ...
...
@@ -1339,4 +1331,4 @@ def supports_xdrope(model: object) -> TypeIs[SupportsXDRoPE]: ...
def
supports_xdrope
(
def
supports_xdrope
(
model
:
type
[
object
]
|
object
,
model
:
type
[
object
]
|
object
,
)
->
TypeIs
[
type
[
SupportsXDRoPE
]]
|
TypeIs
[
SupportsXDRoPE
]:
)
->
TypeIs
[
type
[
SupportsXDRoPE
]]
|
TypeIs
[
SupportsXDRoPE
]:
return
isinstance
(
model
,
SupportsXDRoPE
)
return
isinstance
(
model
,
SupportsXDRoPE
)
\ No newline at end of file
vllm/model_executor/models/intern_vit.py
View file @
df704163
...
@@ -33,8 +33,6 @@ from vllm.model_executor.layers.linear import (
...
@@ -33,8 +33,6 @@ from vllm.model_executor.layers.linear import (
)
)
from
vllm.model_executor.layers.quantization
import
QuantizationConfig
from
vllm.model_executor.layers.quantization
import
QuantizationConfig
from
vllm.model_executor.model_loader.weight_utils
import
default_weight_loader
from
vllm.model_executor.model_loader.weight_utils
import
default_weight_loader
import
vllm.envs
as
envs
from
.vision
import
run_dp_sharded_vision_model
from
.vision
import
run_dp_sharded_vision_model
...
@@ -457,4 +455,4 @@ class InternVisionModel(nn.Module):
...
@@ -457,4 +455,4 @@ class InternVisionModel(nn.Module):
weight_loader
=
getattr
(
param
,
"weight_loader"
,
default_weight_loader
)
weight_loader
=
getattr
(
param
,
"weight_loader"
,
default_weight_loader
)
weight_loader
(
param
,
loaded_weight
)
weight_loader
(
param
,
loaded_weight
)
loaded_params
.
add
(
name
)
loaded_params
.
add
(
name
)
return
loaded_params
return
loaded_params
\ No newline at end of file
vllm/model_executor/models/internlm2.py
View file @
df704163
...
@@ -284,7 +284,7 @@ class InternLM2Model(nn.Module):
...
@@ -284,7 +284,7 @@ class InternLM2Model(nn.Module):
def
forward
(
def
forward
(
self
,
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
@@ -350,7 +350,7 @@ class InternLM2ForCausalLM(nn.Module, SupportsPP, SupportsLoRA):
...
@@ -350,7 +350,7 @@ class InternLM2ForCausalLM(nn.Module, SupportsPP, SupportsLoRA):
def
forward
(
def
forward
(
self
,
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
,
intermediate_tensors
:
IntermediateTensors
|
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
@@ -446,7 +446,7 @@ class InternLM2ForRewardModel(InternLM2ForCausalLM):
...
@@ -446,7 +446,7 @@ class InternLM2ForRewardModel(InternLM2ForCausalLM):
def
forward
(
def
forward
(
self
,
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
@@ -456,4 +456,4 @@ class InternLM2ForRewardModel(InternLM2ForCausalLM):
...
@@ -456,4 +456,4 @@ class InternLM2ForRewardModel(InternLM2ForCausalLM):
)
)
hidden_states
=
hidden_states
.
to
(
self
.
head_dtype
)
hidden_states
=
hidden_states
.
to
(
self
.
head_dtype
)
logits
=
self
.
v_head
(
hidden_states
)
logits
=
self
.
v_head
(
hidden_states
)
return
logits
return
logits
\ No newline at end of file
vllm/model_executor/models/internlm2_ve.py
View file @
df704163
...
@@ -101,7 +101,7 @@ class InternLM2VEModel(InternLM2Model):
...
@@ -101,7 +101,7 @@ class InternLM2VEModel(InternLM2Model):
def
forward
(
def
forward
(
self
,
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
@@ -136,4 +136,4 @@ class InternLM2VEForCausalLM(InternLM2ForCausalLM):
...
@@ -136,4 +136,4 @@ class InternLM2VEForCausalLM(InternLM2ForCausalLM):
def
__init__
(
self
,
*
,
vllm_config
:
VllmConfig
,
prefix
:
str
=
""
):
def
__init__
(
self
,
*
,
vllm_config
:
VllmConfig
,
prefix
:
str
=
""
):
super
().
__init__
(
super
().
__init__
(
vllm_config
=
vllm_config
,
prefix
=
prefix
,
model_type
=
InternLM2VEModel
vllm_config
=
vllm_config
,
prefix
=
prefix
,
model_type
=
InternLM2VEModel
)
)
\ No newline at end of file
vllm/model_executor/models/interns1.py
View file @
df704163
...
@@ -782,7 +782,7 @@ class InternS1ForConditionalGeneration(
...
@@ -782,7 +782,7 @@ class InternS1ForConditionalGeneration(
def
forward
(
def
forward
(
self
,
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
@@ -819,4 +819,4 @@ class InternS1ForConditionalGeneration(
...
@@ -819,4 +819,4 @@ class InternS1ForConditionalGeneration(
language_model
=
"language_model"
,
language_model
=
"language_model"
,
connector
=
"multi_modal_projector"
,
connector
=
"multi_modal_projector"
,
tower_model
=
"vision_tower"
,
tower_model
=
"vision_tower"
,
)
)
\ No newline at end of file
vllm/model_executor/models/internvl.py
View file @
df704163
...
@@ -1371,7 +1371,7 @@ class InternVLChatModel(nn.Module, SupportsMultiModal, SupportsPP, SupportsLoRA)
...
@@ -1371,7 +1371,7 @@ class InternVLChatModel(nn.Module, SupportsMultiModal, SupportsPP, SupportsLoRA)
def
forward
(
def
forward
(
self
,
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
@@ -1442,4 +1442,4 @@ class InternVLChatModel(nn.Module, SupportsMultiModal, SupportsPP, SupportsLoRA)
...
@@ -1442,4 +1442,4 @@ class InternVLChatModel(nn.Module, SupportsMultiModal, SupportsPP, SupportsLoRA)
return
0
return
0
num_patches
=
num_vision_tokens
//
(
self
.
patch_tokens
+
1
)
num_patches
=
num_vision_tokens
//
(
self
.
patch_tokens
+
1
)
return
num_patches
*
self
.
num_image_token
return
num_patches
*
self
.
num_image_token
\ No newline at end of file
vllm/model_executor/models/iquest_loopcoder.py
View file @
df704163
...
@@ -438,7 +438,7 @@ class IQuestLoopCoderModel(nn.Module):
...
@@ -438,7 +438,7 @@ class IQuestLoopCoderModel(nn.Module):
def
forward
(
def
forward
(
self
,
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
@@ -570,7 +570,7 @@ class IQuestLoopCoderForCausalLM(nn.Module):
...
@@ -570,7 +570,7 @@ class IQuestLoopCoderForCausalLM(nn.Module):
def
forward
(
def
forward
(
self
,
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
@@ -592,4 +592,4 @@ class IQuestLoopCoderForCausalLM(nn.Module):
...
@@ -592,4 +592,4 @@ class IQuestLoopCoderForCausalLM(nn.Module):
self
,
self
,
skip_prefixes
=
([
"lm_head."
]
if
self
.
config
.
tie_word_embeddings
else
None
),
skip_prefixes
=
([
"lm_head."
]
if
self
.
config
.
tie_word_embeddings
else
None
),
)
)
return
loader
.
load_weights
(
weights
)
return
loader
.
load_weights
(
weights
)
\ No newline at end of file
vllm/model_executor/models/isaac.py
View file @
df704163
...
@@ -1450,7 +1450,7 @@ class IsaacForConditionalGeneration(
...
@@ -1450,7 +1450,7 @@ class IsaacForConditionalGeneration(
def
forward
(
def
forward
(
self
,
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
@@ -1479,4 +1479,4 @@ class IsaacForConditionalGeneration(
...
@@ -1479,4 +1479,4 @@ class IsaacForConditionalGeneration(
language_model
=
"language_model"
,
language_model
=
"language_model"
,
connector
=
"vision_embedding.linear_fc2"
,
# The final linear layer
connector
=
"vision_embedding.linear_fc2"
,
# The final linear layer
tower_model
=
"vision_embedding"
,
tower_model
=
"vision_embedding"
,
)
)
\ No newline at end of file
vllm/model_executor/models/jais.py
View file @
df704163
...
@@ -280,7 +280,7 @@ class JAISModel(nn.Module):
...
@@ -280,7 +280,7 @@ class JAISModel(nn.Module):
def
forward
(
def
forward
(
self
,
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
position_ids
:
torch
.
Tensor
,
position_ids
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
@@ -344,7 +344,7 @@ class JAISLMHeadModel(nn.Module, SupportsPP):
...
@@ -344,7 +344,7 @@ class JAISLMHeadModel(nn.Module, SupportsPP):
def
forward
(
def
forward
(
self
,
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
@@ -394,4 +394,4 @@ class JAISLMHeadModel(nn.Module, SupportsPP):
...
@@ -394,4 +394,4 @@ class JAISLMHeadModel(nn.Module, SupportsPP):
weight_loader
=
getattr
(
param
,
"weight_loader"
,
default_weight_loader
)
weight_loader
=
getattr
(
param
,
"weight_loader"
,
default_weight_loader
)
weight_loader
(
param
,
loaded_weight
)
weight_loader
(
param
,
loaded_weight
)
loaded_params
.
add
(
name
)
loaded_params
.
add
(
name
)
return
loaded_params
return
loaded_params
\ No newline at end of file
vllm/model_executor/models/jais2.py
View file @
df704163
...
@@ -483,7 +483,7 @@ class Jais2ForCausalLM(nn.Module, SupportsLoRA, SupportsPP):
...
@@ -483,7 +483,7 @@ class Jais2ForCausalLM(nn.Module, SupportsLoRA, SupportsPP):
def
forward
(
def
forward
(
self
,
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
@@ -505,4 +505,4 @@ class Jais2ForCausalLM(nn.Module, SupportsLoRA, SupportsPP):
...
@@ -505,4 +505,4 @@ class Jais2ForCausalLM(nn.Module, SupportsLoRA, SupportsPP):
self
,
self
,
skip_prefixes
=
([
"lm_head."
]
if
self
.
config
.
tie_word_embeddings
else
None
),
skip_prefixes
=
([
"lm_head."
]
if
self
.
config
.
tie_word_embeddings
else
None
),
)
)
return
loader
.
load_weights
(
weights
)
return
loader
.
load_weights
(
weights
)
\ No newline at end of file
vllm/model_executor/models/jamba.py
View file @
df704163
...
@@ -348,7 +348,7 @@ class JambaModel(nn.Module):
...
@@ -348,7 +348,7 @@ class JambaModel(nn.Module):
def
forward
(
def
forward
(
self
,
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
@@ -516,7 +516,7 @@ class JambaForCausalLM(
...
@@ -516,7 +516,7 @@ class JambaForCausalLM(
def
forward
(
def
forward
(
self
,
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
@@ -602,4 +602,4 @@ class JambaForSequenceClassification(JambaForCausalLM):
...
@@ -602,4 +602,4 @@ class JambaForSequenceClassification(JambaForCausalLM):
pooler_config
=
vllm_config
.
model_config
.
pooler_config
pooler_config
=
vllm_config
.
model_config
.
pooler_config
assert
pooler_config
is
not
None
assert
pooler_config
is
not
None
self
.
pooler
=
DispatchPooler
.
for_seq_cls
(
pooler_config
,
classifier
=
self
.
score
)
self
.
pooler
=
DispatchPooler
.
for_seq_cls
(
pooler_config
,
classifier
=
self
.
score
)
\ No newline at end of file
vllm/model_executor/models/jina_vl.py
View file @
df704163
...
@@ -125,7 +125,7 @@ class JinaVLForSequenceClassification(
...
@@ -125,7 +125,7 @@ class JinaVLForSequenceClassification(
def
forward
(
def
forward
(
self
,
self
,
input_ids
:
torch
.
Tensor
|
None
,
input_ids
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
positions
:
torch
.
Tensor
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
intermediate_tensors
:
IntermediateTensors
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
inputs_embeds
:
torch
.
Tensor
|
None
=
None
,
...
@@ -142,4 +142,4 @@ class JinaVLForSequenceClassification(
...
@@ -142,4 +142,4 @@ class JinaVLForSequenceClassification(
def
load_weights
(
self
,
weights
:
Iterable
[
tuple
[
str
,
torch
.
Tensor
]]):
def
load_weights
(
self
,
weights
:
Iterable
[
tuple
[
str
,
torch
.
Tensor
]]):
loader
=
AutoWeightsLoader
(
self
)
loader
=
AutoWeightsLoader
(
self
)
return
loader
.
load_weights
(
weights
,
mapper
=
self
.
weight_mapper
)
return
loader
.
load_weights
(
weights
,
mapper
=
self
.
weight_mapper
)
\ No newline at end of file
Prev
1
2
3
4
5
6
7
8
9
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment