Commit df704163 authored by zhuwenwen's avatar zhuwenwen
Browse files

sync v0.15.1 (models)

parent d7db129a
...@@ -312,7 +312,7 @@ class GraniteMoeModel(nn.Module): ...@@ -312,7 +312,7 @@ class GraniteMoeModel(nn.Module):
def forward( def forward(
self, self,
input_ids: torch.Tensor | None, input_ids: torch.Tensor,
positions: torch.Tensor, positions: torch.Tensor,
intermediate_tensors: IntermediateTensors | None, intermediate_tensors: IntermediateTensors | None,
inputs_embeds: torch.Tensor | None = None, inputs_embeds: torch.Tensor | None = None,
...@@ -528,7 +528,7 @@ class GraniteMoeForCausalLM(nn.Module, SupportsLoRA, SupportsPP): ...@@ -528,7 +528,7 @@ class GraniteMoeForCausalLM(nn.Module, SupportsLoRA, SupportsPP):
def forward( def forward(
self, self,
input_ids: torch.Tensor | None, input_ids: torch.Tensor,
positions: torch.Tensor, positions: torch.Tensor,
intermediate_tensors: IntermediateTensors | None = None, intermediate_tensors: IntermediateTensors | None = None,
inputs_embeds: torch.Tensor | None = None, inputs_embeds: torch.Tensor | None = None,
...@@ -558,4 +558,4 @@ class GraniteMoeForCausalLM(nn.Module, SupportsLoRA, SupportsPP): ...@@ -558,4 +558,4 @@ class GraniteMoeForCausalLM(nn.Module, SupportsLoRA, SupportsPP):
self, self,
skip_prefixes=(["lm_head."] if self.config.tie_word_embeddings else None), skip_prefixes=(["lm_head."] if self.config.tie_word_embeddings else None),
) )
return loader.load_weights(weights) return loader.load_weights(weights)
\ No newline at end of file
...@@ -368,7 +368,7 @@ class GraniteMoeHybridModel(nn.Module): ...@@ -368,7 +368,7 @@ class GraniteMoeHybridModel(nn.Module):
def forward( def forward(
self, self,
input_ids: torch.Tensor | None, input_ids: torch.Tensor,
positions: torch.Tensor, positions: torch.Tensor,
intermediate_tensors: IntermediateTensors | None = None, intermediate_tensors: IntermediateTensors | None = None,
inputs_embeds: torch.Tensor | None = None, inputs_embeds: torch.Tensor | None = None,
...@@ -685,7 +685,7 @@ class GraniteMoeHybridForCausalLM( ...@@ -685,7 +685,7 @@ class GraniteMoeHybridForCausalLM(
def forward( def forward(
self, self,
input_ids: torch.Tensor | None, input_ids: torch.Tensor,
positions: torch.Tensor, positions: torch.Tensor,
intermediate_tensors: IntermediateTensors | None = None, intermediate_tensors: IntermediateTensors | None = None,
inputs_embeds: torch.Tensor | None = None, inputs_embeds: torch.Tensor | None = None,
...@@ -706,4 +706,4 @@ class GraniteMoeHybridForCausalLM( ...@@ -706,4 +706,4 @@ class GraniteMoeHybridForCausalLM(
def load_weights(self, weights: Iterable[tuple[str, torch.Tensor]]) -> set[str]: def load_weights(self, weights: Iterable[tuple[str, torch.Tensor]]) -> set[str]:
loader = AutoWeightsLoader(self) loader = AutoWeightsLoader(self)
return loader.load_weights(weights) return loader.load_weights(weights)
\ No newline at end of file
...@@ -183,7 +183,7 @@ class GraniteMoeSharedModel(nn.Module): ...@@ -183,7 +183,7 @@ class GraniteMoeSharedModel(nn.Module):
def forward( def forward(
self, self,
input_ids: torch.Tensor | None, input_ids: torch.Tensor,
positions: torch.Tensor, positions: torch.Tensor,
intermediate_tensors: IntermediateTensors | None, intermediate_tensors: IntermediateTensors | None,
inputs_embeds: torch.Tensor | None = None, inputs_embeds: torch.Tensor | None = None,
...@@ -295,7 +295,7 @@ class GraniteMoeSharedForCausalLM(nn.Module, SupportsLoRA, SupportsPP): ...@@ -295,7 +295,7 @@ class GraniteMoeSharedForCausalLM(nn.Module, SupportsLoRA, SupportsPP):
def forward( def forward(
self, self,
input_ids: torch.Tensor | None, input_ids: torch.Tensor,
positions: torch.Tensor, positions: torch.Tensor,
intermediate_tensors: IntermediateTensors | None = None, intermediate_tensors: IntermediateTensors | None = None,
inputs_embeds: torch.Tensor | None = None, inputs_embeds: torch.Tensor | None = None,
...@@ -325,4 +325,4 @@ class GraniteMoeSharedForCausalLM(nn.Module, SupportsLoRA, SupportsPP): ...@@ -325,4 +325,4 @@ class GraniteMoeSharedForCausalLM(nn.Module, SupportsLoRA, SupportsPP):
self, self,
skip_prefixes=(["lm_head."] if self.config.tie_word_embeddings else None), skip_prefixes=(["lm_head."] if self.config.tie_word_embeddings else None),
) )
return loader.load_weights(weights) return loader.load_weights(weights)
\ No newline at end of file
...@@ -491,7 +491,7 @@ class Grok1Model(nn.Module): ...@@ -491,7 +491,7 @@ class Grok1Model(nn.Module):
def forward( def forward(
self, self,
input_ids: torch.Tensor | None, input_ids: torch.Tensor,
positions: torch.Tensor, positions: torch.Tensor,
intermediate_tensors: IntermediateTensors | None, intermediate_tensors: IntermediateTensors | None,
inputs_embeds: torch.Tensor | None = None, inputs_embeds: torch.Tensor | None = None,
...@@ -705,7 +705,7 @@ class GrokBaseForCausalLM(nn.Module, SupportsLoRA, SupportsPP): ...@@ -705,7 +705,7 @@ class GrokBaseForCausalLM(nn.Module, SupportsLoRA, SupportsPP):
def forward( def forward(
self, self,
input_ids: torch.Tensor | None, input_ids: torch.Tensor,
positions: torch.Tensor, positions: torch.Tensor,
intermediate_tensors: IntermediateTensors | None = None, intermediate_tensors: IntermediateTensors | None = None,
inputs_embeds: torch.Tensor | None = None, inputs_embeds: torch.Tensor | None = None,
...@@ -800,4 +800,4 @@ class GrokForCausalLM(GrokBaseForCausalLM): ...@@ -800,4 +800,4 @@ class GrokForCausalLM(GrokBaseForCausalLM):
cls.packed_modules_mapping = dict(cls.packed_modules_mapping) cls.packed_modules_mapping = dict(cls.packed_modules_mapping)
cls.packed_modules_mapping.update(instance_cls.packed_modules_mapping) cls.packed_modules_mapping.update(instance_cls.packed_modules_mapping)
return instance_cls(vllm_config=vllm_config, prefix=prefix) return instance_cls(vllm_config=vllm_config, prefix=prefix)
\ No newline at end of file
...@@ -938,7 +938,7 @@ class HunyuanV1ModelBase(nn.Module, SupportsLoRA, SupportsPP): ...@@ -938,7 +938,7 @@ class HunyuanV1ModelBase(nn.Module, SupportsLoRA, SupportsPP):
def forward( def forward(
self, self,
input_ids: torch.Tensor | None, input_ids: torch.Tensor,
positions: torch.Tensor, positions: torch.Tensor,
intermediate_tensors: IntermediateTensors | None = None, intermediate_tensors: IntermediateTensors | None = None,
inputs_embeds: torch.Tensor | None = None, inputs_embeds: torch.Tensor | None = None,
...@@ -1039,4 +1039,4 @@ class HunYuanDenseV1ForCausalLM(HunYuanDenseV1Base): ...@@ -1039,4 +1039,4 @@ class HunYuanDenseV1ForCausalLM(HunYuanDenseV1Base):
class HunYuanMoEV1ForCausalLM(HunYuanMoEV1Base): class HunYuanMoEV1ForCausalLM(HunYuanMoEV1Base):
pass pass
\ No newline at end of file
...@@ -968,7 +968,7 @@ class HunYuanVLForConditionalGeneration( ...@@ -968,7 +968,7 @@ class HunYuanVLForConditionalGeneration(
def forward( def forward(
self, self,
input_ids: torch.Tensor | None, input_ids: torch.Tensor,
positions: torch.Tensor, positions: torch.Tensor,
intermediate_tensors: IntermediateTensors | None, intermediate_tensors: IntermediateTensors | None,
inputs_embeds: torch.Tensor | None, inputs_embeds: torch.Tensor | None,
...@@ -1006,4 +1006,4 @@ class HunYuanVLForConditionalGeneration( ...@@ -1006,4 +1006,4 @@ class HunYuanVLForConditionalGeneration(
language_model="language_model.model", language_model="language_model.model",
connector="visual.perceive", connector="visual.perceive",
tower_model="visual", tower_model="visual",
) )
\ No newline at end of file
...@@ -747,7 +747,7 @@ class HCXVisionForCausalLM(nn.Module, SupportsMultiModal, SupportsPP): ...@@ -747,7 +747,7 @@ class HCXVisionForCausalLM(nn.Module, SupportsMultiModal, SupportsPP):
def forward( def forward(
self, self,
input_ids: torch.Tensor | None, input_ids: torch.Tensor,
positions: torch.Tensor, positions: torch.Tensor,
intermediate_tensors: IntermediateTensors | None = None, intermediate_tensors: IntermediateTensors | None = None,
inputs_embeds: torch.Tensor | None = None, inputs_embeds: torch.Tensor | None = None,
...@@ -1150,4 +1150,4 @@ def anyres_postprocessing( ...@@ -1150,4 +1150,4 @@ def anyres_postprocessing(
) )
new_image_features.append(image_feature) new_image_features.append(image_feature)
return new_image_features return new_image_features
\ No newline at end of file
...@@ -559,7 +559,7 @@ class Idefics3Model(nn.Module): ...@@ -559,7 +559,7 @@ class Idefics3Model(nn.Module):
def forward( def forward(
self, self,
input_ids: torch.Tensor | None, input_ids: torch.Tensor,
positions: torch.Tensor, positions: torch.Tensor,
intermediate_tensors: IntermediateTensors | None = None, intermediate_tensors: IntermediateTensors | None = None,
inputs_embeds: torch.Tensor | None = None, inputs_embeds: torch.Tensor | None = None,
...@@ -689,7 +689,7 @@ class Idefics3ForConditionalGeneration(nn.Module, SupportsMultiModal, SupportsLo ...@@ -689,7 +689,7 @@ class Idefics3ForConditionalGeneration(nn.Module, SupportsMultiModal, SupportsLo
def forward( def forward(
self, self,
input_ids: torch.Tensor | None, input_ids: torch.Tensor,
positions: torch.Tensor, positions: torch.Tensor,
intermediate_tensors: IntermediateTensors | None = None, intermediate_tensors: IntermediateTensors | None = None,
inputs_embeds: torch.Tensor | None = None, inputs_embeds: torch.Tensor | None = None,
...@@ -738,4 +738,4 @@ class Idefics3ForConditionalGeneration(nn.Module, SupportsMultiModal, SupportsLo ...@@ -738,4 +738,4 @@ class Idefics3ForConditionalGeneration(nn.Module, SupportsMultiModal, SupportsLo
hf_config = self.config hf_config = self.config
scale_factor = hf_config.scale_factor scale_factor = hf_config.scale_factor
return num_vision_tokens // scale_factor**2 return num_vision_tokens // scale_factor**2
\ No newline at end of file
...@@ -44,10 +44,6 @@ else: ...@@ -44,10 +44,6 @@ else:
_ProcessorFactories = object _ProcessorFactories = object
IntermediateTensors = object IntermediateTensors = object
if TYPE_CHECKING:
from vllm.config import LoRAConfig, MultiModalConfig, SchedulerConfig
from vllm.sequence import IntermediateTensors
logger = init_logger(__name__) logger = init_logger(__name__)
MultiModalEmbeddings: TypeAlias = list[Tensor] | Tensor | tuple[Tensor, ...] MultiModalEmbeddings: TypeAlias = list[Tensor] | Tensor | tuple[Tensor, ...]
...@@ -607,8 +603,6 @@ class SupportsPP(Protocol): ...@@ -607,8 +603,6 @@ class SupportsPP(Protocol):
def forward( def forward(
self, self,
input_ids: Tensor | None,
positions: Tensor,
*, *,
intermediate_tensors: IntermediateTensors | None, intermediate_tensors: IntermediateTensors | None,
) -> IntermediateTensors | None: ) -> IntermediateTensors | None:
...@@ -637,8 +631,6 @@ class _SupportsPPType(Protocol): ...@@ -637,8 +631,6 @@ class _SupportsPPType(Protocol):
def forward( def forward(
self, self,
input_ids: Tensor | None,
positions: Tensor,
*, *,
intermediate_tensors: IntermediateTensors | None, intermediate_tensors: IntermediateTensors | None,
) -> Tensor | IntermediateTensors: ... ) -> Tensor | IntermediateTensors: ...
...@@ -1339,4 +1331,4 @@ def supports_xdrope(model: object) -> TypeIs[SupportsXDRoPE]: ... ...@@ -1339,4 +1331,4 @@ def supports_xdrope(model: object) -> TypeIs[SupportsXDRoPE]: ...
def supports_xdrope( def supports_xdrope(
model: type[object] | object, model: type[object] | object,
) -> TypeIs[type[SupportsXDRoPE]] | TypeIs[SupportsXDRoPE]: ) -> TypeIs[type[SupportsXDRoPE]] | TypeIs[SupportsXDRoPE]:
return isinstance(model, SupportsXDRoPE) return isinstance(model, SupportsXDRoPE)
\ No newline at end of file
...@@ -33,8 +33,6 @@ from vllm.model_executor.layers.linear import ( ...@@ -33,8 +33,6 @@ from vllm.model_executor.layers.linear import (
) )
from vllm.model_executor.layers.quantization import QuantizationConfig from vllm.model_executor.layers.quantization import QuantizationConfig
from vllm.model_executor.model_loader.weight_utils import default_weight_loader from vllm.model_executor.model_loader.weight_utils import default_weight_loader
import vllm.envs as envs
from .vision import run_dp_sharded_vision_model from .vision import run_dp_sharded_vision_model
...@@ -457,4 +455,4 @@ class InternVisionModel(nn.Module): ...@@ -457,4 +455,4 @@ class InternVisionModel(nn.Module):
weight_loader = getattr(param, "weight_loader", default_weight_loader) weight_loader = getattr(param, "weight_loader", default_weight_loader)
weight_loader(param, loaded_weight) weight_loader(param, loaded_weight)
loaded_params.add(name) loaded_params.add(name)
return loaded_params return loaded_params
\ No newline at end of file
...@@ -284,7 +284,7 @@ class InternLM2Model(nn.Module): ...@@ -284,7 +284,7 @@ class InternLM2Model(nn.Module):
def forward( def forward(
self, self,
input_ids: torch.Tensor | None, input_ids: torch.Tensor,
positions: torch.Tensor, positions: torch.Tensor,
intermediate_tensors: IntermediateTensors | None = None, intermediate_tensors: IntermediateTensors | None = None,
inputs_embeds: torch.Tensor | None = None, inputs_embeds: torch.Tensor | None = None,
...@@ -350,7 +350,7 @@ class InternLM2ForCausalLM(nn.Module, SupportsPP, SupportsLoRA): ...@@ -350,7 +350,7 @@ class InternLM2ForCausalLM(nn.Module, SupportsPP, SupportsLoRA):
def forward( def forward(
self, self,
input_ids: torch.Tensor | None, input_ids: torch.Tensor,
positions: torch.Tensor, positions: torch.Tensor,
intermediate_tensors: IntermediateTensors | None, intermediate_tensors: IntermediateTensors | None,
inputs_embeds: torch.Tensor | None = None, inputs_embeds: torch.Tensor | None = None,
...@@ -446,7 +446,7 @@ class InternLM2ForRewardModel(InternLM2ForCausalLM): ...@@ -446,7 +446,7 @@ class InternLM2ForRewardModel(InternLM2ForCausalLM):
def forward( def forward(
self, self,
input_ids: torch.Tensor | None, input_ids: torch.Tensor,
positions: torch.Tensor, positions: torch.Tensor,
intermediate_tensors: IntermediateTensors | None = None, intermediate_tensors: IntermediateTensors | None = None,
inputs_embeds: torch.Tensor | None = None, inputs_embeds: torch.Tensor | None = None,
...@@ -456,4 +456,4 @@ class InternLM2ForRewardModel(InternLM2ForCausalLM): ...@@ -456,4 +456,4 @@ class InternLM2ForRewardModel(InternLM2ForCausalLM):
) )
hidden_states = hidden_states.to(self.head_dtype) hidden_states = hidden_states.to(self.head_dtype)
logits = self.v_head(hidden_states) logits = self.v_head(hidden_states)
return logits return logits
\ No newline at end of file
...@@ -101,7 +101,7 @@ class InternLM2VEModel(InternLM2Model): ...@@ -101,7 +101,7 @@ class InternLM2VEModel(InternLM2Model):
def forward( def forward(
self, self,
input_ids: torch.Tensor | None, input_ids: torch.Tensor,
positions: torch.Tensor, positions: torch.Tensor,
intermediate_tensors: IntermediateTensors | None = None, intermediate_tensors: IntermediateTensors | None = None,
inputs_embeds: torch.Tensor | None = None, inputs_embeds: torch.Tensor | None = None,
...@@ -136,4 +136,4 @@ class InternLM2VEForCausalLM(InternLM2ForCausalLM): ...@@ -136,4 +136,4 @@ class InternLM2VEForCausalLM(InternLM2ForCausalLM):
def __init__(self, *, vllm_config: VllmConfig, prefix: str = ""): def __init__(self, *, vllm_config: VllmConfig, prefix: str = ""):
super().__init__( super().__init__(
vllm_config=vllm_config, prefix=prefix, model_type=InternLM2VEModel vllm_config=vllm_config, prefix=prefix, model_type=InternLM2VEModel
) )
\ No newline at end of file
...@@ -782,7 +782,7 @@ class InternS1ForConditionalGeneration( ...@@ -782,7 +782,7 @@ class InternS1ForConditionalGeneration(
def forward( def forward(
self, self,
input_ids: torch.Tensor | None, input_ids: torch.Tensor,
positions: torch.Tensor, positions: torch.Tensor,
intermediate_tensors: IntermediateTensors | None = None, intermediate_tensors: IntermediateTensors | None = None,
inputs_embeds: torch.Tensor | None = None, inputs_embeds: torch.Tensor | None = None,
...@@ -819,4 +819,4 @@ class InternS1ForConditionalGeneration( ...@@ -819,4 +819,4 @@ class InternS1ForConditionalGeneration(
language_model="language_model", language_model="language_model",
connector="multi_modal_projector", connector="multi_modal_projector",
tower_model="vision_tower", tower_model="vision_tower",
) )
\ No newline at end of file
...@@ -1371,7 +1371,7 @@ class InternVLChatModel(nn.Module, SupportsMultiModal, SupportsPP, SupportsLoRA) ...@@ -1371,7 +1371,7 @@ class InternVLChatModel(nn.Module, SupportsMultiModal, SupportsPP, SupportsLoRA)
def forward( def forward(
self, self,
input_ids: torch.Tensor | None, input_ids: torch.Tensor,
positions: torch.Tensor, positions: torch.Tensor,
intermediate_tensors: IntermediateTensors | None = None, intermediate_tensors: IntermediateTensors | None = None,
inputs_embeds: torch.Tensor | None = None, inputs_embeds: torch.Tensor | None = None,
...@@ -1442,4 +1442,4 @@ class InternVLChatModel(nn.Module, SupportsMultiModal, SupportsPP, SupportsLoRA) ...@@ -1442,4 +1442,4 @@ class InternVLChatModel(nn.Module, SupportsMultiModal, SupportsPP, SupportsLoRA)
return 0 return 0
num_patches = num_vision_tokens // (self.patch_tokens + 1) num_patches = num_vision_tokens // (self.patch_tokens + 1)
return num_patches * self.num_image_token return num_patches * self.num_image_token
\ No newline at end of file
...@@ -438,7 +438,7 @@ class IQuestLoopCoderModel(nn.Module): ...@@ -438,7 +438,7 @@ class IQuestLoopCoderModel(nn.Module):
def forward( def forward(
self, self,
input_ids: torch.Tensor | None, input_ids: torch.Tensor,
positions: torch.Tensor, positions: torch.Tensor,
intermediate_tensors: IntermediateTensors | None = None, intermediate_tensors: IntermediateTensors | None = None,
inputs_embeds: torch.Tensor | None = None, inputs_embeds: torch.Tensor | None = None,
...@@ -570,7 +570,7 @@ class IQuestLoopCoderForCausalLM(nn.Module): ...@@ -570,7 +570,7 @@ class IQuestLoopCoderForCausalLM(nn.Module):
def forward( def forward(
self, self,
input_ids: torch.Tensor | None, input_ids: torch.Tensor,
positions: torch.Tensor, positions: torch.Tensor,
intermediate_tensors: IntermediateTensors | None = None, intermediate_tensors: IntermediateTensors | None = None,
inputs_embeds: torch.Tensor | None = None, inputs_embeds: torch.Tensor | None = None,
...@@ -592,4 +592,4 @@ class IQuestLoopCoderForCausalLM(nn.Module): ...@@ -592,4 +592,4 @@ class IQuestLoopCoderForCausalLM(nn.Module):
self, self,
skip_prefixes=(["lm_head."] if self.config.tie_word_embeddings else None), skip_prefixes=(["lm_head."] if self.config.tie_word_embeddings else None),
) )
return loader.load_weights(weights) return loader.load_weights(weights)
\ No newline at end of file
...@@ -1450,7 +1450,7 @@ class IsaacForConditionalGeneration( ...@@ -1450,7 +1450,7 @@ class IsaacForConditionalGeneration(
def forward( def forward(
self, self,
input_ids: torch.Tensor | None, input_ids: torch.Tensor,
positions: torch.Tensor, positions: torch.Tensor,
intermediate_tensors: IntermediateTensors | None = None, intermediate_tensors: IntermediateTensors | None = None,
inputs_embeds: torch.Tensor | None = None, inputs_embeds: torch.Tensor | None = None,
...@@ -1479,4 +1479,4 @@ class IsaacForConditionalGeneration( ...@@ -1479,4 +1479,4 @@ class IsaacForConditionalGeneration(
language_model="language_model", language_model="language_model",
connector="vision_embedding.linear_fc2", # The final linear layer connector="vision_embedding.linear_fc2", # The final linear layer
tower_model="vision_embedding", tower_model="vision_embedding",
) )
\ No newline at end of file
...@@ -280,7 +280,7 @@ class JAISModel(nn.Module): ...@@ -280,7 +280,7 @@ class JAISModel(nn.Module):
def forward( def forward(
self, self,
input_ids: torch.Tensor | None, input_ids: torch.Tensor,
position_ids: torch.Tensor, position_ids: torch.Tensor,
intermediate_tensors: IntermediateTensors | None = None, intermediate_tensors: IntermediateTensors | None = None,
inputs_embeds: torch.Tensor | None = None, inputs_embeds: torch.Tensor | None = None,
...@@ -344,7 +344,7 @@ class JAISLMHeadModel(nn.Module, SupportsPP): ...@@ -344,7 +344,7 @@ class JAISLMHeadModel(nn.Module, SupportsPP):
def forward( def forward(
self, self,
input_ids: torch.Tensor | None, input_ids: torch.Tensor,
positions: torch.Tensor, positions: torch.Tensor,
intermediate_tensors: IntermediateTensors | None = None, intermediate_tensors: IntermediateTensors | None = None,
inputs_embeds: torch.Tensor | None = None, inputs_embeds: torch.Tensor | None = None,
...@@ -394,4 +394,4 @@ class JAISLMHeadModel(nn.Module, SupportsPP): ...@@ -394,4 +394,4 @@ class JAISLMHeadModel(nn.Module, SupportsPP):
weight_loader = getattr(param, "weight_loader", default_weight_loader) weight_loader = getattr(param, "weight_loader", default_weight_loader)
weight_loader(param, loaded_weight) weight_loader(param, loaded_weight)
loaded_params.add(name) loaded_params.add(name)
return loaded_params return loaded_params
\ No newline at end of file
...@@ -483,7 +483,7 @@ class Jais2ForCausalLM(nn.Module, SupportsLoRA, SupportsPP): ...@@ -483,7 +483,7 @@ class Jais2ForCausalLM(nn.Module, SupportsLoRA, SupportsPP):
def forward( def forward(
self, self,
input_ids: torch.Tensor | None, input_ids: torch.Tensor,
positions: torch.Tensor, positions: torch.Tensor,
intermediate_tensors: IntermediateTensors | None = None, intermediate_tensors: IntermediateTensors | None = None,
inputs_embeds: torch.Tensor | None = None, inputs_embeds: torch.Tensor | None = None,
...@@ -505,4 +505,4 @@ class Jais2ForCausalLM(nn.Module, SupportsLoRA, SupportsPP): ...@@ -505,4 +505,4 @@ class Jais2ForCausalLM(nn.Module, SupportsLoRA, SupportsPP):
self, self,
skip_prefixes=(["lm_head."] if self.config.tie_word_embeddings else None), skip_prefixes=(["lm_head."] if self.config.tie_word_embeddings else None),
) )
return loader.load_weights(weights) return loader.load_weights(weights)
\ No newline at end of file
...@@ -348,7 +348,7 @@ class JambaModel(nn.Module): ...@@ -348,7 +348,7 @@ class JambaModel(nn.Module):
def forward( def forward(
self, self,
input_ids: torch.Tensor | None, input_ids: torch.Tensor,
positions: torch.Tensor, positions: torch.Tensor,
intermediate_tensors: IntermediateTensors | None = None, intermediate_tensors: IntermediateTensors | None = None,
inputs_embeds: torch.Tensor | None = None, inputs_embeds: torch.Tensor | None = None,
...@@ -516,7 +516,7 @@ class JambaForCausalLM( ...@@ -516,7 +516,7 @@ class JambaForCausalLM(
def forward( def forward(
self, self,
input_ids: torch.Tensor | None, input_ids: torch.Tensor,
positions: torch.Tensor, positions: torch.Tensor,
intermediate_tensors: IntermediateTensors | None = None, intermediate_tensors: IntermediateTensors | None = None,
inputs_embeds: torch.Tensor | None = None, inputs_embeds: torch.Tensor | None = None,
...@@ -602,4 +602,4 @@ class JambaForSequenceClassification(JambaForCausalLM): ...@@ -602,4 +602,4 @@ class JambaForSequenceClassification(JambaForCausalLM):
pooler_config = vllm_config.model_config.pooler_config pooler_config = vllm_config.model_config.pooler_config
assert pooler_config is not None assert pooler_config is not None
self.pooler = DispatchPooler.for_seq_cls(pooler_config, classifier=self.score) self.pooler = DispatchPooler.for_seq_cls(pooler_config, classifier=self.score)
\ No newline at end of file
...@@ -125,7 +125,7 @@ class JinaVLForSequenceClassification( ...@@ -125,7 +125,7 @@ class JinaVLForSequenceClassification(
def forward( def forward(
self, self,
input_ids: torch.Tensor | None, input_ids: torch.Tensor,
positions: torch.Tensor, positions: torch.Tensor,
intermediate_tensors: IntermediateTensors | None = None, intermediate_tensors: IntermediateTensors | None = None,
inputs_embeds: torch.Tensor | None = None, inputs_embeds: torch.Tensor | None = None,
...@@ -142,4 +142,4 @@ class JinaVLForSequenceClassification( ...@@ -142,4 +142,4 @@ class JinaVLForSequenceClassification(
def load_weights(self, weights: Iterable[tuple[str, torch.Tensor]]): def load_weights(self, weights: Iterable[tuple[str, torch.Tensor]]):
loader = AutoWeightsLoader(self) loader = AutoWeightsLoader(self)
return loader.load_weights(weights, mapper=self.weight_mapper) return loader.load_weights(weights, mapper=self.weight_mapper)
\ No newline at end of file
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment