Commit 770d33f9 authored by zhuwenwen
Browse files

Merge branch 'v0.11.0-dev' into 'v0.11.0-dev'

Update MiniMax-M2/M2.1/M2.5

See merge request dcutoolkit/deeplearing/vllm!437
parents 6f06966e 930d8b58
...@@ -54,7 +54,7 @@ class _HfExamplesInfo: ...@@ -54,7 +54,7 @@ class _HfExamplesInfo:
skip_tokenizer_init: bool = False skip_tokenizer_init: bool = False
""" """
If true, skip initialization of tokenizer and detokenizer. If true, skip initialization of tokenizer and detokenizer.
""" """
dtype: ModelDType = "auto" dtype: ModelDType = "auto"
...@@ -103,7 +103,7 @@ class _HfExamplesInfo: ...@@ -103,7 +103,7 @@ class _HfExamplesInfo:
use_original_num_layers: bool = False use_original_num_layers: bool = False
""" """
If True, use the original number of layers from the model config If True, use the original number of layers from the model config
instead of minimal layers for testing. instead of minimal layers for testing.
""" """
...@@ -300,6 +300,8 @@ _TEXT_GENERATION_EXAMPLE_MODELS = { ...@@ -300,6 +300,8 @@ _TEXT_GENERATION_EXAMPLE_MODELS = {
revision="a59aa9cbc53b9fb8742ca4e9e1531b9802b6fdc3"), # noqa: E501 revision="a59aa9cbc53b9fb8742ca4e9e1531b9802b6fdc3"), # noqa: E501
"MiniMaxM1ForCausalLM": _HfExamplesInfo(os.path.join(models_path_prefix, "MiniMaxAI/MiniMax-M1-40k"), "MiniMaxM1ForCausalLM": _HfExamplesInfo(os.path.join(models_path_prefix, "MiniMaxAI/MiniMax-M1-40k"),
trust_remote_code=True), trust_remote_code=True),
"MiniMaxM2ForCausalLM": _HfExamplesInfo(os.path.join(models_path_prefix, "MiniMaxAI/MiniMax-M2"),
trust_remote_code=True),
"MistralForCausalLM": _HfExamplesInfo(os.path.join(models_path_prefix, "mistralai/Mistral-7B-Instruct-v0.1")), "MistralForCausalLM": _HfExamplesInfo(os.path.join(models_path_prefix, "mistralai/Mistral-7B-Instruct-v0.1")),
"MixtralForCausalLM": _HfExamplesInfo(os.path.join(models_path_prefix, "mistralai/Mixtral-8x7B-Instruct-v0.1"), # noqa: E501 "MixtralForCausalLM": _HfExamplesInfo(os.path.join(models_path_prefix, "mistralai/Mixtral-8x7B-Instruct-v0.1"), # noqa: E501
{"tiny": os.path.join(models_path_prefix, "TitanML/tiny-mixtral")}), # noqa: E501 {"tiny": os.path.join(models_path_prefix, "TitanML/tiny-mixtral")}), # noqa: E501
......
...@@ -12,7 +12,7 @@ from .mistral_reasoning_parser import MistralReasoningParser ...@@ -12,7 +12,7 @@ from .mistral_reasoning_parser import MistralReasoningParser
from .qwen3_reasoning_parser import Qwen3ReasoningParser from .qwen3_reasoning_parser import Qwen3ReasoningParser
from .seedoss_reasoning_parser import SeedOSSReasoningParser from .seedoss_reasoning_parser import SeedOSSReasoningParser
from .step3_reasoning_parser import Step3ReasoningParser from .step3_reasoning_parser import Step3ReasoningParser
from .minimax_m2_reasoning_parser import MiniMaxM2ReasoningParser from .minimax_m2_reasoning_parser import MiniMaxM2ReasoningParser,MiniMaxM2AppendThinkReasoningParser
__all__ = [ __all__ = [
"ReasoningParser", "ReasoningParser",
...@@ -29,4 +29,5 @@ __all__ = [ ...@@ -29,4 +29,5 @@ __all__ = [
"GptOssReasoningParser", "GptOssReasoningParser",
"SeedOSSReasoningParser", "SeedOSSReasoningParser",
"MiniMaxM2ReasoningParser", "MiniMaxM2ReasoningParser",
"MiniMaxM2AppendThinkReasoningParser"
] ]
...@@ -74,7 +74,7 @@ class MiniMaxM2ReasoningParser(BaseThinkingReasoningParser): ...@@ -74,7 +74,7 @@ class MiniMaxM2ReasoningParser(BaseThinkingReasoningParser):
# No end token yet, all content is reasoning # No end token yet, all content is reasoning
return DeltaMessage(reasoning=delta_text) return DeltaMessage(reasoning=delta_text)
@ReasoningParserManager.register_module("minimax_m2_append_think")
class MiniMaxM2AppendThinkReasoningParser(ReasoningParser): class MiniMaxM2AppendThinkReasoningParser(ReasoningParser):
""" """
Reasoning parser for MiniMax M2 model. Reasoning parser for MiniMax M2 model.
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment