Commit 770d33f9 authored by zhuwenwen
Browse files

Merge branch 'v0.11.0-dev' into 'v0.11.0-dev'

Update MiniMax-M2/M2.1/M2.5

See merge request dcutoolkit/deeplearing/vllm!437
parents 6f06966e 930d8b58
...@@ -300,6 +300,8 @@ _TEXT_GENERATION_EXAMPLE_MODELS = { ...@@ -300,6 +300,8 @@ _TEXT_GENERATION_EXAMPLE_MODELS = {
revision="a59aa9cbc53b9fb8742ca4e9e1531b9802b6fdc3"), # noqa: E501 revision="a59aa9cbc53b9fb8742ca4e9e1531b9802b6fdc3"), # noqa: E501
"MiniMaxM1ForCausalLM": _HfExamplesInfo(os.path.join(models_path_prefix, "MiniMaxAI/MiniMax-M1-40k"), "MiniMaxM1ForCausalLM": _HfExamplesInfo(os.path.join(models_path_prefix, "MiniMaxAI/MiniMax-M1-40k"),
trust_remote_code=True), trust_remote_code=True),
"MiniMaxM2ForCausalLM": _HfExamplesInfo(os.path.join(models_path_prefix, "MiniMaxAI/MiniMax-M2"),
trust_remote_code=True),
"MistralForCausalLM": _HfExamplesInfo(os.path.join(models_path_prefix, "mistralai/Mistral-7B-Instruct-v0.1")), "MistralForCausalLM": _HfExamplesInfo(os.path.join(models_path_prefix, "mistralai/Mistral-7B-Instruct-v0.1")),
"MixtralForCausalLM": _HfExamplesInfo(os.path.join(models_path_prefix, "mistralai/Mixtral-8x7B-Instruct-v0.1"), # noqa: E501 "MixtralForCausalLM": _HfExamplesInfo(os.path.join(models_path_prefix, "mistralai/Mixtral-8x7B-Instruct-v0.1"), # noqa: E501
{"tiny": os.path.join(models_path_prefix, "TitanML/tiny-mixtral")}), # noqa: E501 {"tiny": os.path.join(models_path_prefix, "TitanML/tiny-mixtral")}), # noqa: E501
......
...@@ -12,7 +12,7 @@ from .mistral_reasoning_parser import MistralReasoningParser ...@@ -12,7 +12,7 @@ from .mistral_reasoning_parser import MistralReasoningParser
from .qwen3_reasoning_parser import Qwen3ReasoningParser from .qwen3_reasoning_parser import Qwen3ReasoningParser
from .seedoss_reasoning_parser import SeedOSSReasoningParser from .seedoss_reasoning_parser import SeedOSSReasoningParser
from .step3_reasoning_parser import Step3ReasoningParser from .step3_reasoning_parser import Step3ReasoningParser
from .minimax_m2_reasoning_parser import MiniMaxM2ReasoningParser from .minimax_m2_reasoning_parser import MiniMaxM2ReasoningParser,MiniMaxM2AppendThinkReasoningParser
__all__ = [ __all__ = [
"ReasoningParser", "ReasoningParser",
...@@ -29,4 +29,5 @@ __all__ = [ ...@@ -29,4 +29,5 @@ __all__ = [
"GptOssReasoningParser", "GptOssReasoningParser",
"SeedOSSReasoningParser", "SeedOSSReasoningParser",
"MiniMaxM2ReasoningParser", "MiniMaxM2ReasoningParser",
"MiniMaxM2AppendThinkReasoningParser"
] ]
...@@ -74,7 +74,7 @@ class MiniMaxM2ReasoningParser(BaseThinkingReasoningParser): ...@@ -74,7 +74,7 @@ class MiniMaxM2ReasoningParser(BaseThinkingReasoningParser):
# No end token yet, all content is reasoning # No end token yet, all content is reasoning
return DeltaMessage(reasoning=delta_text) return DeltaMessage(reasoning=delta_text)
@ReasoningParserManager.register_module("minimax_m2_append_think")
class MiniMaxM2AppendThinkReasoningParser(ReasoningParser): class MiniMaxM2AppendThinkReasoningParser(ReasoningParser):
""" """
Reasoning parser for MiniMax M2 model. Reasoning parser for MiniMax M2 model.
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment