Commit 2a0104e2 authored by chenych
Browse files

Update minimax-m2

parent 6f06966e
......@@ -54,7 +54,7 @@ class _HfExamplesInfo:
skip_tokenizer_init: bool = False
"""
If true, skip initialization of tokenizer and detokenizer.
If true, skip initialization of tokenizer and detokenizer.
"""
dtype: ModelDType = "auto"
......@@ -103,7 +103,7 @@ class _HfExamplesInfo:
use_original_num_layers: bool = False
"""
If True, use the original number of layers from the model config
If True, use the original number of layers from the model config
instead of minimal layers for testing.
"""
......@@ -300,6 +300,8 @@ _TEXT_GENERATION_EXAMPLE_MODELS = {
revision="a59aa9cbc53b9fb8742ca4e9e1531b9802b6fdc3"), # noqa: E501
"MiniMaxM1ForCausalLM": _HfExamplesInfo(os.path.join(models_path_prefix, "MiniMaxAI/MiniMax-M1-40k"),
trust_remote_code=True),
"MiniMaxM2ForCausalLM": _HfExamplesInfo(os.path.join(models_path_prefix, "MiniMaxAI/MiniMax-M2"),
trust_remote_code=True),
"MistralForCausalLM": _HfExamplesInfo(os.path.join(models_path_prefix, "mistralai/Mistral-7B-Instruct-v0.1")),
"MixtralForCausalLM": _HfExamplesInfo(os.path.join(models_path_prefix, "mistralai/Mixtral-8x7B-Instruct-v0.1"), # noqa: E501
{"tiny": os.path.join(models_path_prefix, "TitanML/tiny-mixtral")}), # noqa: E501
......
......@@ -74,7 +74,7 @@ class MiniMaxM2ReasoningParser(BaseThinkingReasoningParser):
# No end token yet, all content is reasoning
return DeltaMessage(reasoning=delta_text)
@ReasoningParserManager.register_module("minimax_m2_append_think")
class MiniMaxM2AppendThinkReasoningParser(ReasoningParser):
"""
Reasoning parser for MiniMax M2 model.
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment