Commit 2a0104e2 authored by chenych
Browse files

Update minimax-m2

parent 6f06966e
...@@ -54,7 +54,7 @@ class _HfExamplesInfo: ...@@ -54,7 +54,7 @@ class _HfExamplesInfo:
skip_tokenizer_init: bool = False skip_tokenizer_init: bool = False
""" """
If true, skip initialization of tokenizer and detokenizer. If true, skip initialization of tokenizer and detokenizer.
""" """
dtype: ModelDType = "auto" dtype: ModelDType = "auto"
...@@ -103,7 +103,7 @@ class _HfExamplesInfo: ...@@ -103,7 +103,7 @@ class _HfExamplesInfo:
use_original_num_layers: bool = False use_original_num_layers: bool = False
""" """
If True, use the original number of layers from the model config If True, use the original number of layers from the model config
instead of minimal layers for testing. instead of minimal layers for testing.
""" """
...@@ -300,6 +300,8 @@ _TEXT_GENERATION_EXAMPLE_MODELS = { ...@@ -300,6 +300,8 @@ _TEXT_GENERATION_EXAMPLE_MODELS = {
revision="a59aa9cbc53b9fb8742ca4e9e1531b9802b6fdc3"), # noqa: E501 revision="a59aa9cbc53b9fb8742ca4e9e1531b9802b6fdc3"), # noqa: E501
"MiniMaxM1ForCausalLM": _HfExamplesInfo(os.path.join(models_path_prefix, "MiniMaxAI/MiniMax-M1-40k"), "MiniMaxM1ForCausalLM": _HfExamplesInfo(os.path.join(models_path_prefix, "MiniMaxAI/MiniMax-M1-40k"),
trust_remote_code=True), trust_remote_code=True),
"MiniMaxM2ForCausalLM": _HfExamplesInfo(os.path.join(models_path_prefix, "MiniMaxAI/MiniMax-M2"),
trust_remote_code=True),
"MistralForCausalLM": _HfExamplesInfo(os.path.join(models_path_prefix, "mistralai/Mistral-7B-Instruct-v0.1")), "MistralForCausalLM": _HfExamplesInfo(os.path.join(models_path_prefix, "mistralai/Mistral-7B-Instruct-v0.1")),
"MixtralForCausalLM": _HfExamplesInfo(os.path.join(models_path_prefix, "mistralai/Mixtral-8x7B-Instruct-v0.1"), # noqa: E501 "MixtralForCausalLM": _HfExamplesInfo(os.path.join(models_path_prefix, "mistralai/Mixtral-8x7B-Instruct-v0.1"), # noqa: E501
{"tiny": os.path.join(models_path_prefix, "TitanML/tiny-mixtral")}), # noqa: E501 {"tiny": os.path.join(models_path_prefix, "TitanML/tiny-mixtral")}), # noqa: E501
......
...@@ -74,7 +74,7 @@ class MiniMaxM2ReasoningParser(BaseThinkingReasoningParser): ...@@ -74,7 +74,7 @@ class MiniMaxM2ReasoningParser(BaseThinkingReasoningParser):
# No end token yet, all content is reasoning # No end token yet, all content is reasoning
return DeltaMessage(reasoning=delta_text) return DeltaMessage(reasoning=delta_text)
@ReasoningParserManager.register_module("minimax_m2_append_think")
class MiniMaxM2AppendThinkReasoningParser(ReasoningParser): class MiniMaxM2AppendThinkReasoningParser(ReasoningParser):
""" """
Reasoning parser for MiniMax M2 model. Reasoning parser for MiniMax M2 model.
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment