Unverified commit 195c9972, authored by Harry Mellor, committed by GitHub
Browse files

Fix LFM2 MoE test for Transformers v5 (#36534)


Signed-off-by: Harry Mellor <19981378+hmellor@users.noreply.github.com>
parent 04b67d8f
...@@ -351,7 +351,11 @@ _TEXT_GENERATION_EXAMPLE_MODELS = { ...@@ -351,7 +351,11 @@ _TEXT_GENERATION_EXAMPLE_MODELS = {
), ),
"Lfm2ForCausalLM": _HfExamplesInfo("LiquidAI/LFM2-1.2B"), "Lfm2ForCausalLM": _HfExamplesInfo("LiquidAI/LFM2-1.2B"),
"Lfm2MoeForCausalLM": _HfExamplesInfo( "Lfm2MoeForCausalLM": _HfExamplesInfo(
"LiquidAI/LFM2-8B-A1B", min_transformers_version="4.58" "LiquidAI/LFM2-8B-A1B",
min_transformers_version="5.0.0",
use_original_num_layers=True,
# Initialize at least one MoE layer
hf_overrides={"num_hidden_layers": 4},
), ),
"LlamaForCausalLM": _HfExamplesInfo( "LlamaForCausalLM": _HfExamplesInfo(
"meta-llama/Llama-3.2-1B-Instruct", "meta-llama/Llama-3.2-1B-Instruct",
...@@ -511,9 +515,7 @@ _TEXT_GENERATION_EXAMPLE_MODELS = { ...@@ -511,9 +515,7 @@ _TEXT_GENERATION_EXAMPLE_MODELS = {
"stepfun-ai/Step-3.5-Flash", "stepfun-ai/Step-3.5-Flash",
use_original_num_layers=True, use_original_num_layers=True,
# Initialize at least one MoE layer # Initialize at least one MoE layer
hf_overrides={ hf_overrides={"num_hidden_layers": 4},
"num_hidden_layers": 4,
},
), ),
"Step3TextForCausalLM": _HfExamplesInfo("stepfun-ai/step3", trust_remote_code=True), "Step3TextForCausalLM": _HfExamplesInfo("stepfun-ai/step3", trust_remote_code=True),
"SolarForCausalLM": _HfExamplesInfo( "SolarForCausalLM": _HfExamplesInfo(
...@@ -1233,9 +1235,7 @@ _SPECULATIVE_DECODING_EXAMPLE_MODELS = { ...@@ -1233,9 +1235,7 @@ _SPECULATIVE_DECODING_EXAMPLE_MODELS = {
speculative_model="stepfun-ai/Step-3.5-Flash", speculative_model="stepfun-ai/Step-3.5-Flash",
use_original_num_layers=True, use_original_num_layers=True,
# Initialize at least one MoE layer # Initialize at least one MoE layer
hf_overrides={ hf_overrides={"num_hidden_layers": 4},
"num_hidden_layers": 4,
},
is_available_online=False, is_available_online=False,
), ),
} }
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment