Unverified commit fd4a90f3, authored by wang.yuqi, committed by GitHub
Browse files

[CI] Add PPL test for Qwen3.5. (#35853)


Signed-off-by: wang.yuqi <yuqi.wang@daocloud.io>
Signed-off-by: wang.yuqi <noooop@126.com>
Co-authored-by: gemini-code-assist[bot] <176961590+gemini-code-assist[bot]@users.noreply.github.com>
parent ad9d09e2
...@@ -7,9 +7,9 @@ from tests.models.utils import GenerateModelInfo ...@@ -7,9 +7,9 @@ from tests.models.utils import GenerateModelInfo
from .ppl_utils import wikitext_ppl_test from .ppl_utils import wikitext_ppl_test
MODELS = [ MODELS = [
GenerateModelInfo("google/gemma-2b"), GenerateModelInfo("google/gemma-2b", hf_ppl=21.48524284362793),
GenerateModelInfo("google/gemma-2-2b"), GenerateModelInfo("google/gemma-2-2b", hf_ppl=102.59290313720703),
GenerateModelInfo("google/gemma-3-4b-it"), GenerateModelInfo("google/gemma-3-4b-it", hf_ppl=27.79648208618164),
] ]
......
...@@ -6,7 +6,7 @@ from tests.models.utils import GenerateModelInfo ...@@ -6,7 +6,7 @@ from tests.models.utils import GenerateModelInfo
from .ppl_utils import wikitext_ppl_test from .ppl_utils import wikitext_ppl_test
MODELS = [GenerateModelInfo("openai-community/gpt2-large")] MODELS = [GenerateModelInfo("openai-community/gpt2-large", hf_ppl=19.457056045532227)]
@pytest.mark.parametrize("model_info", MODELS) @pytest.mark.parametrize("model_info", MODELS)
......
...@@ -8,14 +8,20 @@ from tests.models.utils import GenerateModelInfo ...@@ -8,14 +8,20 @@ from tests.models.utils import GenerateModelInfo
from .ppl_utils import wikitext_ppl_test from .ppl_utils import wikitext_ppl_test
MODELS = [ MODELS = [
GenerateModelInfo("Qwen/Qwen3-0.6B"), # for Qwen3
GenerateModelInfo("Qwen/Qwen3-0.6B-FP8"), GenerateModelInfo("Qwen/Qwen3-0.6B", hf_ppl=23.864173889160156),
# transformers: GenerateModelInfo("Qwen/Qwen3-0.6B-FP8", hf_ppl=24.313045501708984),
# Loading a GPTQ quantized model requires optimum, gptqmodel # for Qwen3.5
# GenerateModelInfo("Qwen/Qwen3-0.6B-GPTQ-Int8"), GenerateModelInfo("Qwen/Qwen3.5-0.8B", hf_ppl=19.38858413696289),
] ]
@pytest.mark.parametrize("model_info", MODELS) @pytest.mark.parametrize("model_info", MODELS)
def test_ppl(hf_runner, vllm_runner, model_info: GenerateModelInfo): def test_ppl(hf_runner, vllm_runner, model_info: GenerateModelInfo):
wikitext_ppl_test(hf_runner, vllm_runner, model_info) vllm_extra_kwargs = {}
if model_info.name == "Qwen/Qwen3.5-0.8B":
vllm_extra_kwargs["language_model_only"] = True
wikitext_ppl_test(
hf_runner, vllm_runner, model_info, vllm_extra_kwargs=vllm_extra_kwargs
)
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment