Unverified commit ee2e69d6, authored by Isotr0py, committed by GitHub
Browse files

[Bugfix][CI/Build] Fix failing pooling models test due to Triton kernel accuracy diff (#31776)


Signed-off-by: Isotr0py <mozf@mail2.sysu.edu.cn>
parent 7101e085
...@@ -78,7 +78,7 @@ def test_modernbert_models( ...@@ -78,7 +78,7 @@ def test_modernbert_models(
for hf_output, vllm_output in zip(hf_outputs, vllm_outputs): for hf_output, vllm_output in zip(hf_outputs, vllm_outputs):
hf_output = hf_output.detach().clone().cpu().float() hf_output = hf_output.detach().clone().cpu().float()
vllm_output = vllm_output.detach().clone().cpu().float() vllm_output = vllm_output.detach().clone().cpu().float()
assert torch.allclose(hf_output, vllm_output, atol=1e-2) torch.testing.assert_close(hf_output, vllm_output, atol=1.2e-2, rtol=1e-3)
@pytest.mark.parametrize("model", ["bd2lcco/Qwen3-0.6B-finetuned"]) @pytest.mark.parametrize("model", ["bd2lcco/Qwen3-0.6B-finetuned"])
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment