Unverified commit c25231c6, authored by shangmingc and committed by GitHub
Browse files

[CI] Fix flaky pp single node test (#6689)


Signed-off-by: Shangming Cai <caishangming@linux.alibaba.com>
parent fba03b29
......@@ -108,11 +108,13 @@ class TestQwenPPAccuracy(unittest.TestCase):
print(f"[Qwen PP Comparison] Baseline: {baseline} | PP: {pp_metrics}")
self.assertAlmostEqual(
self.assertGreaterEqual(
pp_metrics["accuracy"],
baseline["accuracy"],
delta=0.01,
msg=f"PP accuracy exceeds 1% (baseline: {baseline['accuracy']}, pp: {pp_metrics['accuracy']})",
baseline["accuracy"] - 0.01,
msg=(
f"PP accuracy dropped more than 1% compared to baseline. "
f"Baseline: {baseline['accuracy']:.2%}, PP: {pp_metrics['accuracy']:.2%}"
),
)
......@@ -164,11 +166,13 @@ class TestQwenPPTieWeightsAccuracy(unittest.TestCase):
print(f"[Qwen PP Comparison] Baseline: {baseline} | PP: {pp_metrics}")
self.assertAlmostEqual(
self.assertGreaterEqual(
pp_metrics["accuracy"],
baseline["accuracy"],
delta=0.01,
msg=f"PP accuracy exceeds 1% (baseline: {baseline['accuracy']}, pp: {pp_metrics['accuracy']})",
baseline["accuracy"] - 0.01,
msg=(
f"PP accuracy dropped more than 1% compared to baseline. "
f"Baseline: {baseline['accuracy']:.2%}, PP: {pp_metrics['accuracy']:.2%}"
),
)
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment