Unverified commit 664688b9, authored by Yih-Dar and committed by GitHub
Browse files

higher atol to avoid flaky trainer test failure (#17979)


Co-authored-by: ydshieh <ydshieh@users.noreply.github.com>
parent 8bb2c387
...@@ -1252,8 +1252,8 @@ class TrainerIntegrationTest(TestCasePlus, TrainerIntegrationCommon): ...@@ -1252,8 +1252,8 @@ class TrainerIntegrationTest(TestCasePlus, TrainerIntegrationCommon):
trainer.train(resume_from_checkpoint=os.path.join(tmp_dir, "checkpoint-15")) trainer.train(resume_from_checkpoint=os.path.join(tmp_dir, "checkpoint-15"))
(a1, b1) = trainer.model.a.item(), trainer.model.b.item() (a1, b1) = trainer.model.a.item(), trainer.model.b.item()
self.assertAlmostEqual(a, a1, delta=1e-8) self.assertAlmostEqual(a, a1, delta=1e-5)
self.assertAlmostEqual(b, b1, delta=1e-8) self.assertAlmostEqual(b, b1, delta=1e-5)
with self.subTest("Test every epoch"): with self.subTest("Test every epoch"):
config = RegressionModelConfig(a=0, b=2, random_torch=random_torch) config = RegressionModelConfig(a=0, b=2, random_torch=random_torch)
...@@ -1277,8 +1277,8 @@ class TrainerIntegrationTest(TestCasePlus, TrainerIntegrationCommon): ...@@ -1277,8 +1277,8 @@ class TrainerIntegrationTest(TestCasePlus, TrainerIntegrationCommon):
trainer.train(resume_from_checkpoint=os.path.join(tmp_dir, checkpoint_dir)) trainer.train(resume_from_checkpoint=os.path.join(tmp_dir, checkpoint_dir))
(a1, b1) = trainer.model.a.item(), trainer.model.b.item() (a1, b1) = trainer.model.a.item(), trainer.model.b.item()
self.assertAlmostEqual(a, a1, delta=1e-8) self.assertAlmostEqual(a, a1, delta=1e-5)
self.assertAlmostEqual(b, b1, delta=1e-8) self.assertAlmostEqual(b, b1, delta=1e-5)
@slow @slow
@require_torch_non_multi_gpu @require_torch_non_multi_gpu
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment