"...git@developer.sourcefind.cn:tsoc/superbenchmark.git" did not exist on "fdb800dce2ddbfc616e0418c34e2424fbfb96041"
Commit 30195c4a authored by Jennifer
Browse files

Adds absolute error comparison function with better messaging.

parent 8f8b537d
...@@ -6,6 +6,7 @@ import sys ...@@ -6,6 +6,7 @@ import sys
import unittest import unittest
import numpy as np import numpy as np
import torch
from openfold.config import model_config from openfold.config import model_config
from openfold.model.model import AlphaFold from openfold.model.model import AlphaFold
...@@ -119,3 +120,20 @@ def fetch_alphafold_module_weights(weight_path): ...@@ -119,3 +120,20 @@ def fetch_alphafold_module_weights(weight_path):
"Make sure to call import_alphafold before running this function" "Make sure to call import_alphafold before running this function"
) )
return params return params
def _assert_abs_diff_small_base(compare_func, expected, actual, eps):
# Helper function for comparing absolute differences of two torch tensors.
abs_diff = torch.abs(expected - actual)
err = compare_func(abs_diff)
zero_tensor = torch.tensor(0, dtype=err.dtype)
rtol = 1.6e-2 if err.dtype == torch.bfloat16 else 1.3e-6
torch.testing.assert_close(err, zero_tensor, atol=eps, rtol=rtol)
def assert_max_abs_diff_small(expected, actual, eps):
    """Assert that the worst-case (maximum) elementwise absolute
    difference between ``expected`` and ``actual`` stays within ``eps``."""
    worst = torch.max(torch.abs(expected - actual))
    rel_tol = 1.6e-2 if worst.dtype == torch.bfloat16 else 1.3e-6
    reference = torch.tensor(0, dtype=worst.dtype)
    torch.testing.assert_close(worst, reference, atol=eps, rtol=rel_tol)
def assert_mean_abs_diff_small(expected, actual, eps):
    """Assert that the average elementwise absolute difference between
    ``expected`` and ``actual`` stays within ``eps``."""
    avg_dev = torch.mean(torch.abs(expected - actual))
    rel_tol = 1.6e-2 if avg_dev.dtype == torch.bfloat16 else 1.3e-6
    reference = torch.tensor(0, dtype=avg_dev.dtype)
    torch.testing.assert_close(avg_dev, reference, atol=eps, rtol=rel_tol)
...@@ -276,8 +276,7 @@ class TestDeepSpeedKernel(unittest.TestCase): ...@@ -276,8 +276,7 @@ class TestDeepSpeedKernel(unittest.TestCase):
) )
out_repro_ds = out_repro_ds["template_pair_embedding"].cpu() out_repro_ds = out_repro_ds["template_pair_embedding"].cpu()
err = torch.max(torch.abs(out_repro - out_repro_ds)) compare_utils.assert_max_abs_diff_small(out_repro, out_repro_ds, eps)
self.assertTrue(err < eps, f'Error {err}')
def test_compare_model(self): def test_compare_model(self):
""" """
...@@ -335,8 +334,7 @@ class TestDeepSpeedKernel(unittest.TestCase): ...@@ -335,8 +334,7 @@ class TestDeepSpeedKernel(unittest.TestCase):
out_repro = out_repro["sm"]["positions"][-1].squeeze(0) out_repro = out_repro["sm"]["positions"][-1].squeeze(0)
out_repro_ds = out_repro_ds["sm"]["positions"][-1].squeeze(0) out_repro_ds = out_repro_ds["sm"]["positions"][-1].squeeze(0)
err = torch.mean(torch.abs(out_repro - out_repro_ds)) compare_utils.assert_mean_abs_diff_small(out_repro, out_repro_ds, eps)
self.assertTrue(err < eps, f'Error: {err}')
if __name__ == "__main__": if __name__ == "__main__":
......
...@@ -200,8 +200,8 @@ class TestEvoformerStack(unittest.TestCase): ...@@ -200,8 +200,8 @@ class TestEvoformerStack(unittest.TestCase):
out_repro_msa = out_repro_msa.cpu() out_repro_msa = out_repro_msa.cpu()
out_repro_pair = out_repro_pair.cpu() out_repro_pair = out_repro_pair.cpu()
self.assertTrue(torch.mean(torch.abs(out_repro_msa - out_gt_msa)) < consts.eps) compare_utils.assert_mean_abs_diff_small(out_gt_msa, out_repro_msa, consts.eps)
self.assertTrue(torch.max(torch.abs(out_repro_pair - out_gt_pair)) < consts.eps) compare_utils.assert_max_abs_diff_small(out_gt_pair, out_repro_pair, consts.eps)
# Inplace version # Inplace version
out_repro_msa, out_repro_pair = model.evoformer.blocks[0]( out_repro_msa, out_repro_pair = model.evoformer.blocks[0](
...@@ -217,8 +217,8 @@ class TestEvoformerStack(unittest.TestCase): ...@@ -217,8 +217,8 @@ class TestEvoformerStack(unittest.TestCase):
out_repro_msa = out_repro_msa.cpu() out_repro_msa = out_repro_msa.cpu()
out_repro_pair = out_repro_pair.cpu() out_repro_pair = out_repro_pair.cpu()
self.assertTrue(torch.mean(torch.abs(out_repro_msa - out_gt_msa)) < consts.eps) compare_utils.assert_mean_abs_diff_small(out_gt_msa, out_repro_msa, consts.eps)
self.assertTrue(torch.max(torch.abs(out_repro_pair - out_gt_pair)) < consts.eps) compare_utils.assert_max_abs_diff_small(out_gt_pair, out_repro_pair, consts.eps)
class TestExtraMSAStack(unittest.TestCase): class TestExtraMSAStack(unittest.TestCase):
...@@ -354,8 +354,7 @@ class TestMSATransition(unittest.TestCase): ...@@ -354,8 +354,7 @@ class TestMSATransition(unittest.TestCase):
.cpu() .cpu()
) )
self.assertTrue(torch.max(torch.abs(out_gt - out_repro)) < consts.eps) compare_utils.assert_max_abs_diff_small(out_gt, out_repro, consts.eps)
if __name__ == "__main__": if __name__ == "__main__":
unittest.main() unittest.main()
...@@ -386,7 +386,7 @@ class TestFeats(unittest.TestCase): ...@@ -386,7 +386,7 @@ class TestFeats(unittest.TestCase):
torch.tensor(restype_atom14_rigid_group_positions).cuda(), torch.tensor(restype_atom14_rigid_group_positions).cuda(),
).cpu() ).cpu()
self.assertTrue(torch.max(torch.abs(out_gt - out_repro) < consts.eps)) compare_utils.assert_max_abs_diff_small(out_gt, out_repro, consts.eps)
if __name__ == "__main__": if __name__ == "__main__":
......
...@@ -96,7 +96,7 @@ class TestMSARowAttentionWithPairBias(unittest.TestCase): ...@@ -96,7 +96,7 @@ class TestMSARowAttentionWithPairBias(unittest.TestCase):
) )
).cpu() ).cpu()
self.assertTrue(torch.mean(torch.abs(out_gt - out_repro)) < consts.eps) compare_utils.assert_mean_abs_diff_small(out_gt, out_repro, consts.eps)
class TestMSAColumnAttention(unittest.TestCase): class TestMSAColumnAttention(unittest.TestCase):
...@@ -158,7 +158,7 @@ class TestMSAColumnAttention(unittest.TestCase): ...@@ -158,7 +158,7 @@ class TestMSAColumnAttention(unittest.TestCase):
) )
).cpu() ).cpu()
self.assertTrue(torch.mean(torch.abs(out_gt - out_repro)) < consts.eps) compare_utils.assert_mean_abs_diff_small(out_gt, out_repro, consts.eps)
class TestMSAColumnGlobalAttention(unittest.TestCase): class TestMSAColumnGlobalAttention(unittest.TestCase):
...@@ -222,7 +222,7 @@ class TestMSAColumnGlobalAttention(unittest.TestCase): ...@@ -222,7 +222,7 @@ class TestMSAColumnGlobalAttention(unittest.TestCase):
.cpu() .cpu()
) )
self.assertTrue(torch.max(torch.abs(out_gt - out_repro) < consts.eps)) compare_utils.assert_max_abs_diff_small(out_gt, out_repro, consts.eps)
if __name__ == "__main__": if __name__ == "__main__":
......
...@@ -92,7 +92,7 @@ class TestOuterProductMean(unittest.TestCase): ...@@ -92,7 +92,7 @@ class TestOuterProductMean(unittest.TestCase):
# Even when correct, OPM has large, precision-related errors. It gets # Even when correct, OPM has large, precision-related errors. It gets
# a special pass from consts.eps. # a special pass from consts.eps.
self.assertTrue(torch.max(torch.abs(out_gt - out_repro)) < 5e-4) compare_utils.assert_max_abs_diff_small(out_gt, out_repro, 5e-4)
if __name__ == "__main__": if __name__ == "__main__":
......
...@@ -197,7 +197,7 @@ class TestStructureModule(unittest.TestCase): ...@@ -197,7 +197,7 @@ class TestStructureModule(unittest.TestCase):
# The structure module, thanks to angle normalization, is very volatile # The structure module, thanks to angle normalization, is very volatile
# We only assess the mean here. Heuristically speaking, it seems to # We only assess the mean here. Heuristically speaking, it seems to
# have lower error in general on real rather than synthetic data. # have lower error in general on real rather than synthetic data.
self.assertTrue(torch.mean(torch.abs(out_gt - out_repro)) < 0.05) compare_utils.assert_mean_abs_diff_small(out_gt, out_repro, 0.05)
class TestInvariantPointAttention(unittest.TestCase): class TestInvariantPointAttention(unittest.TestCase):
...@@ -321,7 +321,7 @@ class TestInvariantPointAttention(unittest.TestCase): ...@@ -321,7 +321,7 @@ class TestInvariantPointAttention(unittest.TestCase):
torch.as_tensor(sample_mask.squeeze(-1)).float().cuda(), torch.as_tensor(sample_mask.squeeze(-1)).float().cuda(),
).cpu() ).cpu()
self.assertTrue(torch.max(torch.abs(out_gt - out_repro)) < consts.eps) compare_utils.assert_max_abs_diff_small(out_gt, out_repro, consts.eps)
class TestAngleResnet(unittest.TestCase): class TestAngleResnet(unittest.TestCase):
......
...@@ -191,9 +191,7 @@ class TestTemplatePairStack(unittest.TestCase): ...@@ -191,9 +191,7 @@ class TestTemplatePairStack(unittest.TestCase):
_mask_trans=False, _mask_trans=False,
).cpu() ).cpu()
diff = torch.max(torch.abs(out_gt - out_repro)) compare_utils.assert_max_abs_diff_small(out_gt, out_repro, consts.eps)
self.assertTrue(diff < consts.eps,
msg=f"Found difference between ground truth and reproduction of {diff}")
class Template(unittest.TestCase): class Template(unittest.TestCase):
...@@ -286,7 +284,7 @@ class Template(unittest.TestCase): ...@@ -286,7 +284,7 @@ class Template(unittest.TestCase):
out_repro = out_repro_all["template_pair_embedding"] out_repro = out_repro_all["template_pair_embedding"]
out_repro = out_repro.cpu() out_repro = out_repro.cpu()
self.assertTrue(torch.max(torch.abs(out_gt - out_repro)) < consts.eps) compare_utils.assert_mean_abs_diff_small(out_gt, out_repro, consts.eps)
if __name__ == "__main__": if __name__ == "__main__":
......
...@@ -102,7 +102,7 @@ class TestTriangularAttention(unittest.TestCase): ...@@ -102,7 +102,7 @@ class TestTriangularAttention(unittest.TestCase):
chunk_size=None, chunk_size=None,
).cpu() ).cpu()
self.assertTrue(torch.mean(torch.abs(out_gt - out_repro)) < consts.eps) compare_utils.assert_mean_abs_diff_small(out_gt, out_repro, consts.eps)
@compare_utils.skip_unless_alphafold_installed() @compare_utils.skip_unless_alphafold_installed()
def test_tri_att_end_compare(self): def test_tri_att_end_compare(self):
......
...@@ -103,7 +103,7 @@ class TestTriangularMultiplicativeUpdate(unittest.TestCase): ...@@ -103,7 +103,7 @@ class TestTriangularMultiplicativeUpdate(unittest.TestCase):
inplace_safe=True, _inplace_chunk_size=4, inplace_safe=True, _inplace_chunk_size=4,
).cpu() ).cpu()
self.assertTrue(torch.mean(torch.abs(out_gt - out_repro)) < consts.eps) compare_utils.assert_mean_abs_diff_small(out_gt, out_repro, consts.eps)
@compare_utils.skip_unless_alphafold_installed() @compare_utils.skip_unless_alphafold_installed()
def test_tri_mul_out_compare(self): def test_tri_mul_out_compare(self):
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment