Add tests for results in script vs eager mode (#1430)

* Add tests for results in script vs eager mode

  This copies some logic from `test_jit.py` to check that a TorchScript'ed
  model's outputs are the same as outputs from the model in eager mode.
  To support differences in TorchScript / eager mode outputs, an `unwrapper`
  function can be provided per-model.
* Fix inception, use PYTORCH_TEST_WITH_SLOW
* Update
* Remove assertNestedTensorObjectsEqual
* Add PYTORCH_TEST_WITH_SLOW to CircleCI config
* Add MaskRCNN unwrapper
* fix prec args
* Remove CI changes
* update
* Update
* remove expect changes
* Fix tolerance bug
* Fix breakages
* Fix quantized resnet
* Fix merge errors and simplify code
* DeepLabV3 has been fixed
* Temporarily disable jit compilation

Add tests for results in script vs eager mode (#1430)
* Add tests for results in script vs eager mode

  This copies some logic from `test_jit.py` to check that a TorchScript'ed
  model's outputs are the same as outputs from the model in eager mode.
  To support differences in TorchScript / eager mode outputs, an `unwrapper`
  function can be provided per-model.
* Fix inception, use PYTORCH_TEST_WITH_SLOW
* Update
* Remove assertNestedTensorObjectsEqual
* Add PYTORCH_TEST_WITH_SLOW to CircleCI config
* Add MaskRCNN unwrapper
* fix prec args
* Remove CI changes
* update
* Update
* remove expect changes
* Fix tolerance bug
* Fix breakages
* Fix quantized resnet
* Fix merge errors and simplify code
* DeepLabV3 has been fixed
* Temporarily disable jit compilation
227027d5 · driazati · Francisco Massa · a44d55d8 · 227027d5 · 227027d5
Commit 227027d5 authored Nov 30, 2019 by driazati Committed by Francisco Massa Nov 30, 2019
9 changed files
--- a/test/common_utils.py
+++ b/test/common_utils.py
@@ -5,10 +5,15 @@ import contextlib
 import unittest
 import argparse
 import sys
+import io
 import torch
 import errno
 import __main__
+from numbers import Number
+from torch._six import string_classes, inf
+from collections import OrderedDict
 @contextlib.contextmanager
 def get_tmp_dir(src=None, **kwargs):
@@ -23,6 +28,9 @@ def get_tmp_dir(src=None, **kwargs):
 ACCEPT = os.getenv('EXPECTTEST_ACCEPT')
+TEST_WITH_SLOW = os.getenv('PYTORCH_TEST_WITH_SLOW', '0') == '1'
+# TEST_WITH_SLOW = True  # TODO: Delete this line once there is a PYTORCH_TEST_WITH_SLOW aware CI job
 parser = argparse.ArgumentParser(add_help=False)
 parser.add_argument('--accept', action='store_true')
@@ -64,10 +72,20 @@ def map_nested_tensor_object(object, tensor_map_fn):
    return impl(object)
+def is_iterable(obj):
+    try:
+        iter(obj)
+        return True
+    except TypeError:
+        return False
 # adapted from TestCase in torch/test/common_utils to accept non-string
 # inputs and set maximum binary size
 class TestCase(unittest.TestCase):
-    def assertExpected(self, output, subname=None, rtol=None, atol=None):
+    precision = 1e-5
+    def assertExpected(self, output, subname=None, prec=None):
        r"""
        Test that a python value matches the recorded contents of a file
        derived from the name of this test and subname.  The value must be
@@ -123,31 +141,182 @@ class TestCase(unittest.TestCase):
        if ACCEPT:
            equal = False
            try:
-                equal = self.assertNestedTensorObjectsEqual(output, expected, rtol=rtol, atol=atol)
+                equal = self.assertEqual(output, expected, prec=prec)
            except Exception:
                equal = False
            if not equal:
                return accept_output("updated output")
        else:
-            self.assertNestedTensorObjectsEqual(output, expected, rtol=rtol, atol=atol)
+            self.assertEqual(output, expected, prec=prec)
-    def assertNestedTensorObjectsEqual(self, a, b, rtol=None, atol=None):
+    def assertEqual(self, x, y, prec=None, message='', allow_inf=False):
-        self.assertEqual(type(a), type(b))
+        """
+        This is copied from pytorch/test/common_utils.py's TestCase.assertEqual
+        """
+        if isinstance(prec, str) and message == '':
+            message = prec
+            prec = None
+        if prec is None:
+            prec = self.precision
-        if isinstance(a, torch.Tensor):
+        if isinstance(x, torch.Tensor) and isinstance(y, Number):
-            torch.testing.assert_allclose(a, b, rtol=rtol, atol=atol)
+            self.assertEqual(x.item(), y, prec=prec, message=message,
+                             allow_inf=allow_inf)
+        elif isinstance(y, torch.Tensor) and isinstance(x, Number):
+            self.assertEqual(x, y.item(), prec=prec, message=message,
+                             allow_inf=allow_inf)
+        elif isinstance(x, torch.Tensor) and isinstance(y, torch.Tensor):
+            def assertTensorsEqual(a, b):
+                super(TestCase, self).assertEqual(a.size(), b.size(), message)
+                if a.numel() > 0:
+                    if (a.device.type == 'cpu' and (a.dtype == torch.float16 or a.dtype == torch.bfloat16)):
+                        # CPU half and bfloat16 tensors don't have the methods we need below
+                        a = a.to(torch.float32)
+                    b = b.to(a)
-        elif isinstance(a, dict):
+                    if (a.dtype == torch.bool) != (b.dtype == torch.bool):
-            self.assertEqual(len(a), len(b))
+                        raise TypeError("Was expecting both tensors to be bool type.")
-            for key, value in a.items():
+                    else:
-                self.assertTrue(key in b, "key: " + str(key))
+                        if a.dtype == torch.bool and b.dtype == torch.bool:
+                            # we want to respect precision but as bool doesn't support subtraction,
+                            # boolean tensor has to be converted to int
+                            a = a.to(torch.int)
+                            b = b.to(torch.int)
-                self.assertNestedTensorObjectsEqual(value, b[key], rtol=rtol, atol=atol)
+                        diff = a - b
-        elif isinstance(a, (list, tuple)):
+                        if a.is_floating_point():
-            self.assertEqual(len(a), len(b))
+                            # check that NaNs are in the same locations
+                            nan_mask = torch.isnan(a)
+                            self.assertTrue(torch.equal(nan_mask, torch.isnan(b)), message)
+                            diff[nan_mask] = 0
+                            # inf check if allow_inf=True
+                            if allow_inf:
+                                inf_mask = torch.isinf(a)
+                                inf_sign = inf_mask.sign()
+                                self.assertTrue(torch.equal(inf_sign, torch.isinf(b).sign()), message)
+                                diff[inf_mask] = 0
+                        # TODO: implement abs on CharTensor (int8)
+                        if diff.is_signed() and diff.dtype != torch.int8:
+                            diff = diff.abs()
+                        max_err = diff.max()
+                        tolerance = prec + prec * abs(a.max())
+                        self.assertLessEqual(max_err, tolerance, message)
+            super(TestCase, self).assertEqual(x.is_sparse, y.is_sparse, message)
+            super(TestCase, self).assertEqual(x.is_quantized, y.is_quantized, message)
+            if x.is_sparse:
+                x = self.safeCoalesce(x)
+                y = self.safeCoalesce(y)
+                assertTensorsEqual(x._indices(), y._indices())
+                assertTensorsEqual(x._values(), y._values())
+            elif x.is_quantized and y.is_quantized:
+                self.assertEqual(x.qscheme(), y.qscheme(), prec=prec,
+                                 message=message, allow_inf=allow_inf)
+                if x.qscheme() == torch.per_tensor_affine:
+                    self.assertEqual(x.q_scale(), y.q_scale(), prec=prec,
+                                     message=message, allow_inf=allow_inf)
+                    self.assertEqual(x.q_zero_point(), y.q_zero_point(),
+                                     prec=prec, message=message,
+                                     allow_inf=allow_inf)
+                elif x.qscheme() == torch.per_channel_affine:
+                    self.assertEqual(x.q_per_channel_scales(), y.q_per_channel_scales(), prec=prec,
+                                     message=message, allow_inf=allow_inf)
+                    self.assertEqual(x.q_per_channel_zero_points(), y.q_per_channel_zero_points(),
+                                     prec=prec, message=message,
+                                     allow_inf=allow_inf)
+                    self.assertEqual(x.q_per_channel_axis(), y.q_per_channel_axis(),
+                                     prec=prec, message=message)
+                self.assertEqual(x.dtype, y.dtype)
+                self.assertEqual(x.int_repr().to(torch.int32),
+                                 y.int_repr().to(torch.int32), prec=prec,
+                                 message=message, allow_inf=allow_inf)
+            else:
+                assertTensorsEqual(x, y)
+        elif isinstance(x, string_classes) and isinstance(y, string_classes):
+            super(TestCase, self).assertEqual(x, y, message)
+        elif type(x) == set and type(y) == set:
+            super(TestCase, self).assertEqual(x, y, message)
+        elif isinstance(x, dict) and isinstance(y, dict):
+            if isinstance(x, OrderedDict) and isinstance(y, OrderedDict):
+                self.assertEqual(x.items(), y.items(), prec=prec,
+                                 message=message, allow_inf=allow_inf)
+            else:
+                self.assertEqual(set(x.keys()), set(y.keys()), prec=prec,
+                                 message=message, allow_inf=allow_inf)
+                key_list = list(x.keys())
+                self.assertEqual([x[k] for k in key_list],
+                                 [y[k] for k in key_list],
+                                 prec=prec, message=message,
+                                 allow_inf=allow_inf)
+        elif is_iterable(x) and is_iterable(y):
+            super(TestCase, self).assertEqual(len(x), len(y), message)
+            for x_, y_ in zip(x, y):
+                self.assertEqual(x_, y_, prec=prec, message=message,
+                                 allow_inf=allow_inf)
+        elif isinstance(x, bool) and isinstance(y, bool):
+            super(TestCase, self).assertEqual(x, y, message)
+        elif isinstance(x, Number) and isinstance(y, Number):
+            if abs(x) == inf or abs(y) == inf:
+                if allow_inf:
+                    super(TestCase, self).assertEqual(x, y, message)
+                else:
+                    self.fail("Expected finite numeric values - x={}, y={}".format(x, y))
+                return
+            super(TestCase, self).assertLessEqual(abs(x - y), prec, message)
+        else:
+            super(TestCase, self).assertEqual(x, y, message)
-            for val1, val2 in zip(a, b):
+    def checkModule(self, nn_module, args, unwrapper=None, skip=False):
-                self.assertNestedTensorObjectsEqual(val1, val2, rtol=rtol, atol=atol)
+        """
+        Check that a nn.Module's results in TorchScript match eager and that it
+        can be exported
+        """
+        if not TEST_WITH_SLOW or skip:
+            # TorchScript is not enabled, skip these tests
+            return
-        else:
+        sm = torch.jit.script(nn_module)
-            self.assertEqual(a, b)
+        with freeze_rng_state():
+            eager_out = nn_module(*args)
+        with freeze_rng_state():
+            script_out = sm(*args)
+            if unwrapper:
+                script_out = unwrapper(script_out)
+        self.assertEqual(eager_out, script_out)
+        self.assertExportImportModule(sm, args)
+        return sm
+    def getExportImportCopy(self, m):
+        """
+        Save and load a TorchScript model
+        """
+        buffer = io.BytesIO()
+        torch.jit.save(m, buffer)
+        buffer.seek(0)
+        imported = torch.jit.load(buffer)
+        return imported
+    def assertExportImportModule(self, m, args):
+        """
+        Check that the results of a model are the same after saving and loading
+        """
+        m_import = self.getExportImportCopy(m)
+        with freeze_rng_state():
+            results = m(*args)
+        with freeze_rng_state():
+            results_from_imported = m_import(*args)
+        self.assertEqual(results, results_from_imported)
+@contextlib.contextmanager
+def freeze_rng_state():
+    rng_state = torch.get_rng_state()
+    if torch.cuda.is_available():
+        cuda_rng_state = torch.cuda.get_rng_state()
+    yield
+    if torch.cuda.is_available():
+        torch.cuda.set_rng_state(cuda_rng_state)
+    torch.set_rng_state(rng_state)
--- a/test/test_models.py
+++ b/test/test_models.py
-from common_utils import TestCase, map_nested_tensor_object
+from common_utils import TestCase, map_nested_tensor_object, freeze_rng_state
 from collections import OrderedDict
 from itertools import product
 import torch
@@ -38,62 +38,68 @@ def get_available_video_models():
 # models that are in torch hub, as well as r3d_18. we tried testing all models
 # but the test was too slow. not included are detection models, because
 # they are not yet supported in JIT.
-script_test_models = [
+# If 'unwrapper' is provided it will be called with the script model outputs
-    "deeplabv3_resnet101",
+# before they are compared to the eager model outputs. This is useful if the
-    "mobilenet_v2",
+# model outputs are different between TorchScript / Eager mode
-    "resnext50_32x4d",
+script_test_models = {
-    "fcn_resnet101",
+    'deeplabv3_resnet101': {},
-    "googlenet",
+    'mobilenet_v2': {},
-    "densenet121",
+    'resnext50_32x4d': {},
-    "resnet18",
+    'fcn_resnet101': {},
-    "alexnet",
+    'googlenet': {
-    "shufflenet_v2_x1_0",
+        'unwrapper': lambda x: x.logits
-    "squeezenet1_0",
+    },
-    "vgg11",
+    'densenet121': {},
-    "inception_v3",
+    'resnet18': {},
-    "r3d_18",
+    'alexnet': {},
-    "fasterrcnn_resnet50_fpn",
+    'shufflenet_v2_x1_0': {},
-    "maskrcnn_resnet50_fpn",
+    'squeezenet1_0': {},
-    "keypointrcnn_resnet50_fpn",
+    'vgg11': {},
-]
+    'inception_v3': {
+        'unwrapper': lambda x: x.logits
+    },
+    'r3d_18': {},
+    "fasterrcnn_resnet50_fpn": {
+        'unwrapper': lambda x: x[1]
+    },
+    "maskrcnn_resnet50_fpn": {
+        'unwrapper': lambda x: x[1]
+    },
+    "keypointrcnn_resnet50_fpn": {
+        'unwrapper': lambda x: x[1]
+    },
+}
 class ModelTester(TestCase):
-    def check_script(self, model, name):
+    def checkModule(self, model, name, args):
        if name not in script_test_models:
            return
-        scriptable = True
+        unwrapper = script_test_models[name].get('unwrapper', None)
-        msg = ""
+        return super(ModelTester, self).checkModule(model, args, unwrapper=unwrapper, skip=False)
-        try:
-            torch.jit.script(model)
-        except Exception as e:
-            tb = traceback.format_exc()
-            scriptable = False
-            msg = str(e) + str(tb)
-        self.assertTrue(scriptable, msg)
    def _test_classification_model(self, name, input_shape):
+        set_rng_seed(0)
        # passing num_class equal to a number other than 1000 helps in making the test
        # more enforcing in nature
-        set_rng_seed(0)
        model = models.__dict__[name](num_classes=50)
-        self.check_script(model, name)
        model.eval()
        x = torch.rand(input_shape)
        out = model(x)
-        self.assertExpected(out, rtol=1e-2, atol=0.)
+        self.assertExpected(out, prec=0.1)
        self.assertEqual(out.shape[-1], 50)
+        self.checkModule(model, name, (x,))
    def _test_segmentation_model(self, name):
        # passing num_class equal to a number other than 1000 helps in making the test
        # more enforcing in nature
        model = models.segmentation.__dict__[name](num_classes=50, pretrained_backbone=False)
-        self.check_script(model, name)
        model.eval()
        input_shape = (1, 3, 300, 300)
        x = torch.rand(input_shape)
        out = model(x)
        self.assertEqual(tuple(out["out"].shape), (1, 50, 300, 300))
+        self.checkModule(model, name, (x,))
    def _test_detection_model(self, name):
        set_rng_seed(0)
@@ -127,24 +133,25 @@ class ModelTester(TestCase):
        # compare results with mean and std
        if name == "maskrcnn_resnet50_fpn":
            test_value = map_nested_tensor_object(out, tensor_map_fn=compute_mean_std)
-            # mean values are small, use large rtol
+            # mean values are small, use large prec
-            self.assertExpected(test_value, rtol=.01, atol=.01)
+            self.assertExpected(test_value, prec=.01)
        else:
-            self.assertExpected(map_nested_tensor_object(out, tensor_map_fn=subsample_tensor))
+            self.assertExpected(map_nested_tensor_object(out, tensor_map_fn=subsample_tensor), prec=0.01)
        scripted_model = torch.jit.script(model)
        scripted_model.eval()
        scripted_out = scripted_model(model_input)[1]
-        self.assertNestedTensorObjectsEqual(scripted_out[0]["boxes"], out[0]["boxes"])
+        self.assertEqual(scripted_out[0]["boxes"], out[0]["boxes"])
-        self.assertNestedTensorObjectsEqual(scripted_out[0]["scores"], out[0]["scores"])
+        self.assertEqual(scripted_out[0]["scores"], out[0]["scores"])
        # labels currently float in script: need to investigate (though same result)
-        self.assertNestedTensorObjectsEqual(scripted_out[0]["labels"].to(dtype=torch.long), out[0]["labels"])
+        self.assertEqual(scripted_out[0]["labels"].to(dtype=torch.long), out[0]["labels"])
        self.assertTrue("boxes" in out[0])
        self.assertTrue("scores" in out[0])
        self.assertTrue("labels" in out[0])
        # don't check script because we are compiling it here:
        # TODO: refactor tests
        # self.check_script(model, name)
+        self.checkModule(model, name, ([x],))
    def _test_video_model(self, name):
        # the default input shape is
@@ -152,9 +159,10 @@ class ModelTester(TestCase):
        input_shape = (1, 3, 4, 112, 112)
        # test both basicblock and Bottleneck
        model = models.video.__dict__[name](num_classes=50)
-        self.check_script(model, name)
+        model.eval()
        x = torch.rand(input_shape)
        out = model(x)
+        self.checkModule(model, name, (x,))
        self.assertEqual(out.shape[-1], 50)
    def _make_sliced_model(self, model, stop_layer):

--- a/torchvision/models/detection/rpn.py
+++ b/torchvision/models/detection/rpn.py
@@ -216,7 +216,6 @@ def concat_box_prediction_layers(box_cls, box_regression):
    # same format as the labels. Note that the labels are computed for
    # all feature levels concatenated, so we keep the same representation
    # for the objectness and the box_regression
-    last_C = torch.jit.annotate(Optional[int], None)
    for box_cls_per_level, box_regression_per_level in zip(
        box_cls, box_regression
    ):
@@ -229,16 +228,14 @@ def concat_box_prediction_layers(box_cls, box_regression):
        )
        box_cls_flattened.append(box_cls_per_level)
-        last_C = C
        box_regression_per_level = permute_and_flatten(
            box_regression_per_level, N, A, 4, H, W
        )
        box_regression_flattened.append(box_regression_per_level)
-    assert last_C is not None
    # concatenate on the first dimension (representing the feature levels), to
    # take into account the way the labels were generated (with all feature maps
    # being concatenated as well)
-    box_cls = torch.cat(box_cls_flattened, dim=1).reshape(-1, last_C)
+    box_cls = torch.cat(box_cls_flattened, dim=1).flatten(0, -2)
    box_regression = torch.cat(box_regression_flattened, dim=1).reshape(-1, 4)
    return box_cls, box_regression

--- a/torchvision/models/mobilenet.py
+++ b/torchvision/models/mobilenet.py
@@ -147,14 +147,16 @@ class MobileNetV2(nn.Module):
                nn.init.normal_(m.weight, 0, 0.01)
                nn.init.zeros_(m.bias)
-    def _forward(self, x):
+    def _forward_impl(self, x):
+        # This exists since TorchScript doesn't support inheritance, so the superclass method
+        # (this one) needs to have a name other than `forward` that can be accessed in a subclass
        x = self.features(x)
        x = x.mean([2, 3])
        x = self.classifier(x)
        return x
-    # Allow for accessing forward method in a inherited class
+    def forward(self, x):
-    forward = _forward
+        return self._forward_impl(x)
 def mobilenet_v2(pretrained=False, progress=True, **kwargs):

--- a/torchvision/models/quantization/mobilenet.py
+++ b/torchvision/models/quantization/mobilenet.py
@@ -44,7 +44,7 @@ class QuantizableMobileNetV2(MobileNetV2):
    def forward(self, x):
        x = self.quant(x)
-        x = self._forward(x)
+        x = self._forward_impl(x)
        x = self.dequant(x)
        return x

--- a/torchvision/models/quantization/resnet.py
+++ b/torchvision/models/quantization/resnet.py
@@ -95,7 +95,7 @@ class QuantizableResNet(ResNet):
        # Ensure scriptability
        # super(QuantizableResNet,self).forward(x)
        # is not scriptable
-        x = self._forward(x)
+        x = self._forward_impl(x)
        x = self.dequant(x)
        return x

--- a/torchvision/models/quantization/shufflenetv2.py
+++ b/torchvision/models/quantization/shufflenetv2.py
@@ -46,7 +46,7 @@ class QuantizableShuffleNetV2(shufflenetv2.ShuffleNetV2):
    def forward(self, x):
        x = self.quant(x)
-        x = self._forward(x)
+        x = self._forward_impl(x)
        x = self.dequant(x)
        return x

--- a/torchvision/models/resnet.py
+++ b/torchvision/models/resnet.py
@@ -194,7 +194,8 @@ class ResNet(nn.Module):
        return nn.Sequential(*layers)
-    def _forward(self, x):
+    def _forward_impl(self, x):
+        # See note [TorchScript super()]
        x = self.conv1(x)
        x = self.bn1(x)
        x = self.relu(x)
@@ -211,8 +212,8 @@ class ResNet(nn.Module):
        return x
-    # Allow for accessing forward method in a inherited class
+    def forward(self, x):
-    forward = _forward
+        return self._forward_impl(x)
 def _resnet(arch, block, layers, pretrained, progress, **kwargs):

--- a/torchvision/models/shufflenetv2.py
+++ b/torchvision/models/shufflenetv2.py
@@ -122,7 +122,8 @@ class ShuffleNetV2(nn.Module):
        self.fc = nn.Linear(output_channels, num_classes)
-    def _forward(self, x):
+    def _forward_impl(self, x):
+        # See note [TorchScript super()]
        x = self.conv1(x)
        x = self.maxpool(x)
        x = self.stage2(x)
@@ -133,7 +134,8 @@ class ShuffleNetV2(nn.Module):
        x = self.fc(x)
        return x
-    forward = _forward
+    def forward(self, x):
+        return self._forward_impl(x)
 def _shufflenetv2(arch, pretrained, progress, *args, **kwargs):