# test_models.py
from collections import OrderedDict
from itertools import product
3
4
5
6
7
import torch
from torchvision import models
import unittest


8
def get_available_classification_models():
    """Return the names of the classification entry points found in ``models``.

    A name is kept when the object bound to it is callable, its first
    character is unchanged by lower-casing, and it does not start with an
    underscore.
    """
    # TODO add a registration mechanism to torchvision.models
    return [k for k, v in models.__dict__.items() if callable(v) and k[0].lower() == k[0] and k[0] != "_"]


def get_available_segmentation_models():
    """Return the names of the entry points found in ``models.segmentation``.

    A name is kept when the object bound to it is callable, its first
    character is unchanged by lower-casing, and it does not start with an
    underscore.
    """
    # TODO add a registration mechanism to torchvision.models
    names = []
    for name, obj in models.segmentation.__dict__.items():
        if not callable(obj):
            continue
        first = name[0]
        if first == "_" or first != first.lower():
            continue
        names.append(name)
    return names
16
17


18
19
20
21
22
def get_available_detection_models():
    """Return the names of the entry points found in ``models.detection``."""
    # TODO add a registration mechanism to torchvision.models

    def is_entry_point(name, obj):
        # Callable, first character unchanged by lower-casing, not underscore-prefixed.
        return callable(obj) and name[0] == name[0].lower() and name[0] != "_"

    return [name for name, obj in models.detection.__dict__.items() if is_entry_point(name, obj)]


23
24
25
26
27
def get_available_video_models():
    """Return the names of the entry points found in ``models.video``.

    Only callables are kept, and only when the first character of the name is
    unchanged by lower-casing and is not an underscore.
    """
    # TODO add a registration mechanism to torchvision.models
    selected = []
    for name, obj in models.video.__dict__.items():
        if callable(obj) and name[0].lower() == name[0] and name[0] != "_":
            selected.append(name)
    return selected


28
29
30
31
# Maps a model name to whether ``torch.jit.script`` is expected to succeed on
# it. Models that are not listed here are not checked for scriptability.
torchub_models = {
    "deeplabv3_resnet101": False,
    "mobilenet_v2": True,
    "resnext50_32x4d": True,
    "fcn_resnet101": False,
    "googlenet": False,
    "densenet121": False,
    "resnet18": True,
    "alexnet": True,
    "shufflenet_v2_x1_0": True,
    "squeezenet1_0": True,
    "vgg11": True,
    "inception_v3": False,
}


45
class Tester(unittest.TestCase):
    """Smoke tests for the model constructors reachable through ``models``.

    The ``_test_*`` helpers build a model, optionally check whether it can be
    scripted, run one forward pass on random input and check the output.
    """

    def check_script(self, model, name):
        """Check that scripting ``model`` succeeds or fails as recorded.

        Args:
            model: the module handed to ``torch.jit.script``.
            name: key looked up in ``torchub_models``; models that are not
                listed there are skipped.
        """
        if name not in torchub_models:
            return
        # Local import: only needed to report scripting failures.
        import traceback

        scriptable = True
        failure = None
        try:
            torch.jit.script(model)
        except Exception:
            # Some models are expected not to script, so this is not an error
            # by itself; keep the traceback so that an unexpected failure can
            # be diagnosed from the assertion message.
            scriptable = False
            failure = traceback.format_exc()
        self.assertEqual(torchub_models[name], scriptable, failure)

    def _test_classification_model(self, name, input_shape):
        """Build classifier ``name`` and check the size of its last output dim."""
        # passing num_class equal to a number other than 1000 helps in making the test
        # more enforcing in nature
        model = models.__dict__[name](num_classes=50)
        self.check_script(model, name)
        model.eval()
        x = torch.rand(input_shape)
        out = model(x)
        self.assertEqual(out.shape[-1], 50)

    def _test_segmentation_model(self, name):
        """Build segmentation model ``name`` and check the shape of ``out["out"]``."""
        # 50 classes is an arbitrary, deliberately unusual value, so the check
        # below only passes if ``num_classes`` is actually honoured
        model = models.segmentation.__dict__[name](num_classes=50, pretrained_backbone=False)
        self.check_script(model, name)
        model.eval()
        input_shape = (1, 3, 300, 300)
        x = torch.rand(input_shape)
        out = model(x)
        self.assertEqual(tuple(out["out"].shape), (1, 50, 300, 300))

    def _test_detection_model(self, name):
        """Build detection model ``name`` and check the structure of its output."""
        model = models.detection.__dict__[name](num_classes=50, pretrained_backbone=False)
        self.check_script(model, name)
        model.eval()
        input_shape = (3, 300, 300)
        x = torch.rand(input_shape)
        model_input = [x]
        out = model(model_input)
        # the list passed in must still hold the very same tensor object
        self.assertIs(model_input[0], x)
        self.assertEqual(len(out), 1)
        self.assertIn("boxes", out[0])
        self.assertIn("scores", out[0])
        self.assertIn("labels", out[0])

    def _test_video_model(self, name):
        """Build video model ``name`` and check the size of its last output dim."""
        # the default input shape is
        # bs * num_channels * clip_len * h *w
        input_shape = (1, 3, 4, 112, 112)
        # test both basicblock and Bottleneck
        model = models.video.__dict__[name](num_classes=50)
        self.check_script(model, name)
        # run in eval mode, like the other forward-pass helpers in this class
        model.eval()
        x = torch.rand(input_shape)
        out = model(x)
        self.assertEqual(out.shape[-1], 50)

    def _make_sliced_model(self, model, stop_layer):
        """Return a ``Sequential`` of ``model``'s children up to ``stop_layer``.

        Children are taken in ``named_children()`` order and ``stop_layer`` is
        included. If no child has that name, all children are kept.
        """
        layers = OrderedDict()
        for name, layer in model.named_children():
            layers[name] = layer
            if name == stop_layer:
                break
        new_model = torch.nn.Sequential(layers)
        return new_model

    def test_memory_efficient_densenet(self):
        """Outputs with and without ``memory_efficient`` must agree to 1e-5."""
        input_shape = (1, 3, 300, 300)
        x = torch.rand(input_shape)

        for name in ['densenet121', 'densenet169', 'densenet201', 'densenet161']:
            model1 = models.__dict__[name](num_classes=50, memory_efficient=True)
            params = model1.state_dict()
            model1.eval()
            out1 = model1(x)
            # also make sure a backward pass runs through the model
            out1.sum().backward()

            # same weights, regular implementation
            model2 = models.__dict__[name](num_classes=50, memory_efficient=False)
            model2.load_state_dict(params)
            model2.eval()
            out2 = model2(x)

            max_diff = (out1 - out2).abs().max()

            self.assertLess(max_diff.item(), 1e-5)

    def test_resnet_dilation(self):
        """Each stride replaced by a dilation doubles the ``layer4`` output size."""
        # TODO improve tests to also check that each layer has the right dimensionality
        for dilation in product([False, True], [False, True], [False, True]):
            model = models.__dict__["resnet50"](replace_stride_with_dilation=dilation)
            model = self._make_sliced_model(model, stop_layer="layer4")
            model.eval()
            x = torch.rand(1, 3, 224, 224)
            out = model(x)
            # sum() counts the True flags
            f = 2 ** sum(dilation)
            self.assertEqual(out.shape, (1, 2048, 7 * f, 7 * f))

    def test_mobilenetv2_residual_setting(self):
        """``mobilenet_v2`` accepts a custom ``inverted_residual_setting``."""
        model = models.__dict__["mobilenet_v2"](inverted_residual_setting=[[1, 16, 1, 1], [6, 24, 2, 2]])
        model.eval()
        x = torch.rand(1, 3, 224, 224)
        out = model(x)
        self.assertEqual(out.shape[-1], 1000)

149

150
for model_name in get_available_classification_models():
    # for-loop bodies don't define scopes, so we have to save the variables
    # we want to close over in some way; here the current name is bound as a
    # default argument
    def do_test(self, model_name=model_name):
        # inception_v3 is tested with a 299x299 input, everything else with 224x224
        input_shape = (1, 3, 224, 224)
        if model_name in ['inception_v3']:
            input_shape = (1, 3, 299, 299)
        self._test_classification_model(model_name, input_shape)

    setattr(Tester, "test_" + model_name, do_test)


for model_name in get_available_segmentation_models():
    # for-loop bodies don't define scopes, so we have to save the variables
    # we want to close over in some way; here the current name is bound as a
    # default argument
    def do_test(self, model_name=model_name):
        self._test_segmentation_model(model_name)

    setattr(Tester, "test_" + model_name, do_test)


171
172
173
174
175
176
177
178
for model_name in get_available_detection_models():
    # The current name is captured through a default argument: a plain closure
    # would only ever see the last value taken by the loop variable.
    def do_test(self, model_name=model_name):
        self._test_detection_model(model_name)

    setattr(Tester, "test_{}".format(model_name), do_test)

179

180
181
182
183
184
185
for model_name in get_available_video_models():
    # Attach one test method per video model; the name is frozen as a default
    # argument because the loop body does not open a new scope.
    def do_test(self, model_name=model_name):
        self._test_video_model(model_name)

    setattr(Tester, "test_%s" % model_name, do_test)
186

187
188
# Run the whole suite when this file is executed as a script.
if "__main__" == __name__:
    unittest.main()