test_convmixer.py 2.08 KB
Newer Older
limm's avatar
limm committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
# Copyright (c) OpenMMLab. All rights reserved.
import pytest
import torch

from mmpretrain.models.backbones import ConvMixer


def test_assertion():
    with pytest.raises(AssertionError):
        ConvMixer(arch='unknown')

    with pytest.raises(AssertionError):
        # ConvMixer arch dict should include essential_keys,
        ConvMixer(arch=dict(channels=[2, 3, 4, 5]))

    with pytest.raises(AssertionError):
        # ConvMixer out_indices should be valid depth.
        ConvMixer(out_indices=-100)


@torch.no_grad()  # To save memory
def test_convmixer():

    # Test forward
    model = ConvMixer(arch='768/32')
    model.init_weights()
    model.train()

    imgs = torch.randn(1, 3, 224, 224)
    feat = model(imgs)
    assert len(feat) == 1
    assert feat[0].shape == torch.Size([1, 768, 32, 32])

    # Test forward with multiple outputs
    model = ConvMixer(arch='768/32', out_indices=range(32))

    imgs = torch.randn(1, 3, 224, 224)
    feat = model(imgs)
    assert len(feat) == 32
    for f in feat:
        assert f.shape == torch.Size([1, 768, 32, 32])

    # Test with custom arch
    model = ConvMixer(
        arch={
            'embed_dims': 99,
            'depth': 5,
            'patch_size': 5,
            'kernel_size': 9
        },
        out_indices=range(5))
    model.init_weights()
    model.train()

    imgs = torch.randn(1, 3, 224, 224)
    feat = model(imgs)
    assert len(feat) == 5
    for f in feat:
        assert f.shape == torch.Size([1, 99, 44, 44])

    # Test with even kernel size arch
    model = ConvMixer(arch={
        'embed_dims': 99,
        'depth': 5,
        'patch_size': 5,
        'kernel_size': 8
    })
    model.init_weights()
    model.train()

    imgs = torch.randn(1, 3, 224, 224)
    feat = model(imgs)
    assert len(feat) == 1
    assert feat[0].shape == torch.Size([1, 99, 44, 44])

    # Test frozen_stages
    model = ConvMixer(arch='768/32', frozen_stages=10)
    model.init_weights()
    model.train()

    for i in range(10):
        assert not model.stages[i].training

    for i in range(10, 32):
        assert model.stages[i].training