model_speedup.py 3.44 KB
Newer Older
1
import os
QuanluZhang's avatar
QuanluZhang committed
2
3
4
5
6
7
8
import argparse
import time
import torch
import torch.nn as nn
import torch.nn.functional as F
from torchvision import datasets, transforms
from models.cifar10.vgg import VGG
9
from models.mnist.lenet import LeNet
liuzhe-lz's avatar
liuzhe-lz committed
10
from nni.compression.pytorch import apply_compression_results, ModelSpeedup
QuanluZhang's avatar
QuanluZhang committed
11
12

# Seed torch's RNG so the random dummy input built in model_inference is
# reproducible from run to run.
torch.manual_seed(0)

# Switches read by model_inference:
#   use_mask        - time inference with the pruning masks applied
#   use_speedup     - time inference after ModelSpeedup has rewritten the model
#   compare_results - check that both runs produce the same outputs
use_mask = True
use_speedup = True
compare_results = True
QuanluZhang's avatar
QuanluZhang committed
16

17
18
# Per-example settings, keyed by the name accepted by --example_name.
# Each entry gives the model to build, the shape of the random input fed to
# it, and the path of the masks file to apply.
config = {
    'apoz': {
        'model_name': 'vgg16',
        'input_shape': [64, 3, 32, 32],
        'masks_file': './experiment_data/mask_vgg16_cifar10_apoz.pth'
    },
    'l1filter': {
        'model_name': 'vgg16',
        'input_shape': [64, 3, 32, 32],
        'masks_file': './experiment_data/mask_vgg16_cifar10_l1filter.pth'
    },
    'fpgm': {
        'model_name': 'vgg16',
        'input_shape': [64, 3, 32, 32],
        'masks_file': './experiment_data/mask_vgg16_cifar10_fpgm.pth'
    },
    'slim': {
        'model_name': 'vgg19',
        'input_shape': [64, 3, 32, 32],
        'masks_file': './experiment_data/mask_vgg19_cifar10_slim.pth'
    }
}
QuanluZhang's avatar
QuanluZhang committed
39

40
41
def model_inference(config):
    """Time masked inference and sped-up inference for one example.

    Builds the model named by ``config['model_name']``, then, depending on
    the module-level switches ``use_mask``, ``use_speedup`` and
    ``compare_results``:

    * applies the masks from ``config['masks_file']`` and times 32 forward
      passes on a random input of shape ``config['input_shape']``;
    * runs ``ModelSpeedup`` on the model and times 32 forward passes again;
    * checks that the last outputs of both runs match.

    Args:
        config: dict with the keys ``'model_name'`` (``'vgg16'``,
            ``'vgg19'`` or ``'lenet'``), ``'input_shape'`` and
            ``'masks_file'``.

    Raises:
        ValueError: if ``config['model_name']`` is not a supported model.
        RuntimeError: if the masked and sped-up outputs differ.
    """
    masks_file = config['masks_file']
    device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')

    model_name = config['model_name']
    if model_name == 'vgg16':
        model = VGG(depth=16)
    elif model_name == 'vgg19':
        model = VGG(depth=19)
    elif model_name == 'lenet':
        model = LeNet()
    else:
        # Fail here with a clear message instead of hitting an unbound
        # `model` a few lines further down.
        raise ValueError('unsupported model_name: {!r}'.format(model_name))

    model.to(device)
    model.eval()

    dummy_input = torch.randn(config['input_shape']).to(device)
    use_mask_out = use_speedup_out = None
    # must run use_mask before use_speedup because use_speedup modifies the model
    if use_mask:
        apply_compression_results(model, masks_file, device)
        start = time.time()
        # Inference only: no need to record autograd graphs.
        with torch.no_grad():
            for _ in range(32):
                use_mask_out = model(dummy_input)
        print('elapsed time when use mask: ', time.time() - start)
    if use_speedup:
        m_speedup = ModelSpeedup(model, dummy_input, masks_file, device)
        m_speedup.speedup_model()
        start = time.time()
        with torch.no_grad():
            for _ in range(32):
                use_speedup_out = model(dummy_input)
        print('elapsed time when use speedup: ', time.time() - start)
    if compare_results:
        if use_mask_out is None or use_speedup_out is None:
            # One of the two runs was disabled, so there is nothing to compare.
            print('skip comparing results: use_mask and use_speedup must both be enabled')
        elif torch.allclose(use_mask_out, use_speedup_out, atol=1e-07):
            print('the outputs from use_mask and use_speedup are the same')
        else:
            raise RuntimeError('the outputs from use_mask and use_speedup are different')
QuanluZhang's avatar
QuanluZhang committed
77
78
79
80
81
82

if __name__ == '__main__':
    # Command-line entry point: run one pruning example, or all of them.
    parser = argparse.ArgumentParser("speedup")
    parser.add_argument("--example_name", type=str, default="slim",
                        # Reject unknown names up front instead of failing
                        # later with a KeyError on the config lookup.
                        choices=sorted(config) + ['all'],
                        help="the name of pruning example")
    parser.add_argument("--masks_file", type=str, default=None, help="the path of the masks file")
    args = parser.parse_args()

    if args.example_name != 'all':
        example_names = [args.example_name]
        # A custom masks file only makes sense for a single example.
        if args.masks_file is not None:
            config[args.example_name]['masks_file'] = args.masks_file
    else:
        # --masks_file is ignored here; every example uses its default file.
        example_names = ['fpgm', 'slim', 'l1filter', 'apoz']

    msg = '{} does not exist! You should specify masks_file correctly, ' \
          'or use default one which is generated by model_prune_torch.py'
    for example_name in example_names:
        example_config = config[example_name]
        # Check the masks file before building the model so a missing file
        # is reported with a helpful message in every mode.
        if not os.path.exists(example_config['masks_file']):
            raise RuntimeError(msg.format(example_config['masks_file']))
        model_inference(example_config)