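# votenet.py
# NOTE(review): the text originally on these lines was web-view residue
# (file size, "Newer/Older" controls, committer labels, gutter line numbers),
# not part of the configuration itself.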
# Model configuration dictionary for the 'VoteNet' detector type.
#
# Every nested ``dict(type=...)`` names a component by string; how those names
# are resolved is not visible in this file (presumably a registry lookup in
# the consuming framework -- confirm against the loader).
model = dict(
    type='VoteNet',
    data_preprocessor=dict(type='Det3DDataPreprocessor'),
    # Backbone settings. The four-element tuples (num_points, radius,
    # num_samples, sa_channels) line up index-by-index; fp_channels has two
    # entries.
    backbone=dict(
        type='PointNet2SASSG',
        in_channels=4,
        num_points=(2048, 1024, 512, 256),
        radius=(0.2, 0.4, 0.8, 1.2),
        num_samples=(64, 32, 16, 16),
        sa_channels=((64, 64, 128), (128, 128, 256), (128, 128, 256),
                     (128, 128, 256)),
        fp_channels=((256, 256), (256, 256)),
        norm_cfg=dict(type='BN2d'),
        sa_cfg=dict(
            type='PointSAModule',
            pool_mod='max',
            use_xyz=True,
            normalize_xyz=True)),
    bbox_head=dict(
        type='VoteHead',
        # Vote module settings, including the loss applied to the votes.
        vote_module_cfg=dict(
            in_channels=256,
            vote_per_seed=1,
            gt_per_seed=3,
            conv_channels=(256, 256),
            conv_cfg=dict(type='Conv1d'),
            norm_cfg=dict(type='BN1d'),
            norm_feats=True,
            vote_loss=dict(
                type='ChamferDistance',
                mode='l1',
                reduction='none',
                loss_dst_weight=10.0)),
        # Vote aggregation settings.
        # NOTE(review): mlp_channels starts at 256, the same value as
        # vote_module_cfg.in_channels -- presumably these must agree; confirm.
        vote_aggregation_cfg=dict(
            type='PointSAModule',
            num_point=256,
            radius=0.3,
            num_sample=16,
            mlp_channels=[256, 128, 128, 128],
            use_xyz=True,
            normalize_xyz=True),
        # NOTE(review): in_channels=128 equals the last mlp_channels entry
        # above -- presumably required to match; confirm.
        pred_layer_cfg=dict(
            in_channels=128, shared_conv_channels=(128, 128), bias=True),
        # Loss terms of the head; all but vote_loss use reduction='sum'.
        objectness_loss=dict(
            type='mmdet.CrossEntropyLoss',
            class_weight=[0.2, 0.8],
            reduction='sum',
            loss_weight=5.0),
        center_loss=dict(
            type='ChamferDistance',
            mode='l2',
            reduction='sum',
            loss_src_weight=10.0,
            loss_dst_weight=10.0),
        dir_class_loss=dict(
            type='mmdet.CrossEntropyLoss', reduction='sum', loss_weight=1.0),
        dir_res_loss=dict(
            type='mmdet.SmoothL1Loss', reduction='sum', loss_weight=10.0),
        size_class_loss=dict(
            type='mmdet.CrossEntropyLoss', reduction='sum', loss_weight=1.0),
        size_res_loss=dict(
            type='mmdet.SmoothL1Loss', reduction='sum',
            loss_weight=10.0 / 3.0),
        semantic_loss=dict(
            type='mmdet.CrossEntropyLoss', reduction='sum', loss_weight=1.0)),
    # model training and testing settings
    train_cfg=dict(
        pos_distance_thr=0.3, neg_distance_thr=0.6, sample_mode='vote'),
    test_cfg=dict(
        sample_mode='seed',
        nms_thr=0.25,
        score_thr=0.05,
        per_class_proposal=True))