Merge pull request #604 from thangvubk/master

Change frozen to requires_grad for clearer behavior

Merge pull request #604 from thangvubk/master
Change frozen to requires_grad for clearer behavior
14fc9f0f · Kai Chen · GitHub · 01e5ec51 · 025149c1 · 14fc9f0f
Unverified commit 14fc9f0f, authored May 07, 2019 by Kai Chen; committed by GitHub on May 07, 2019
16 changed files
--- a/configs/cascade_mask_rcnn_r50_c4_1x.py
+++ b/configs/cascade_mask_rcnn_r50_c4_1x.py
@@ -11,7 +11,7 @@ model = dict(
        dilations=(1, 1, 1),
        out_indices=(2, ),
        frozen_stages=1,
-        normalize=dict(type='BN', frozen=True),
+        normalize=dict(type='BN', requires_grad=False),
        norm_eval=True,
        style='caffe'),
    shared_head=dict(
@@ -21,7 +21,7 @@ model = dict(
        stride=2,
        dilation=1,
        style='caffe',
-        normalize=dict(type='BN', frozen=True),
+        normalize=dict(type='BN', requires_grad=False),
        norm_eval=True),
    rpn_head=dict(
        type='RPNHead',

--- a/configs/cascade_rcnn_r50_c4_1x.py
+++ b/configs/cascade_rcnn_r50_c4_1x.py
@@ -11,7 +11,7 @@ model = dict(
        dilations=(1, 1, 1),
        out_indices=(2, ),
        frozen_stages=1,
-        normalize=dict(type='BN', frozen=True),
+        normalize=dict(type='BN', requires_grad=False),
        norm_eval=True,
        style='caffe'),
    shared_head=dict(
@@ -21,7 +21,7 @@ model = dict(
        stride=2,
        dilation=1,
        style='caffe',
-        normalize=dict(type='BN', frozen=True),
+        normalize=dict(type='BN', requires_grad=False),
        norm_eval=True),
    rpn_head=dict(
        type='RPNHead',

--- a/configs/fast_rcnn_r50_c4_1x.py
+++ b/configs/fast_rcnn_r50_c4_1x.py
@@ -10,7 +10,7 @@ model = dict(
        dilations=(1, 1, 1),
        out_indices=(2, ),
        frozen_stages=1,
-        normalize=dict(type='BN', frozen=True),
+        normalize=dict(type='BN', requires_grad=False),
        norm_eval=True,
        style='caffe'),
    shared_head=dict(
@@ -20,7 +20,7 @@ model = dict(
        stride=2,
        dilation=1,
        style='caffe',
-        normalize=dict(type='BN', frozen=True),
+        normalize=dict(type='BN', requires_grad=False),
        norm_eval=True),
    bbox_roi_extractor=dict(
        type='SingleRoIExtractor',

--- a/configs/faster_rcnn_r50_c4_1x.py
+++ b/configs/faster_rcnn_r50_c4_1x.py
@@ -10,7 +10,7 @@ model = dict(
        dilations=(1, 1, 1),
        out_indices=(2, ),
        frozen_stages=1,
-        normalize=dict(type='BN', frozen=True),
+        normalize=dict(type='BN', requires_grad=False),
        norm_eval=True,
        style='caffe'),
    shared_head=dict(
@@ -20,7 +20,7 @@ model = dict(
        stride=2,
        dilation=1,
        style='caffe',
-        normalize=dict(type='BN', frozen=True),
+        normalize=dict(type='BN', requires_grad=False),
        norm_eval=True),
    rpn_head=dict(
        type='RPNHead',

--- a/configs/gn+ws/faster_rcnn_r50_fpn_gn_ws_1x.py
+++ b/configs/gn+ws/faster_rcnn_r50_fpn_gn_ws_1x.py
 # model settings
 conv_cfg = dict(type='ConvWS')
-normalize = dict(type='GN', num_groups=32, frozen=False)
+normalize = dict(type='GN', num_groups=32, requires_grad=True)
 model = dict(
    type='FasterRCNN',
    pretrained='open-mmlab://jhu/resnet50_gn_ws',

--- a/configs/gn+ws/mask_rcnn_r50_fpn_gn_ws_20_23_24e.py
+++ b/configs/gn+ws/mask_rcnn_r50_fpn_gn_ws_20_23_24e.py
 # model settings
 conv_cfg = dict(type='ConvWS')
-normalize = dict(type='GN', num_groups=32, frozen=False)
+normalize = dict(type='GN', num_groups=32, requires_grad=True)
 model = dict(
    type='MaskRCNN',
    pretrained='open-mmlab://jhu/resnet50_gn_ws',

--- a/configs/gn+ws/mask_rcnn_r50_fpn_gn_ws_2x.py
+++ b/configs/gn+ws/mask_rcnn_r50_fpn_gn_ws_2x.py
 # model settings
 conv_cfg = dict(type='ConvWS')
-normalize = dict(type='GN', num_groups=32, frozen=False)
+normalize = dict(type='GN', num_groups=32, requires_grad=True)
 model = dict(
    type='MaskRCNN',
    pretrained='open-mmlab://jhu/resnet50_gn_ws',

--- a/configs/gn+ws/mask_rcnn_x101_32x4d_fpn_gn_ws_2x.py
+++ b/configs/gn+ws/mask_rcnn_x101_32x4d_fpn_gn_ws_2x.py
 # model settings
 conv_cfg = dict(type='ConvWS')
-normalize = dict(type='GN', num_groups=32, frozen=False)
+normalize = dict(type='GN', num_groups=32, requires_grad=True)
 model = dict(
    type='MaskRCNN',
    pretrained='open-mmlab://jhu/resnext101_32x4d_gn_ws',

--- a/configs/gn/mask_rcnn_r101_fpn_gn_2x.py
+++ b/configs/gn/mask_rcnn_r101_fpn_gn_2x.py
 # model settings
-normalize = dict(type='GN', num_groups=32, frozen=False)
+normalize = dict(type='GN', num_groups=32, requires_grad=True)
 model = dict(
    type='MaskRCNN',

--- a/configs/gn/mask_rcnn_r50_fpn_gn_2x.py
+++ b/configs/gn/mask_rcnn_r50_fpn_gn_2x.py
 # model settings
-normalize = dict(type='GN', num_groups=32, frozen=False)
+normalize = dict(type='GN', num_groups=32, requires_grad=True)
 model = dict(
    type='MaskRCNN',

--- a/configs/gn/mask_rcnn_r50_fpn_gn_contrib_2x.py
+++ b/configs/gn/mask_rcnn_r50_fpn_gn_contrib_2x.py
 # model settings
-normalize = dict(type='GN', num_groups=32, frozen=False)
+normalize = dict(type='GN', num_groups=32, requires_grad=True)
 model = dict(
    type='MaskRCNN',

--- a/configs/mask_rcnn_r50_c4_1x.py
+++ b/configs/mask_rcnn_r50_c4_1x.py
@@ -10,7 +10,7 @@ model = dict(
        dilations=(1, 1, 1),
        out_indices=(2, ),
        frozen_stages=1,
-        normalize=dict(type='BN', frozen=True),
+        normalize=dict(type='BN', requires_grad=False),
        norm_eval=True,
        style='caffe'),
    shared_head=dict(
@@ -20,7 +20,7 @@ model = dict(
        stride=2,
        dilation=1,
        style='caffe',
-        normalize=dict(type='BN', frozen=True),
+        normalize=dict(type='BN', requires_grad=False),
        norm_eval=True),
    rpn_head=dict(
        type='RPNHead',

--- a/configs/rpn_r50_c4_1x.py
+++ b/configs/rpn_r50_c4_1x.py
@@ -10,7 +10,7 @@ model = dict(
        dilations=(1, 1, 1),
        out_indices=(2, ),
        frozen_stages=1,
-        normalize=dict(type='BN', frozen=True),
+        normalize=dict(type='BN', requires_grad=False),
        norm_eval=True,
        style='caffe'),
    neck=None,

--- a/mmdet/models/backbones/resnet.py
+++ b/mmdet/models/backbones/resnet.py
@@ -307,8 +307,8 @@ class ResNet(nn.Module):
        style (str): `pytorch` or `caffe`. If set to "pytorch", the stride-two
            layer is the 3x3 conv layer, otherwise the stride-two layer is
            the first 1x1 conv layer.
-        frozen_stages (int): Stages to be frozen (all param fixed). -1 means
+        frozen_stages (int): Stages to be frozen (stop grad and set eval mode).
-            not freezing any parameters.
+            -1 means not freezing any parameters.
        normalize (dict): dictionary to construct and config norm layer.
        norm_eval (bool): Whether to set norm layers to eval mode, namely,
            freeze running stats (mean and var). Note: Effect on Batch Norm
@@ -336,7 +336,7 @@ class ResNet(nn.Module):
                 style='pytorch',
                 frozen_stages=-1,
                 conv_cfg=None,
-                 normalize=dict(type='BN', frozen=False),
+                 normalize=dict(type='BN', requires_grad=True),
                 norm_eval=True,
                 dcn=None,
                 stage_with_dcn=(False, False, False, False),

--- a/mmdet/models/shared_heads/res_layer.py
+++ b/mmdet/models/shared_heads/res_layer.py
@@ -17,7 +17,7 @@ class ResLayer(nn.Module):
                 stride=2,
                 dilation=1,
                 style='pytorch',
-                 normalize=dict(type='BN', frozen=False),
+                 normalize=dict(type='BN', requires_grad=True),
                 norm_eval=True,
                 with_cp=False,
                 dcn=None):

--- a/mmdet/models/utils/norm.py
+++ b/mmdet/models/utils/norm.py
@@ -17,15 +17,13 @@ def build_norm_layer(cfg, num_features, postfix=''):
        cfg (dict): cfg should contain:
            type (str): identify norm layer type.
            layer args: args needed to instantiate a norm layer.
-            frozen (bool): [optional] whether stop gradient updates
+            requires_grad (bool): [optional] whether norm params are trainable
-                of norm layer, it is helpful to set frozen mode
+        num_features (int): number of channels from input.
-                in backbone's norms.
+        postfix (int, str): appended into norm abbreviation to
-        num_features (int): number of channels from input
-        postfix (int, str): appended into norm abbreation to
            create named layer.
    Returns:
-        name (str): abbreation + postfix
+        name (str): abbreviation + postfix
        layer (nn.Module): created norm layer
    """
    assert isinstance(cfg, dict) and 'type' in cfg
@@ -42,7 +40,7 @@ def build_norm_layer(cfg, num_features, postfix=''):
    assert isinstance(postfix, (int, str))
    name = abbr + str(postfix)
-    frozen = cfg_.pop('frozen', False)
+    requires_grad = cfg_.pop('requires_grad', True)
    cfg_.setdefault('eps', 1e-5)
    if layer_type != 'GN':
        layer = norm_layer(num_features, **cfg_)
@@ -50,8 +48,7 @@ def build_norm_layer(cfg, num_features, postfix=''):
        assert 'num_groups' in cfg_
        layer = norm_layer(num_channels=num_features, **cfg_)
-    if frozen:
+    for param in layer.parameters():
-        for param in layer.parameters():
+        param.requires_grad = requires_grad
-            param.requires_grad = False
    return name, layer