Unverified Commit 3f5dbba9 authored by Jonathan Huang, committed by GitHub

Merge pull request #2685 from tensorflow/nas-fix-3

Fix nasnet image classification and object detection
parents b3f04bca cf8f014b
@@ -30,6 +30,23 @@ arg_scope = tf.contrib.framework.arg_scope
 slim = tf.contrib.slim
 
 
+def nasnet_large_arg_scope_for_detection(is_batch_norm_training=False):
+  """Defines the default arg scope for the NASNet-A Large for object detection.
+
+  This provides a small edit to switch batch norm training on and off.
+
+  Args:
+    is_batch_norm_training: Boolean indicating whether to train with batch norm.
+
+  Returns:
+    An `arg_scope` to use for the NASNet Large Model.
+  """
+  imagenet_scope = nasnet.nasnet_large_arg_scope()
+  with arg_scope(imagenet_scope):
+    with arg_scope([slim.batch_norm], is_training=is_batch_norm_training) as sc:
+      return sc
+
+
 # Note: This is largely a copy of _build_nasnet_base inside nasnet.py but
 # with special edits to remove instantiation of the stem and the special
 # ability to receive as input a pair of hidden states.
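For readers less familiar with `arg_scope`, the new helper relies on scope merging: the outer scope carries all of NASNet's ImageNet batch-norm defaults, and the inner scope overrides only `is_training`. A minimal sketch of that merge, using the same TF 1.x `tf.contrib` API as this diff (the `decay`/`epsilon` values below are stand-ins, not NASNet's real defaults):

import tensorflow as tf

slim = tf.contrib.slim
arg_scope = tf.contrib.framework.arg_scope

# Outer scope: pretend these are the ImageNet training defaults for batch norm.
with arg_scope([slim.batch_norm], decay=0.9997, epsilon=0.001):
  # Inner scope: override a single argument, keep the rest.
  with arg_scope([slim.batch_norm], is_training=False) as sc:
    pass

# `sc` now maps slim.batch_norm to
# {'decay': 0.9997, 'epsilon': 0.001, 'is_training': False}.
# nasnet_large_arg_scope_for_detection applies the same override on top of the
# real nasnet_large_arg_scope() defaults and returns the merged scope.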
@@ -163,11 +180,11 @@ class FasterRCNNNASFeatureExtractor(
       raise ValueError('`preprocessed_inputs` must be 4 dimensional, got a '
                        'tensor of shape %s' % preprocessed_inputs.get_shape())
 
-    with slim.arg_scope(nasnet.nasnet_large_arg_scope()):
+    with slim.arg_scope(nasnet_large_arg_scope_for_detection(
+        is_batch_norm_training=self._train_batch_norm)):
       _, end_points = nasnet.build_nasnet_large(
           preprocessed_inputs, num_classes=None,
           is_training=self._is_training,
-          is_batchnorm_training=self._train_batch_norm,
           final_endpoint='Cell_11')
 
     # Note that both 'Cell_10' and 'Cell_11' have equal depth = 2016.
...
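To see the new pieces end to end, here is a rough sketch (not code from this file) of building the backbone with frozen batch norm and combining the last two cell outputs, whose equal depth of 2016 is noted in the comment above. The import path assumes the TF-Slim `nets` package layout, and `nasnet_large_arg_scope_for_detection` is the helper added earlier in this diff, assumed to be in scope:

import tensorflow as tf
from nets.nasnet import nasnet

slim = tf.contrib.slim

# Hypothetical preprocessed input batch.
preprocessed = tf.placeholder(tf.float32, [1, 331, 331, 3])

with slim.arg_scope(nasnet_large_arg_scope_for_detection(
    is_batch_norm_training=False)):
  _, end_points = nasnet.build_nasnet_large(
      preprocessed, num_classes=None,
      is_training=False,
      final_endpoint='Cell_11')

# Both cells are 2016 channels deep, so the concatenation is 4032 channels deep.
rpn_features = tf.concat(
    [end_points['Cell_10'], end_points['Cell_11']], axis=3)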
@@ -324,7 +324,7 @@ build_nasnet_cifar.default_image_size = 32
 
 
 def build_nasnet_mobile(images, num_classes,
-                        is_training=True, is_batchnorm_training=True,
+                        is_training=True,
                         final_endpoint=None):
   """Build NASNet Mobile model for the ImageNet Dataset."""
   hparams = _mobile_imagenet_config()
@@ -348,32 +348,31 @@ def build_nasnet_mobile(images, num_classes,
   reduction_cell = nasnet_utils.NasNetAReductionCell(
       hparams.num_conv_filters, hparams.drop_path_keep_prob,
       total_num_cells, hparams.total_training_steps)
-  with arg_scope([slim.dropout, nasnet_utils.drop_path],
+  with arg_scope([slim.dropout, nasnet_utils.drop_path, slim.batch_norm],
                  is_training=is_training):
-    with arg_scope([slim.batch_norm], is_training=is_batchnorm_training):
-      with arg_scope([slim.avg_pool2d,
-                      slim.max_pool2d,
-                      slim.conv2d,
-                      slim.batch_norm,
-                      slim.separable_conv2d,
-                      nasnet_utils.factorized_reduction,
-                      nasnet_utils.global_avg_pool,
-                      nasnet_utils.get_channel_index,
-                      nasnet_utils.get_channel_dim],
-                     data_format=hparams.data_format):
-        return _build_nasnet_base(images,
-                                  normal_cell=normal_cell,
-                                  reduction_cell=reduction_cell,
-                                  num_classes=num_classes,
-                                  hparams=hparams,
-                                  is_training=is_training,
-                                  stem_type='imagenet',
-                                  final_endpoint=final_endpoint)
+    with arg_scope([slim.avg_pool2d,
+                    slim.max_pool2d,
+                    slim.conv2d,
+                    slim.batch_norm,
+                    slim.separable_conv2d,
+                    nasnet_utils.factorized_reduction,
+                    nasnet_utils.global_avg_pool,
+                    nasnet_utils.get_channel_index,
+                    nasnet_utils.get_channel_dim],
+                   data_format=hparams.data_format):
+      return _build_nasnet_base(images,
+                                normal_cell=normal_cell,
+                                reduction_cell=reduction_cell,
+                                num_classes=num_classes,
+                                hparams=hparams,
+                                is_training=is_training,
+                                stem_type='imagenet',
+                                final_endpoint=final_endpoint)
 build_nasnet_mobile.default_image_size = 224
 
 
 def build_nasnet_large(images, num_classes,
-                       is_training=True, is_batchnorm_training=True,
+                       is_training=True,
                        final_endpoint=None):
   """Build NASNet Large model for the ImageNet Dataset."""
   hparams = _large_imagenet_config(is_training=is_training)
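On the classification side, the practical effect is that callers now pass a single `is_training` flag and batch norm follows it, because `slim.batch_norm` sits in the same `arg_scope` as `slim.dropout` and `drop_path`. A rough eval-mode sketch (TF-Slim layout assumed; 1001 is the usual slim ImageNet class count, and the 224 input size matches `build_nasnet_mobile.default_image_size`):

import tensorflow as tf
from nets.nasnet import nasnet

slim = tf.contrib.slim

images = tf.placeholder(tf.float32, [None, 224, 224, 3])
with slim.arg_scope(nasnet.nasnet_mobile_arg_scope()):
  # One flag now freezes dropout, drop_path and batch norm together.
  logits, end_points = nasnet.build_nasnet_mobile(
      images, num_classes=1001, is_training=False)
predictions = end_points['Predictions']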
@@ -397,27 +396,26 @@ def build_nasnet_large(images, num_classes,
   reduction_cell = nasnet_utils.NasNetAReductionCell(
       hparams.num_conv_filters, hparams.drop_path_keep_prob,
       total_num_cells, hparams.total_training_steps)
-  with arg_scope([slim.dropout, nasnet_utils.drop_path],
+  with arg_scope([slim.dropout, nasnet_utils.drop_path, slim.batch_norm],
                  is_training=is_training):
-    with arg_scope([slim.batch_norm], is_training=is_batchnorm_training):
-      with arg_scope([slim.avg_pool2d,
-                      slim.max_pool2d,
-                      slim.conv2d,
-                      slim.batch_norm,
-                      slim.separable_conv2d,
-                      nasnet_utils.factorized_reduction,
-                      nasnet_utils.global_avg_pool,
-                      nasnet_utils.get_channel_index,
-                      nasnet_utils.get_channel_dim],
-                     data_format=hparams.data_format):
-        return _build_nasnet_base(images,
-                                  normal_cell=normal_cell,
-                                  reduction_cell=reduction_cell,
-                                  num_classes=num_classes,
-                                  hparams=hparams,
-                                  is_training=is_training,
-                                  stem_type='imagenet',
-                                  final_endpoint=final_endpoint)
+    with arg_scope([slim.avg_pool2d,
+                    slim.max_pool2d,
+                    slim.conv2d,
+                    slim.batch_norm,
+                    slim.separable_conv2d,
+                    nasnet_utils.factorized_reduction,
+                    nasnet_utils.global_avg_pool,
+                    nasnet_utils.get_channel_index,
+                    nasnet_utils.get_channel_dim],
+                   data_format=hparams.data_format):
+      return _build_nasnet_base(images,
+                                normal_cell=normal_cell,
+                                reduction_cell=reduction_cell,
+                                num_classes=num_classes,
+                                hparams=hparams,
+                                is_training=is_training,
+                                stem_type='imagenet',
+                                final_endpoint=final_endpoint)
 build_nasnet_large.default_image_size = 331
...
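For anyone calling these builders directly, the migration is mechanical: drop the removed `is_batchnorm_training` keyword and let `is_training` drive batch norm as well; callers that need the two decoupled wrap the call in an outer `arg_scope`, as the detection change above does. A before/after sketch with placeholder arguments:

import tensorflow as tf
from nets.nasnet import nasnet

slim = tf.contrib.slim

images = tf.placeholder(tf.float32, [None, 331, 331, 3])

# Before this PR (argument no longer exists; shown only for comparison):
#   nasnet.build_nasnet_large(images, num_classes=1001,
#                             is_training=True, is_batchnorm_training=True)

# After this PR: a single flag controls dropout, drop_path and batch norm.
with slim.arg_scope(nasnet.nasnet_large_arg_scope()):
  logits, end_points = nasnet.build_nasnet_large(
      images, num_classes=1001, is_training=True)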