"torchvision/vscode:/vscode.git/clone" did not exist on "038a01fefea2e0e2d7912ed95708674a82f84ede"
Unverified Commit 6366773f authored by srihari-humbarwadi's avatar srihari-humbarwadi
Browse files

fixed semantic mask rescaling

parent 05541cbe
...@@ -32,22 +32,13 @@ import tensorflow as tf ...@@ -32,22 +32,13 @@ import tensorflow as tf
from official.vision.beta.evaluation import panoptic_quality from official.vision.beta.evaluation import panoptic_quality
def _crop_padding(mask, image_info):
  """Crops the padded border from a single mask.

  Reconstructed post-commit version: the span contained the pre- and
  post-commit revisions interleaved line-by-line; the commit ("fixed
  semantic mask rescaling") collapsed the old two-mask variant into this
  single-mask helper that always crops from the top-left corner.

  Args:
    mask: a [height, width] mask tensor (rank assumed from the
      `expand_dims` / `[:, :, 0]` usage below).
    image_info: a tensor whose row 0 holds the un-padded image
      height/width — NOTE(review): convention assumed from usage here;
      verify against the input pipeline that produces `image_info`.

  Returns:
    The cropped mask with a leading batch dimension, shape
    [1, image_height, image_width].
  """
  # Row 0 of image_info is the true (pre-padding) image extent.
  image_shape = tf.cast(image_info[0, :], tf.int32)
  # crop_to_bounding_box needs a channel axis; add one, crop from (0, 0),
  # then drop it again.
  mask = tf.image.crop_to_bounding_box(
      tf.expand_dims(mask, axis=-1), 0, 0,
      image_shape[0], image_shape[1])
  return tf.expand_dims(mask[:, :, 0], axis=0)
class PanopticQualityEvaluator: class PanopticQualityEvaluator:
"""Panoptic Quality metric class.""" """Panoptic Quality metric class."""
...@@ -163,21 +154,17 @@ class PanopticQualityEvaluator: ...@@ -163,21 +154,17 @@ class PanopticQualityEvaluator:
if self._rescale_predictions: if self._rescale_predictions:
for idx in range(len(groundtruths['category_mask'])): for idx in range(len(groundtruths['category_mask'])):
image_info = groundtruths['image_info'][idx] image_info = groundtruths['image_info'][idx]
groundtruth_category_mask, prediction_category_mask = _crop_padding(
groundtruths['category_mask'][idx],
predictions['category_mask'][idx],
image_info)
groundtruth_instance_mask, prediction_instance_mask = _crop_padding(
groundtruths['instance_mask'][idx],
predictions['instance_mask'][idx],
image_info)
_groundtruths = { _groundtruths = {
'category_mask': groundtruth_category_mask, 'category_mask':
'instance_mask': groundtruth_instance_mask _crop_padding(groundtruths['category_mask'][idx], image_info),
'instance_mask':
_crop_padding(groundtruths['instance_mask'][idx], image_info),
} }
_predictions = { _predictions = {
'category_mask': prediction_category_mask, 'category_mask':
'instance_mask': prediction_instance_mask _crop_padding(predictions['category_mask'][idx], image_info),
'instance_mask':
_crop_padding(predictions['instance_mask'][idx], image_info),
} }
_groundtruths, _predictions = self._convert_to_numpy( _groundtruths, _predictions = self._convert_to_numpy(
_groundtruths, _predictions) _groundtruths, _predictions)
......
...@@ -224,6 +224,25 @@ class PanopticSegmentationGenerator(tf.keras.layers.Layer): ...@@ -224,6 +224,25 @@ class PanopticSegmentationGenerator(tf.keras.layers.Layer):
} }
return results return results
def _resize_and_pad_masks(self, mask, image_info):
  """Rescales a mask back to image space and pads it to the output size.

  Args:
    mask: a mask tensor with a channel axis — presumably
      [height, width, channels]; confirm against the caller.
    image_info: a tensor where (assumed from the indexing below — verify
      against the input pipeline) row 0 is the original image shape,
      row 1 the desired/resized shape, row 2 the scale factors and
      row 3 the padding offsets.

  Returns:
    The mask resized to the pre-scaling resolution, cropped to the
    original image extent, and zero-padded to `self._output_size`.
  """
  # Undo the preprocessing scale: desired size divided by scale factor.
  unscaled_size = tf.cast(
      tf.math.ceil(image_info[1, :] / image_info[2, :]), tf.int32)
  original_extent = tf.cast(image_info[0, :], tf.int32)
  pad_offsets = tf.cast(image_info[3, :], tf.int32)

  resized = tf.image.resize(
      mask, unscaled_size, method=tf.image.ResizeMethod.BILINEAR)
  # Remove the padding that preprocessing added before resizing.
  cropped = tf.image.crop_to_bounding_box(
      resized, pad_offsets[0], pad_offsets[1],
      original_extent[0], original_extent[1])
  # Finally pad (top-left anchored) out to the fixed model output size.
  return tf.image.pad_to_bounding_box(
      cropped, 0, 0, self._output_size[0], self._output_size[1])
def call(self, inputs: tf.Tensor, image_info: Mapping[str, tf.Tensor]): def call(self, inputs: tf.Tensor, image_info: Mapping[str, tf.Tensor]):
detections = inputs detections = inputs
...@@ -232,20 +251,26 @@ class PanopticSegmentationGenerator(tf.keras.layers.Layer): ...@@ -232,20 +251,26 @@ class PanopticSegmentationGenerator(tf.keras.layers.Layer):
batched_detections_masks = tf.expand_dims( batched_detections_masks = tf.expand_dims(
detections['detection_masks'], axis=-1) detections['detection_masks'], axis=-1)
batched_segmentation_masks = tf.image.resize(
detections['segmentation_outputs'],
size=self._output_size,
method='bilinear')
batched_segmentation_masks = tf.expand_dims(tf.cast(
tf.argmax(batched_segmentation_masks, axis=-1),
dtype=tf.float32), axis=-1)
batched_boxes = detections['detection_boxes'] batched_boxes = detections['detection_boxes']
scale = tf.tile( scale = tf.tile(
tf.cast(image_info[:, 2:3, :], dtype=batched_boxes.dtype), tf.cast(image_info[:, 2:3, :], dtype=batched_boxes.dtype),
multiples=[1, 1, 2]) multiples=[1, 1, 2])
batched_boxes /= scale batched_boxes /= scale
batched_segmentation_masks = tf.cast(
detections['segmentation_outputs'], dtype=tf.float32)
batched_segmentation_masks = tf.map_fn(
fn=lambda x: self._resize_and_pad_masks(
x[0], x[1]),
elems=(
batched_segmentation_masks,
image_info),
fn_output_signature=tf.float32,
parallel_iterations=32)
batched_segmentation_masks = tf.expand_dims(tf.cast(
tf.argmax(batched_segmentation_masks, axis=-1),
dtype=tf.float32), axis=-1)
panoptic_masks = tf.map_fn( panoptic_masks = tf.map_fn(
fn=lambda x: self._generate_panoptic_masks( # pylint:disable=g-long-lambda fn=lambda x: self._generate_panoptic_masks( # pylint:disable=g-long-lambda
x[0], x[1], x[2], x[3], x[4]), x[0], x[1], x[2], x[3], x[4]),
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment