Commit 379f951d authored by A. Unique TensorFlower

Fix issue with processing partial batches for the CoLA dataset.

PiperOrigin-RevId: 329012198
parent 45542535
@@ -159,7 +159,8 @@ class SentencePredictionTask(base_task.Task):
     if self.metric_type == 'matthews_corrcoef':
       logs.update({
           'sentence_prediction':
-              tf.expand_dims(tf.math.argmax(outputs, axis=1), axis=0),
+              # Ensure one prediction along batch dimension.
+              tf.expand_dims(tf.math.argmax(outputs, axis=1), axis=1),
           'labels':
               labels,
       })
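Why the axis change matters: when validation runs over a dataset whose last batch is smaller than the global batch size, the per-step prediction tensors no longer share the same batch size. The sketch below is a minimal, hypothetical reproduction in plain NumPy (not the Model Garden aggregate_logs code), assuming per-step outputs are concatenated along their first dimension before the metric is computed:

# Hypothetical sketch of aggregating per-step predictions across batches
# of sizes 8, 8, and 5 (last batch partial). Not the Model Garden code.
import numpy as np

per_step_preds = [
    np.zeros(8, dtype=np.int64),
    np.zeros(8, dtype=np.int64),
    np.zeros(5, dtype=np.int64),  # partial final batch
]

# Old behavior: expand along axis=0 -> shapes (1, 8), (1, 8), (1, 5).
# Concatenating along the first dimension fails because the second
# dimension differs across steps.
try:
  np.concatenate([p[np.newaxis, :] for p in per_step_preds], axis=0)
except ValueError as e:
  print("axis=0 expansion breaks on the partial batch:", e)

# New behavior: expand along axis=1 -> shapes (8, 1), (8, 1), (5, 1).
# The batch dimension stays first, so partial batches concatenate cleanly.
merged = np.concatenate([p[:, np.newaxis] for p in per_step_preds], axis=0)
print(merged.shape)  # (21, 1)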
@@ -86,7 +86,7 @@ class SentencePredictionTaskTest(tf.test.TestCase, parameterized.TestCase):
     iterator = iter(dataset)
     optimizer = tf.keras.optimizers.SGD(lr=0.1)
     task.train_step(next(iterator), model, optimizer, metrics=metrics)
-    task.validation_step(next(iterator), model, metrics=metrics)
+    return task.validation_step(next(iterator), model, metrics=metrics)

   @parameterized.named_parameters(
       ("init_cls_pooler", True),
@@ -182,6 +182,34 @@ class SentencePredictionTaskTest(tf.test.TestCase, parameterized.TestCase):
       aggregated = task.aggregate_logs(state=aggregated, step_outputs=outputs)
     self.assertIn(metric_type, task.reduce_aggregated_logs(aggregated))

+  def test_np_metrics_cola_partial_batch(self):
+    train_data_path = os.path.join(self.get_temp_dir(), "train.tf_record")
+    num_examples = 5
+    global_batch_size = 8
+    seq_length = 16
+    _create_fake_dataset(
+        train_data_path,
+        seq_length=seq_length,
+        num_classes=2,
+        num_examples=num_examples)
+    train_data_config = (
+        sentence_prediction_dataloader.SentencePredictionDataConfig(
+            input_path=train_data_path,
+            seq_length=seq_length,
+            is_training=True,
+            label_type="int",
+            global_batch_size=global_batch_size,
+            drop_remainder=False,
+            include_example_id=True))
+    config = sentence_prediction.SentencePredictionConfig(
+        metric_type="matthews_corrcoef",
+        model=self.get_model_config(2),
+        train_data=train_data_config)
+    outputs = self._run_task(config)
+    self.assertEqual(outputs["sentence_prediction"].shape.as_list(), [8, 1])
+
   def test_task_with_fit(self):
     config = sentence_prediction.SentencePredictionConfig(
         model=self.get_model_config(2), train_data=self._train_data_config)
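For context, the test name ("np_metrics") suggests the matthews_corrcoef value is computed outside the TF graph once all validation outputs have been aggregated. The snippet below is a hedged sketch of that final reduction, assuming the aggregated predictions arrive as an [num_examples, 1] array and using scikit-learn's matthews_corrcoef as a stand-in for whatever the task's reduce_aggregated_logs actually calls:

# Hypothetical reduction step, not the Model Garden implementation:
# flatten the aggregated [num_examples, 1] predictions and compute the
# Matthews correlation coefficient with scikit-learn.
import numpy as np
from sklearn.metrics import matthews_corrcoef

preds = np.array([[1], [0], [1], [1], [0]])   # aggregated predictions
labels = np.array([1, 0, 0, 1, 0])            # aggregated labels

score = matthews_corrcoef(labels, preds.reshape(-1))
print({"matthews_corrcoef": score})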