Commit 577867c6 authored by Poorva Potdar's avatar Poorva Potdar Committed by A. Unique TensorFlower
Browse files

Internal change

PiperOrigin-RevId: 344294492
parent a8ac58ea
# Copyright 2020 The TensorFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
"""Tests for Sampling Strategies."""
from absl.testing import parameterized
import tensorflow as tf
from official.nlp.modeling.ops import sampling_module
def length_norm(length, dtype):
    """Return the length-normalization factor for a decode length.

    The exponent is 0.0, so the factor is always 1.0 — i.e. length
    normalization is deliberately a no-op in these tests while still
    exercising the `length_normalization_fn` code path.
    """
    normalized_length = (5. + tf.cast(length, dtype)) / 6.
    return normalized_length ** 0.0
# Expected output of greedy decoding: the two initial ids ([9, 1]) followed by
# the argmax token of each of the 4 decode steps in `probabilities`.
greedy_expected = tf.constant([[9, 1, 2, 2, 2], [1, 1, 1, 2, 2]])
class SamplingModuleTest(tf.test.TestCase, parameterized.TestCase):
    """Tests greedy, top-k and top-p decoding in `sampling_module`."""

    # Dummy decoder cache: two layers of zero-initialized key/value tensors.
    # NOTE(review): shape [2, 2, 2, 2] presumably means
    # [batch, heads, length, head_dim] — confirm against sampling_module.
    cache = {'layer_%d' % layer: {'k': tf.zeros([2, 2, 2, 2], dtype=tf.float32),
                                  'v': tf.zeros([2, 2, 2, 2], dtype=tf.float32)
                                  } for layer in range(2)}

    # Fixed next-token distributions with shape
    # [batch=2, max_decode_length=4, vocab_size=3]; the fake model below reads
    # the slice for decode step i, independent of the ids generated so far.
    probabilities = tf.constant([[[0.3, 0.4, 0.3], [0.3, 0.3, 0.4],
                                  [0.1, 0.1, 0.8], [0.1, 0.1, 0.8]],
                                 [[0.2, 0.5, 0.3], [0.2, 0.7, 0.1],
                                  [0.1, 0.1, 0.8], [0.1, 0.1, 0.8]]])

    def _get_test_symbols_to_logits_fn(self):
        """Calculates logits of the next tokens.

        Returns:
          A `symbols_to_logits_fn(ids, i, cache)` closure returning
          `(logits, cache)`, where logits are the log of the fixed
          distribution for decode step `i` (the generated ids are ignored).
        """

        def symbols_to_logits_fn(ids, i, cache):
            del ids  # The fake model conditions only on the step index.
            logits = tf.cast(tf.math.log(self.probabilities[:, i, :]),
                             tf.float32)
            return logits, cache

        return symbols_to_logits_fn

    @parameterized.named_parameters([
        ('padded_decode_true', True),
        ('padded_decode_false', False),
    ])
    def test_greedy(self, padded_decode):
        """Greedy decoding picks the argmax token at every step."""
        greedy_obj = sampling_module.SamplingModule(
            length_normalization_fn=None,
            dtype=tf.float32,
            symbols_to_logits_fn=self._get_test_symbols_to_logits_fn(),
            vocab_size=3,
            max_decode_length=4,
            # eos_id=10 is outside vocab_size=3, so decoding never stops early.
            eos_id=10,
            padded_decode=padded_decode)
        ids, _ = greedy_obj.generate(
            initial_ids=tf.constant([9, 1]), initial_cache=self.cache)
        self.assertAllEqual(greedy_expected, ids)

    @parameterized.named_parameters([
        ('padded_decode_true', True),
        ('padded_decode_false', False),
    ])
    def test_topk(self, padded_decode):
        """Top-k sampling with k=3 (full vocab) and a fixed random seed."""
        top_k_obj = sampling_module.SamplingModule(
            length_normalization_fn=length_norm,
            dtype=tf.float32,
            symbols_to_logits_fn=self._get_test_symbols_to_logits_fn(),
            vocab_size=3,
            max_decode_length=4,
            eos_id=10,
            sample_temperature=tf.constant(1.0),
            top_k=tf.constant(3),
            padded_decode=padded_decode,
            enable_greedy=False)
        # Fix the seed so the sampled ids below are deterministic.
        tf.random.set_seed(1)
        ids, _ = top_k_obj.generate(
            initial_ids=tf.constant([9, 1]), initial_cache=self.cache)
        top_k_expected = tf.constant([[9, 1, 0, 2, 2], [1, 0, 1, 1, 0]])
        self.assertAllEqual(top_k_expected, ids)

    @parameterized.named_parameters([
        ('padded_decode_true', True),
        ('padded_decode_false', False),
    ])
    def test_topp(self, padded_decode):
        """Top-p (nucleus) sampling with p=0.9 and a fixed random seed."""
        top_p_obj = sampling_module.SamplingModule(
            length_normalization_fn=length_norm,
            dtype=tf.float32,
            symbols_to_logits_fn=self._get_test_symbols_to_logits_fn(),
            vocab_size=3,
            max_decode_length=4,
            eos_id=10,
            sample_temperature=tf.constant(1.0),
            top_p=tf.constant(0.9),
            padded_decode=padded_decode,
            enable_greedy=False)
        # Fix the seed so the sampled ids below are deterministic.
        tf.random.set_seed(1)
        ids, _ = top_p_obj.generate(
            initial_ids=tf.constant([9, 1]), initial_cache=self.cache)
        top_p_expected = tf.constant([[9, 1, 0, 2, 2], [1, 0, 1, 2, 0]])
        self.assertAllEqual(top_p_expected, ids)

    @parameterized.named_parameters([
        ('padded_decode_true', True),
        ('padded_decode_false', False),
    ])
    def test_sampling_equivalent_greedy(self, padded_decode):
        """Degenerate sampling configurations must reduce to greedy decoding."""
        # Ensure that p=0.0 with no sample temperature is same as greedy.
        top_p_obj = sampling_module.SamplingModule(
            length_normalization_fn=length_norm,
            dtype=tf.float32,
            symbols_to_logits_fn=self._get_test_symbols_to_logits_fn(),
            vocab_size=3,
            max_decode_length=4,
            eos_id=10,
            sample_temperature=0.0,
            top_p=tf.constant(0.0),
            padded_decode=padded_decode,
            enable_greedy=False)
        ids, _ = top_p_obj.generate(
            initial_ids=tf.constant([9, 1]), initial_cache=self.cache)
        self.assertAllEqual(greedy_expected, ids)
        # Ensure that k=1 with no sample temperature is same as greedy.
        top_k_obj = sampling_module.SamplingModule(
            length_normalization_fn=length_norm,
            dtype=tf.float32,
            symbols_to_logits_fn=self._get_test_symbols_to_logits_fn(),
            vocab_size=3,
            max_decode_length=4,
            eos_id=10,
            sample_temperature=0.0,
            top_k=tf.constant(1),
            padded_decode=padded_decode,
            enable_greedy=False)
        ids, _ = top_k_obj.generate(
            initial_ids=tf.constant([9, 1]), initial_cache=self.cache)
        # BUGFIX: the original test generated `ids` here but never asserted on
        # them, so the k=1 branch verified nothing. Per the comment above,
        # k=1 sampling must match greedy decoding.
        self.assertAllEqual(greedy_expected, ids)
        # Ensure that low sample temperature results in Sharp Distribution
        # (greedy).
        low_temperature_obj = sampling_module.SamplingModule(
            length_normalization_fn=length_norm,
            dtype=tf.float32,
            symbols_to_logits_fn=self._get_test_symbols_to_logits_fn(),
            vocab_size=3,
            max_decode_length=4,
            eos_id=10,
            sample_temperature=0.0001,
            padded_decode=padded_decode)
        ids, _ = low_temperature_obj.generate(
            initial_ids=tf.constant([9, 1]), initial_cache=self.cache)
        self.assertAllEqual(greedy_expected, ids)
        # Ensure that high sample temperature results in Flat Distribution
        # (random).
        high_temperature_obj = sampling_module.SamplingModule(
            length_normalization_fn=length_norm,
            dtype=tf.float32,
            symbols_to_logits_fn=self._get_test_symbols_to_logits_fn(),
            vocab_size=3,
            max_decode_length=4,
            eos_id=10,
            sample_temperature=10.0,
            padded_decode=padded_decode,
            enable_greedy=False)
        # Fix the seed so the sampled ids below are deterministic.
        tf.random.set_seed(1)
        ids, _ = high_temperature_obj.generate(
            initial_ids=tf.constant([9, 1]), initial_cache=self.cache)
        expected = tf.constant([[9, 0, 0, 2, 2], [1, 0, 0, 0, 0]])
        self.assertAllEqual(expected, ids)
# Run all test cases in this module when executed as a script.
if __name__ == '__main__':
    tf.test.main()
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment