Merge branch 'qianyj_tf' into 'main'

update tf code See merge request dcutoolkit/deeplearing/dlexamples_new!35

Merge branch 'qianyj_tf' into 'main'
update tf code See merge request dcutoolkit/deeplearing/dlexamples_new!35
9dafea91 · sunxx1 · 92a2ca36 · a4146470 · 92a2ca36 · 92a2ca36
Commit 9dafea91 authored Aug 02, 2022 by sunxx1
20 changed files
--- a/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/transformer/utils/tokenizer.py
+++ b/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/transformer/utils/tokenizer.py
-# Copyright 2018 The TensorFlow Authors. All Rights Reserved.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-# ==============================================================================
-"""Defines Subtokenizer class to encode and decode strings."""
-
-from __future__ import absolute_import
-from __future__ import division
-from __future__ import print_function
-
-import collections
-import re
-import sys
-import unicodedata
-
-import numpy as np
-import six
-from six.moves import xrange  # pylint: disable=redefined-builtin
-import tensorflow as tf
-
-PAD = "<pad>"
-PAD_ID = 0
-EOS = "<EOS>"
-EOS_ID = 1
-RESERVED_TOKENS = [PAD, EOS]
-
-# Set of characters that will be used in the function _escape_token() (see func
-# docstring for more details).
-# This set is added to the alphabet list to ensure that all escaped tokens can
-# be encoded.
-_ESCAPE_CHARS = set(u"\\_u;0123456789")
-# Regex for the function _unescape_token(), the inverse of _escape_token().
-# This is used to find "\u", "\\", and "\###;" substrings in the token.
-_UNESCAPE_REGEX = re.compile(r"\\u|\\\\|\\([0-9]+);")
-
-_UNDEFINED_UNICODE = u"\u3013"
-
-# Set contains all letter and number characters.
-_ALPHANUMERIC_CHAR_SET = set(
-    six.unichr(i) for i in xrange(sys.maxunicode)
-    if (unicodedata.category(six.unichr(i)).startswith("L") or
-        unicodedata.category(six.unichr(i)).startswith("N")))
-
-# min_count is the minimum number of times a subtoken must appear in the data
-# before before it is added to the vocabulary. The value is found using binary
-# search to obtain the target vocabulary size.
-_MIN_MIN_COUNT = 1     # min value to use when binary searching for min_count
-_MAX_MIN_COUNT = 1000  # max value to use when binary searching for min_count
-
-
-class Subtokenizer(object):
-  """Encodes and decodes strings to/from integer IDs."""
-
-  def __init__(self, vocab_file, reserved_tokens=None):
-    """Initializes class, creating a vocab file if data_files is provided."""
-    tf.logging.info("Initializing Subtokenizer from file %s." % vocab_file)
-
-    if reserved_tokens is None:
-      reserved_tokens = RESERVED_TOKENS
-
-    self.subtoken_list = _load_vocab_file(vocab_file, reserved_tokens)
-    self.alphabet = _generate_alphabet_dict(self.subtoken_list)
-    self.subtoken_to_id_dict = _list_to_index_dict(self.subtoken_list)
-
-    self.max_subtoken_length = 0
-    for subtoken in self.subtoken_list:
-      self.max_subtoken_length = max(self.max_subtoken_length, len(subtoken))
-
-    # Create cache to speed up subtokenization
-    self._cache_size = 2 ** 20
-    self._cache = [(None, None)] * self._cache_size
-
-  @staticmethod
-  def init_from_files(
-      vocab_file, files, target_vocab_size, threshold, min_count=None,
-      file_byte_limit=1e6, reserved_tokens=None):
-    """Create subtoken vocabulary based on files, and save vocab to file.
-
-    Args:
-      vocab_file: String name of vocab file to store subtoken vocabulary.
-      files: List of file paths that will be used to generate vocabulary.
-      target_vocab_size: target vocabulary size to generate.
-      threshold: int threshold of vocabulary size to accept.
-      min_count: int minimum count to use for generating the vocabulary. The min
-        count is the minimum number of times a subtoken should appear in the
-        files before it is added to the vocabulary. If set to none, this value
-        is found using binary search.
-      file_byte_limit: (Default 1e6) Maximum number of bytes of sample text that
-        will be drawn from the files.
-      reserved_tokens: List of string tokens that are guaranteed to be at the
-        beginning of the subtoken vocabulary list.
-
-    Returns:
-      Subtokenizer object
-    """
-    if reserved_tokens is None:
-      reserved_tokens = RESERVED_TOKENS
-
-    if tf.gfile.Exists(vocab_file):
-      tf.logging.info("Vocab file already exists (%s)" % vocab_file)
-    else:
-      tf.logging.info("Begin steps to create subtoken vocabulary...")
-      token_counts = _count_tokens(files, file_byte_limit)
-      alphabet = _generate_alphabet_dict(token_counts)
-      subtoken_list = _generate_subtokens_with_target_vocab_size(
-          token_counts, alphabet, target_vocab_size, threshold, min_count,
-          reserved_tokens)
-      tf.logging.info("Generated vocabulary with %d subtokens." %
-                      len(subtoken_list))
-      _save_vocab_file(vocab_file, subtoken_list)
-    return Subtokenizer(vocab_file)
-
-  def encode(self, raw_string, add_eos=False):
-    """Encodes a string into a list of int subtoken ids."""
-    ret = []
-    tokens = _split_string_to_tokens(_native_to_unicode(raw_string))
-    for token in tokens:
-      ret.extend(self._token_to_subtoken_ids(token))
-    if add_eos:
-      ret.append(EOS_ID)
-    return ret
-
-  def _token_to_subtoken_ids(self, token):
-    """Encode a single token into a list of subtoken ids."""
-    cache_location = hash(token) % self._cache_size
-    cache_key, cache_value = self._cache[cache_location]
-    if cache_key == token:
-      return cache_value
-
-    ret = _split_token_to_subtokens(
-        _escape_token(token, self.alphabet), self.subtoken_to_id_dict,
-        self.max_subtoken_length)
-    ret = [self.subtoken_to_id_dict[subtoken_id] for subtoken_id in ret]
-
-    self._cache[cache_location] = (token, ret)
-    return ret
-
-  def decode(self, subtokens):
-    """Converts list of int subtokens ids into a string."""
-    if isinstance(subtokens, np.ndarray):
-      # Note that list(subtokens) converts subtokens to a python list, but the
-      # items remain as np.int32. This converts both the array and its items.
-      subtokens = subtokens.tolist()
-
-    if not subtokens:
-      return ""
-
-    assert isinstance(subtokens, list) and isinstance(subtokens[0], int), (
-        "Subtokens argument passed into decode() must be a list of integers.")
-
-    return _unicode_to_native(
-        _join_tokens_to_string(self._subtoken_ids_to_tokens(subtokens)))
-
-  def _subtoken_ids_to_tokens(self, subtokens):
-    """Convert list of int subtoken ids to a list of string tokens."""
-    escaped_tokens = "".join([
-        self.subtoken_list[s] for s in subtokens
-        if s < len(self.subtoken_list)])
-    escaped_tokens = escaped_tokens.split("_")
-
-    # All tokens in the vocabulary list have been escaped (see _escape_token())
-    # so each token must be unescaped when decoding.
-    ret = []
-    for token in escaped_tokens:
-      if token:
-        ret.append(_unescape_token(token))
-    return ret
-
-
-def _save_vocab_file(vocab_file, subtoken_list):
-  """Save subtokens to file."""
-  with tf.gfile.Open(vocab_file, mode="w") as f:
-    for subtoken in subtoken_list:
-      f.write("'%s'\n" % _unicode_to_native(subtoken))
-
-
-def _load_vocab_file(vocab_file, reserved_tokens=None):
-  """Load vocabulary while ensuring reserved tokens are at the top."""
-  if reserved_tokens is None:
-    reserved_tokens = RESERVED_TOKENS
-
-  subtoken_list = []
-  with tf.gfile.Open(vocab_file, mode="r") as f:
-    for line in f:
-      subtoken = _native_to_unicode(line.strip())
-      subtoken = subtoken[1:-1]  # Remove surrounding single-quotes
-      if subtoken in reserved_tokens:
-        continue
-      subtoken_list.append(_native_to_unicode(subtoken))
-  return reserved_tokens + subtoken_list
-
-
-def _native_to_unicode(s):
-  """Convert string to unicode (required in Python 2)."""
-  try:               # Python 2
-    return s if isinstance(s, unicode) else s.decode("utf-8")
-  except NameError:  # Python 3
-    return s
-
-
-def _unicode_to_native(s):
-  """Convert string from unicode to native format (required in Python 2)."""
-  try:               # Python 2
-    return s.encode("utf-8") if isinstance(s, unicode) else s
-  except NameError:  # Python 3
-    return s
-
-
-def _split_string_to_tokens(text):
-  """Splits text to a list of string tokens."""
-  if not text:
-    return []
-  ret = []
-  token_start = 0
-  # Classify each character in the input string
-  is_alnum = [c in _ALPHANUMERIC_CHAR_SET for c in text]
-  for pos in xrange(1, len(text)):
-    if is_alnum[pos] != is_alnum[pos - 1]:
-      token = text[token_start:pos]
-      if token != u" " or token_start == 0:
-        ret.append(token)
-      token_start = pos
-  final_token = text[token_start:]
-  ret.append(final_token)
-  return ret
-
-
-def _join_tokens_to_string(tokens):
-  """Join a list of string tokens into a single string."""
-  token_is_alnum = [t[0] in _ALPHANUMERIC_CHAR_SET for t in tokens]
-  ret = []
-  for i, token in enumerate(tokens):
-    if i > 0 and token_is_alnum[i - 1] and token_is_alnum[i]:
-      ret.append(u" ")
-    ret.append(token)
-  return "".join(ret)
-
-
-def _escape_token(token, alphabet):
-  r"""Replace characters that aren't in the alphabet and append "_" to token.
-
-  Apply three transformations to the token:
-    1. Replace underline character "_" with "\u", and backslash "\" with "\\".
-    2. Replace characters outside of the alphabet with "\###;", where ### is the
-       character's Unicode code point.
-    3. Appends "_" to mark the end of a token.
-
-  Args:
-    token: unicode string to be escaped
-    alphabet: list of all known characters
-
-  Returns:
-    escaped string
-  """
-  token = token.replace(u"\\", u"\\\\").replace(u"_", u"\\u")
-  ret = [c if c in alphabet and c != u"\n" else r"\%d;" % ord(c) for c in token]
-  return u"".join(ret) + "_"
-
-
-def _unescape_token(token):
-  r"""Replaces escaped characters in the token with their unescaped versions.
-
-  Applies inverse transformations as _escape_token():
-    1. Replace "\u" with "_", and "\\" with "\".
-    2. Replace "\###;" with the unicode character the ### refers to.
-
-  Args:
-    token: escaped string
-
-  Returns:
-    unescaped string
-  """
-
-  def match(m):
-    r"""Returns replacement string for matched object.
-
-    Matched objects contain one of the strings that matches the regex pattern:
-      r"\\u|\\\\|\\([0-9]+);"
-    The strings can be '\u', '\\', or '\###;' (### is any digit number).
-
-    m.group(0) refers to the entire matched string ('\u', '\\', or '\###;').
-    m.group(1) refers to the first parenthesized subgroup ('###').
-
-    m.group(0) exists for all match objects, while m.group(1) exists only for
-    the string '\###;'.
-
-    This function looks to see if m.group(1) exists. If it doesn't, then the
-    matched string must be '\u' or '\\' . In this case, the corresponding
-    replacement ('_' and '\') are returned. Note that in python, a single
-    backslash is written as '\\', and double backslash as '\\\\'.
-
-    If m.goup(1) exists, then use the integer in m.group(1) to return a
-    unicode character.
-
-    Args:
-      m: match object
-
-    Returns:
-      String to replace matched object with.
-    """
-    # Check if the matched strings are '\u' or '\\'.
-    if m.group(1) is None:
-      return u"_" if m.group(0) == u"\\u" else u"\\"
-
-    # If m.group(1) exists, try and return unicode character.
-    try:
-      return six.unichr(int(m.group(1)))
-    except (ValueError, OverflowError) as _:
-      return _UNDEFINED_UNICODE
-
-  # Use match function to replace escaped substrings in the token.
-  return _UNESCAPE_REGEX.sub(match, token)
-
-
-def _count_tokens(files, file_byte_limit=1e6):
-  """Return token counts of words in the files.
-
-  Samples file_byte_limit bytes from each file, and counts the words that appear
-  in the samples. The samples are semi-evenly distributed across the file.
-
-  Args:
-    files: List of filepaths
-    file_byte_limit: Max number of bytes that will be read from each file.
-
-  Returns:
-    Dictionary mapping tokens to the number of times they appear in the sampled
-    lines from the files.
-  """
-  token_counts = collections.defaultdict(int)
-
-  for filepath in files:
-    with tf.gfile.Open(filepath, mode="r") as reader:
-      file_byte_budget = file_byte_limit
-      counter = 0
-      lines_to_skip = int(reader.size() / (file_byte_budget * 2))
-      for line in reader:
-        if counter < lines_to_skip:
-          counter += 1
-        else:
-          if file_byte_budget < 0:
-            break
-          line = line.strip()
-          file_byte_budget -= len(line)
-          counter = 0
-
-          # Add words to token counts
-          for token in _split_string_to_tokens(_native_to_unicode(line)):
-            token_counts[token] += 1
-  return token_counts
-
-
-def _list_to_index_dict(lst):
-  """Create dictionary mapping list items to their indices in the list."""
-  return {item: n for n, item in enumerate(lst)}
-
-
-def _split_token_to_subtokens(token, subtoken_dict, max_subtoken_length):
-  """Splits a token into subtokens defined in the subtoken dict."""
-  ret = []
-  start = 0
-  token_len = len(token)
-  while start < token_len:
-    # Find the longest subtoken, so iterate backwards.
-    for end in xrange(min(token_len, start + max_subtoken_length), start, -1):
-      subtoken = token[start:end]
-      if subtoken in subtoken_dict:
-        ret.append(subtoken)
-        start = end
-        break
-    else:  # Did not break
-      # If there is no possible encoding of the escaped token then one of the
-      # characters in the token is not in the alphabet. This should be
-      # impossible and would be indicative of a bug.
-      raise ValueError("Was unable to split token \"%s\" into subtokens." %
-                       token)
-  return ret
-
-
-def _generate_subtokens_with_target_vocab_size(
-    token_counts, alphabet, target_size, threshold, min_count=None,
-    reserved_tokens=None):
-  """Generate subtoken vocabulary close to the target size."""
-  if reserved_tokens is None:
-    reserved_tokens = RESERVED_TOKENS
-
-  if min_count is not None:
-    tf.logging.info("Using min_count=%d to generate vocab with target size %d" %
-                    (min_count, target_size))
-    return _generate_subtokens(
-        token_counts, alphabet, min_count, reserved_tokens=reserved_tokens)
-
-  def bisect(min_val, max_val):
-    """Recursive function to binary search for subtoken vocabulary."""
-    cur_count = (min_val + max_val) // 2
-    tf.logging.info("Binary search: trying min_count=%d (%d %d)" %
-                    (cur_count, min_val, max_val))
-    subtoken_list = _generate_subtokens(
-        token_counts, alphabet, cur_count, reserved_tokens=reserved_tokens)
-
-    val = len(subtoken_list)
-    tf.logging.info("Binary search: min_count=%d resulted in %d tokens" %
-                    (cur_count, val))
-
-    within_threshold = abs(val - target_size) < threshold
-    if within_threshold or min_val >= max_val or cur_count < 2:
-      return subtoken_list
-    if val > target_size:
-      other_subtoken_list = bisect(cur_count + 1, max_val)
-    else:
-      other_subtoken_list = bisect(min_val, cur_count - 1)
-
-    # Return vocabulary dictionary with the closest number of tokens.
-    other_val = len(other_subtoken_list)
-    if abs(other_val - target_size) < abs(val - target_size):
-      return other_subtoken_list
-    return subtoken_list
-
-  tf.logging.info("Finding best min_count to get target size of %d" %
-                  target_size)
-  return bisect(_MIN_MIN_COUNT, _MAX_MIN_COUNT)
-
-
-def _generate_alphabet_dict(iterable, reserved_tokens=None):
-  """Create set of characters that appear in any element in the iterable."""
-  if reserved_tokens is None:
-    reserved_tokens = RESERVED_TOKENS
-  alphabet = {c for token in iterable for c in token}
-  alphabet |= {c for token in reserved_tokens for c in token}
-  alphabet |= _ESCAPE_CHARS  # Add escape characters to alphabet set.
-  return alphabet
-
-
-def _count_and_gen_subtokens(
-    token_counts, alphabet, subtoken_dict, max_subtoken_length):
-  """Count number of times subtokens appear, and generate new subtokens.
-
-  Args:
-    token_counts: dict mapping tokens to the number of times they appear in the
-      original files.
-    alphabet: list of allowed characters. Used to escape the tokens, which
-      guarantees that all tokens can be split into subtokens.
-    subtoken_dict: dict mapping subtokens to ids.
-    max_subtoken_length: maximum length of subtoken in subtoken_dict.
-
-  Returns:
-    A defaultdict mapping subtokens to the number of times they appear in the
-    tokens. The dict may contain new subtokens.
-  """
-  subtoken_counts = collections.defaultdict(int)
-  for token, count in six.iteritems(token_counts):
-    token = _escape_token(token, alphabet)
-    subtokens = _split_token_to_subtokens(
-        token, subtoken_dict, max_subtoken_length)
-
-    # Generate new subtokens by taking substrings from token.
-    start = 0
-    for subtoken in subtokens:
-      for end in xrange(start + 1, len(token) + 1):
-        new_subtoken = token[start:end]
-        subtoken_counts[new_subtoken] += count
-      start += len(subtoken)
-
-  return subtoken_counts
-
-
-def _filter_and_bucket_subtokens(subtoken_counts, min_count):
-  """Return a bucketed list of subtokens that are filtered by count.
-
-  Args:
-    subtoken_counts: defaultdict mapping subtokens to their counts
-    min_count: int count used to filter subtokens
-
-  Returns:
-    List of subtoken sets, where subtokens in set i have the same length=i.
-  """
-  # Create list of buckets, where subtokens in bucket i have length i.
-  subtoken_buckets = []
-  for subtoken, count in six.iteritems(subtoken_counts):
-    if count < min_count:  # Filter out subtokens that don't appear enough
-      continue
-    while len(subtoken_buckets) <= len(subtoken):
-      subtoken_buckets.append(set())
-    subtoken_buckets[len(subtoken)].add(subtoken)
-  return subtoken_buckets
-
-
-def _gen_new_subtoken_list(
-    subtoken_counts, min_count, alphabet, reserved_tokens=None):
-  """Generate candidate subtokens ordered by count, and new max subtoken length.
-
-  Add subtokens to the candiate list in order of length (longest subtokens
-  first). When a subtoken is added, the counts of each of its prefixes are
-  decreased. Prefixes that don't appear much outside the subtoken are not added
-  to the candidate list.
-
-  For example:
-    subtoken being added to candidate list: 'translate'
-    subtoken_counts: {'translate':10, 't':40, 'tr':16, 'tra':12, ...}
-    min_count: 5
-
-  When 'translate' is added, subtoken_counts is updated to:
-    {'translate':0, 't':30, 'tr':6, 'tra': 2, ...}
-
-  The subtoken 'tra' will not be added to the candidate list, because it appears
-  twice (less than min_count) outside of 'translate'.
-
-  Args:
-    subtoken_counts: defaultdict mapping str subtokens to int counts
-    min_count: int minumum count requirement for subtokens
-    alphabet: set of characters. Each character is added to the subtoken list to
-      guarantee that all tokens can be encoded.
-    reserved_tokens: list of tokens that will be added to the beginning of the
-      returned subtoken list.
-
-  Returns:
-    List of candidate subtokens in decreasing count order, and maximum subtoken
-    length
-  """
-  if reserved_tokens is None:
-    reserved_tokens = RESERVED_TOKENS
-
-  # Create a list of (count, subtoken) for each candidate subtoken.
-  subtoken_candidates = []
-
-  # Use bucketted list to iterate through subtokens in order of length.
-  # subtoken_buckets[i] = set(subtokens), where each subtoken has length i.
-  subtoken_buckets = _filter_and_bucket_subtokens(subtoken_counts, min_count)
-  max_subtoken_length = len(subtoken_buckets) - 1
-
-  # Go through the list in reverse order to consider longer subtokens first.
-  for subtoken_len in xrange(max_subtoken_length, 0, -1):
-    for subtoken in subtoken_buckets[subtoken_len]:
-      count = subtoken_counts[subtoken]
-
-      # Possible if this subtoken is a prefix of another token.
-      if count < min_count:
-        continue
-
-      # Ignore alphabet/reserved tokens, which will be added manually later.
-      if subtoken not in alphabet and subtoken not in reserved_tokens:
-        subtoken_candidates.append((count, subtoken))
-
-      # Decrement count of the subtoken's prefixes (if a longer subtoken is
-      # added, its prefixes lose priority to be added).
-      for end in xrange(1, subtoken_len):
-        subtoken_counts[subtoken[:end]] -= count
-
-  # Add alphabet subtokens (guarantees that all strings are encodable).
-  subtoken_candidates.extend((subtoken_counts.get(a, 0), a) for a in alphabet)
-
-  # Order subtoken candidates by decreasing count.
-  subtoken_list = [t for _, t in sorted(subtoken_candidates, reverse=True)]
-
-  # Add reserved tokens to beginning of the list.
-  subtoken_list = reserved_tokens + subtoken_list
-  return subtoken_list, max_subtoken_length
-
-
-def _generate_subtokens(
-    token_counts, alphabet, min_count, num_iterations=4,
-    reserved_tokens=None):
-  """Create a list of subtokens in decreasing order of frequency.
-
-  Args:
-    token_counts: dict mapping str tokens -> int count
-    alphabet: set of characters
-    min_count: int minimum number of times a subtoken must appear before it is
-      added to the vocabulary.
-    num_iterations: int number of iterations to generate new tokens.
-    reserved_tokens: list of tokens that will be added to the beginning to the
-      returned subtoken list.
-
-  Returns:
-    Sorted list of subtokens (most frequent first)
-  """
-  if reserved_tokens is None:
-    reserved_tokens = RESERVED_TOKENS
-
-  # Use alphabet set to create initial list of subtokens
-  subtoken_list = reserved_tokens + list(alphabet)
-  max_subtoken_length = 1
-
-  # On each iteration, segment all words using the subtokens defined in
-  # subtoken_dict, count how often the resulting subtokens appear, and update
-  # the dictionary with subtokens w/ high enough counts.
-  for i in xrange(num_iterations):
-    tf.logging.info("\tGenerating subtokens: iteration %d" % i)
-    # Generate new subtoken->id dictionary using the new subtoken list.
-    subtoken_dict = _list_to_index_dict(subtoken_list)
-
-    # Create dict mapping subtoken->count, with additional subtokens created
-    # from substrings taken from the tokens.
-    subtoken_counts = _count_and_gen_subtokens(
-        token_counts, alphabet, subtoken_dict, max_subtoken_length)
-
-    # Generate new list of subtokens sorted by subtoken count.
-    subtoken_list, max_subtoken_length = _gen_new_subtoken_list(
-        subtoken_counts, min_count, alphabet, reserved_tokens)
-
-    tf.logging.info("\tVocab size: %d" % len(subtoken_list))
-  return subtoken_list
--- a/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/transformer/utils/tokenizer_test.py
+++ b/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/transformer/utils/tokenizer_test.py
-# Copyright 2018 The TensorFlow Authors. All Rights Reserved.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-# ==============================================================================
-"""Test Subtokenizer and string helper methods."""
-
-import collections
-import tempfile
-
-import tensorflow as tf  # pylint: disable=g-bad-import-order
-
-from official.transformer.utils import tokenizer
-
-
-class SubtokenizerTest(tf.test.TestCase):
-
-  def _init_subtokenizer(self, vocab_list):
-    temp_file = tempfile.NamedTemporaryFile(delete=False)
-    with tf.gfile.Open(temp_file.name, 'w') as w:
-      for subtoken in vocab_list:
-        w.write("'%s'" % subtoken)
-        w.write("\n")
-    return tokenizer.Subtokenizer(temp_file.name, reserved_tokens=[])
-
-  def test_encode(self):
-    vocab_list = ["123_", "test", "ing_"]
-    subtokenizer = self._init_subtokenizer(vocab_list)
-    s = "testing 123"
-    encoded_list = subtokenizer.encode(s)
-    self.assertEqual([1, 2, 0], encoded_list)
-
-  def test_decode(self):
-    vocab_list = ["123_", "test", "ing_"]
-    subtokenizer = self._init_subtokenizer(vocab_list)
-    encoded_list = [1, 2, 0]  # testing 123
-    decoded_str = subtokenizer.decode(encoded_list)
-    self.assertEqual("testing 123", decoded_str)
-
-  def test_subtoken_ids_to_tokens(self):
-    vocab_list = ["123_", "test", "ing_"]
-    subtokenizer = self._init_subtokenizer(vocab_list)
-    encoded_list = [1, 2, 0]  # testing 123
-    token_list = subtokenizer._subtoken_ids_to_tokens(encoded_list)
-    self.assertEqual([u"testing", u"123"], token_list)
-
-
-class StringHelperTest(tf.test.TestCase):
-
-  def test_split_string_to_tokens(self):
-    text = "test? testing 123."
-
-    tokens = tokenizer._split_string_to_tokens(text)
-    self.assertEqual(["test", "? ", "testing", "123", "."], tokens)
-
-  def test_join_tokens_to_string(self):
-    tokens = ["test", "? ", "testing", "123", "."]
-
-    s = tokenizer._join_tokens_to_string(tokens)
-    self.assertEqual("test? testing 123.", s)
-
-  def test_escape_token(self):
-    token = u"abc_\\4"
-    alphabet = set("abc_\\u;")
-
-    escaped_token = tokenizer._escape_token(token, alphabet)
-    self.assertEqual("abc\\u\\\\\\52;_", escaped_token)
-
-  def test_unescape_token(self):
-    escaped_token = u"Underline: \\u, Backslash: \\\\, Unicode: \\52;"
-
-    unescaped_token = tokenizer._unescape_token(escaped_token)
-    self.assertEqual(
-        "Underline: _, Backslash: \\, Unicode: 4", unescaped_token)
-
-  def test_list_to_index_dict(self):
-    lst = ["test", "strings"]
-
-    d = tokenizer._list_to_index_dict(lst)
-    self.assertDictEqual({"test": 0, "strings": 1}, d)
-
-  def test_split_token_to_subtokens(self):
-    token = "abc"
-    subtoken_dict = {"a": 0, "b": 1, "c": 2, "ab": 3}
-    max_subtoken_length = 2
-
-    subtokens = tokenizer._split_token_to_subtokens(
-        token, subtoken_dict, max_subtoken_length)
-    self.assertEqual(["ab", "c"], subtokens)
-
-  def test_generate_alphabet_dict(self):
-    s = ["testing", "123"]
-    reserved_tokens = ["???"]
-
-    alphabet = tokenizer._generate_alphabet_dict(s, reserved_tokens)
-    self.assertIn("?", alphabet)
-    self.assertIn("t", alphabet)
-    self.assertIn("e", alphabet)
-    self.assertIn("s", alphabet)
-    self.assertIn("i", alphabet)
-    self.assertIn("n", alphabet)
-    self.assertIn("g", alphabet)
-    self.assertIn("1", alphabet)
-    self.assertIn("2", alphabet)
-    self.assertIn("3", alphabet)
-
-  def test_count_and_gen_subtokens(self):
-    token_counts = {"abc": 5}
-    alphabet = set("abc_")
-    subtoken_dict = {"a": 0, "b": 1, "c": 2, "_": 3}
-    max_subtoken_length = 2
-
-    subtoken_counts = tokenizer._count_and_gen_subtokens(
-        token_counts, alphabet, subtoken_dict, max_subtoken_length)
-
-    self.assertIsInstance(subtoken_counts, collections.defaultdict)
-    self.assertDictEqual(
-        {"a": 5, "b": 5, "c": 5, "_": 5, "ab": 5, "bc": 5, "c_": 5,
-         "abc": 5, "bc_": 5, "abc_": 5}, subtoken_counts)
-
-  def test_filter_and_bucket_subtokens(self):
-    subtoken_counts = collections.defaultdict(
-        int, {"a": 2, "b": 4, "c": 1, "ab": 6, "ac": 3, "abbc": 5})
-    min_count = 3
-
-    subtoken_buckets = tokenizer._filter_and_bucket_subtokens(
-        subtoken_counts, min_count)
-
-    self.assertEqual(len(subtoken_buckets[0]), 0)
-    self.assertEqual(set("b"), subtoken_buckets[1])
-    self.assertEqual(set(["ab", "ac"]), subtoken_buckets[2])
-    self.assertEqual(len(subtoken_buckets[3]), 0)
-    self.assertEqual(set(["abbc"]), subtoken_buckets[4])
-
-  def test_gen_new_subtoken_list(self):
-    subtoken_counts = collections.defaultdict(
-        int, {"translate": 10, "t": 40, "tr": 16, "tra": 12})
-    min_count = 5
-    alphabet = set("translate")
-    reserved_tokens = ["reserved", "tokens"]
-
-    subtoken_list, max_token_length = tokenizer._gen_new_subtoken_list(
-        subtoken_counts, min_count, alphabet, reserved_tokens)
-
-    # Check that "tra" isn"t in the list (its count should be decremented to 2,
-    # so it should not be added to the canddiate list).
-    self.assertNotIn("tra", subtoken_list)
-
-    self.assertIn("tr", subtoken_list)
-    self.assertIn("t", subtoken_list)
-
-    self.assertEqual(len("translate"), max_token_length)
-
-  def test_generate_subtokens(self):
-    token_counts = {"ab": 1, "bc": 3, "abc": 5}
-    alphabet = set("abc_")
-    min_count = 100
-    num_iterations = 1
-    reserved_tokens = ["reserved", "tokens"]
-
-    vocab_list = tokenizer._generate_subtokens(
-        token_counts, alphabet, min_count, num_iterations, reserved_tokens)
-
-    # Check that reserved tokens are at the front of the list
-    self.assertEqual(vocab_list[:2], reserved_tokens)
-
-    # Check that each character in alphabet is in the vocab list
-    for c in alphabet:
-      self.assertIn(c, vocab_list)
-
-
-if __name__ == "__main__":
-  tf.test.main()
--- a/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/__init__.py
+++ b/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/__init__.py
--- a/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/accelerator/__init__.py
+++ b/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/accelerator/__init__.py
--- a/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/accelerator/tpu.py
+++ b/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/accelerator/tpu.py
-# Copyright 2018 The TensorFlow Authors. All Rights Reserved.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-# ==============================================================================
-"""Functions specific to running TensorFlow on TPUs."""
-
-import tensorflow as tf
-
-
-# "local" is a magic word in the TPU cluster resolver; it tells the resolver
-# to use the local CPU as the compute device. This is useful for testing and
-# debugging: the code flow is ostensibly identical, but there is no need to
-# actually have a TPU on the other end.
-LOCAL = "local"
-
-
-def construct_scalar_host_call(metric_dict, model_dir, prefix=""):
-  """Construct a host call to log scalars when training on TPU.
-
-  The global step and every metric tensor are reshaped to shape `[1]` so that
-  they carry the leading batch dimension `host_call` expects.
-
-  Args:
-    metric_dict: A dict mapping metric names to the tensors to be logged.
-    model_dir: The location to write the summary.
-    prefix: The prefix (if any) to prepend to the metric names.
-
-  Returns:
-    A tuple of (function, args_to_be_passed_to_said_function). The argument
-    list holds the global step tensor followed by one tensor per metric, in
-    the same order as the metric names captured by the function.
-  """
-  # type: (dict, str, str) -> (function, list)
-  # Freeze the key order once so host_call_fn can pair args[i] with its name.
-  metric_names = list(metric_dict.keys())
-
-  def host_call_fn(global_step, *args):
-    """Training host call. Creates scalar summaries for training metrics.
-
-    This function is executed on the CPU and should not directly reference
-    any Tensors in the rest of the `model_fn`. To pass Tensors from the
-    model to the `metric_fn`, provide as part of the `host_call`. See
-    https://www.tensorflow.org/api_docs/python/tf/contrib/tpu/TPUEstimatorSpec
-    for more information.
-
-    Arguments should match the list of `Tensor` objects passed as the second
-    element in the tuple passed to `host_call`.
-
-    Args:
-      global_step: `Tensor` with shape `[batch]` for the global_step
-      *args: Remaining tensors to log, one per entry of `metric_names` and in
-        the same order.
-
-    Returns:
-      List of summary ops to run on the CPU host.
-    """
-    # Only the first element is used; it undoes the batch dimension added by
-    # the reshape at the bottom of the enclosing function.
-    step = global_step[0]
-    with tf.contrib.summary.create_file_writer(
-        logdir=model_dir, filename_suffix=".host_call").as_default():
-      with tf.contrib.summary.always_record_summaries():
-        for i, name in enumerate(metric_names):
-          # args[i] is the batched tensor for metric_names[i].
-          tf.contrib.summary.scalar(prefix + name, args[i][0], step=step)
-
-        return tf.contrib.summary.all_summary_ops()
-
-  # To log the current learning rate, and gradient norm for Tensorboard, the
-  # summary op needs to be run on the host CPU via host_call. host_call
-  # expects [batch_size, ...] Tensors, thus reshape to introduce a batch
-  # dimension. These Tensors are implicitly concatenated to
-  # [params['batch_size']].
-  global_step_tensor = tf.reshape(tf.train.get_or_create_global_step(), [1])
-  other_tensors = [tf.reshape(metric_dict[key], [1]) for key in metric_names]
-
-  return host_call_fn, [global_step_tensor] + other_tensors
-
-
-def embedding_matmul(embedding_table, values, mask, name="embedding_matmul"):
-  """Looks up embeddings with a matmul instead of a gather.
-
-  A weighted one-hot tensor is built by broadcasting the indices in `values`
-  against a broadcasted range(num_embedding_table_rows) and comparing for
-  equality; matching positions take their weight from `mask`, all others are
-  zero. That tensor is then contracted with the embedding table, so masked
-  positions yield an all-zero embedding vector.
-
-  Args:
-    embedding_table: Tensor of embedding table.
-      Rank 2 (table_size x embedding dim)
-    values: Tensor of embedding indices. Rank 2 (batch x n_indices)
-    mask: Tensor of mask / weights. Rank 2 (batch x n_indices)
-    name: Optional name scope for created ops
-
-  Returns:
-    Rank 3 tensor of embedding vectors.
-  """
-
-  with tf.name_scope(name):
-    table_rows = embedding_table.get_shape().as_list()[0]
-    n_batch, n_indices = values.shape.as_list()
-
-    # Shapes reused below: one trailing slot per position, one slot per table
-    # row, and the fully expanded (batch, index, row) shape.
-    per_position = (n_batch, n_indices, 1)
-    per_row = (1, 1, table_rows)
-    expanded = (n_batch, n_indices, table_rows)
-
-    tiled_indices = tf.tile(tf.reshape(values, per_position), per_row)
-    tiled_weights = tf.tile(tf.reshape(mask, per_position), per_row)
-    row_numbers = tf.tile(
-        tf.reshape(tf.range(table_rows), per_row), per_position)
-
-    # True exactly where the table row number equals the requested index.
-    hits = tf.equal(tiled_indices, row_numbers)
-    weighted_one_hot = tf.where(hits, tiled_weights, tf.zeros(expanded))
-
-    return tf.tensordot(weighted_one_hot, embedding_table, 1)
--- a/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/accelerator/tpu_test.py
+++ b/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/accelerator/tpu_test.py
-# Copyright 2018 The TensorFlow Authors. All Rights Reserved.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-# ==============================================================================
-"""Test TPU optimized matmul embedding."""
-
-import numpy as np
-import tensorflow as tf
-
-from official.utils.accelerator import tpu as tpu_utils
-
-
-# Keyword-argument sets for the TPUBaseTester helpers; each dict is unpacked
-# with ** into _test_embedding / _test_masking.
-TEST_CASES = [
-    dict(embedding_dim=256, vocab_size=1000, sequence_length=64,
-         batch_size=32, seed=54131),
-    dict(embedding_dim=8, vocab_size=15, sequence_length=12,
-         batch_size=256, seed=536413),
-    dict(embedding_dim=2048, vocab_size=512, sequence_length=50,
-         batch_size=8, seed=35124)
-]
-
-
-class TPUBaseTester(tf.test.TestCase):
-  """Compares tpu_utils.embedding_matmul with a gather-based lookup."""
-
-  def construct_embedding_and_values(self, embedding_dim, vocab_size,
-                                     sequence_length, batch_size, seed):
-    """Builds a random embedding table, zero-padded token ids and their mask.
-
-    Returns:
-      A tuple (embedding_table, values, mask) of tensors, where mask is 1.0
-      for every non-zero token id and 0.0 elsewhere.
-    """
-    np.random.seed(seed)
-
-    table_values = np.random.random(size=(vocab_size, embedding_dim))
-    embedding_table = tf.convert_to_tensor(table_values, dtype=tf.float32)
-
-    token_ids = np.random.randint(low=1, high=vocab_size-1,
-                                  size=(batch_size, sequence_length))
-    # Zero the tail of every row from a random position onwards.
-    for row in range(batch_size):
-      pad_start = np.random.randint(low=0, high=sequence_length-1)
-      token_ids[row, pad_start:] = 0
-    values = tf.convert_to_tensor(token_ids, dtype=tf.int32)
-    mask = tf.to_float(tf.not_equal(values, 0))
-    return embedding_table, values, mask
-
-  def _test_embedding(self, embedding_dim, vocab_size,
-                      sequence_length, batch_size, seed):
-    """Test that matmul embedding matches embedding lookup (gather)."""
-    case = dict(embedding_dim=embedding_dim, vocab_size=vocab_size,
-                sequence_length=sequence_length, batch_size=batch_size,
-                seed=seed)
-
-    with self.test_session():
-      embedding_table, values, mask = self.construct_embedding_and_values(
-          **case)
-
-      gathered = tf.nn.embedding_lookup(params=embedding_table, ids=values)
-      embedding = gathered * tf.expand_dims(mask, -1)
-
-      matmul_embedding = tpu_utils.embedding_matmul(
-          embedding_table=embedding_table, values=values, mask=mask)
-
-      self.assertAllClose(embedding, matmul_embedding)
-
-  def _test_masking(self, embedding_dim, vocab_size,
-                    sequence_length, batch_size, seed):
-    """Test that matmul embedding properly zeros masked positions."""
-    case = dict(embedding_dim=embedding_dim, vocab_size=vocab_size,
-                sequence_length=sequence_length, batch_size=batch_size,
-                seed=seed)
-
-    with self.test_session():
-      embedding_table, values, mask = self.construct_embedding_and_values(
-          **case)
-
-      matmul_embedding = tpu_utils.embedding_matmul(
-          embedding_table=embedding_table, values=values, mask=mask)
-
-      # Re-applying the mask must be a no-op if masking already happened.
-      remasked = matmul_embedding * tf.expand_dims(mask, -1)
-      self.assertAllClose(matmul_embedding, remasked)
-
-  def test_embedding_0(self):
-    self._test_embedding(**TEST_CASES[0])
-
-  def test_embedding_1(self):
-    self._test_embedding(**TEST_CASES[1])
-
-  def test_embedding_2(self):
-    self._test_embedding(**TEST_CASES[2])
-
-  def test_masking_0(self):
-    self._test_masking(**TEST_CASES[0])
-
-  def test_masking_1(self):
-    self._test_masking(**TEST_CASES[1])
-
-  def test_masking_2(self):
-    self._test_masking(**TEST_CASES[2])
-
-
-# Script entry point: hand control to the TensorFlow test runner.
-if __name__ == "__main__":
-  tf.test.main()
--- a/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/data/__init__.py
+++ b/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/data/__init__.py
--- a/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/data/file_io.py
+++ b/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/data/file_io.py
-# Copyright 2018 The TensorFlow Authors. All Rights Reserved.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-# ==============================================================================
-"""Convenience functions for managing dataset file buffers."""
-
-from __future__ import absolute_import
-from __future__ import division
-from __future__ import print_function
-
-import atexit
-import multiprocessing
-import os
-import tempfile
-import uuid
-
-import numpy as np
-import six
-
-import tensorflow as tf
-
-
-class _GarbageCollector(object):
-  """Deletes temporary buffer files at exit.
-
-  Certain tasks (such as NCF Recommendation) require writing buffers to
-  temporary files. (Which may be local or distributed.) It is not generally safe
-  to delete these files during operation, but they should be cleaned up. This
-  class keeps track of temporary files created, and deletes them at exit.
-  """
-  def __init__(self):
-    # Paths of every buffer file registered for deletion, in registration
-    # order.
-    self.temp_buffers = []
-
-  def register(self, filepath):
-    """Records `filepath` so that purge() will try to delete it."""
-    self.temp_buffers.append(filepath)
-
-  def purge(self):
-    """Removes every registered buffer file that still exists.
-
-    Cleanup is best effort: a failure is logged and never raised. Each file is
-    handled independently so that one failing removal does not leave the
-    remaining buffers behind.
-    """
-    for path in self.temp_buffers:
-      try:
-        if tf.gfile.Exists(path):
-          tf.gfile.Remove(path)
-          tf.logging.info("Buffer file {} removed".format(path))
-      except Exception as e:  # pylint: disable=broad-except
-        # Deliberately broad: purge() runs from an atexit hook, where raising
-        # would only obscure the shutdown.
-        tf.logging.error("Failed to cleanup buffer files: {}".format(e))
-
-
-# Module-wide collector. Its purge() method is registered with atexit so that
-# registered buffer files are removed when the interpreter exits.
-_GARBAGE_COLLECTOR = _GarbageCollector()
-atexit.register(_GARBAGE_COLLECTOR.purge)
-
-# rows_per_core value that write_to_buffer passes to iter_shard_dataframe.
-_ROWS_PER_CORE = 50000
-
-
-def write_to_temp_buffer(dataframe, buffer_folder, columns):
-  """Writes a dataframe to a fresh temporary buffer that is purged at exit.
-
-  Args:
-    dataframe: The pandas dataframe to be serialized.
-    buffer_folder: Directory in which to create the buffer. It is created if
-      needed. If None, a file from tempfile.mkstemp() is used instead.
-    columns: The dataframe columns to be serialized.
-
-  Returns:
-    The path of the buffer, as returned by write_to_buffer.
-  """
-  if buffer_folder is None:
-    # mkstemp() hands back an already-open OS-level descriptor. Only the path
-    # is needed here, so close the descriptor instead of leaking it.
-    fd, buffer_path = tempfile.mkstemp()
-    os.close(fd)
-  else:
-    tf.gfile.MakeDirs(buffer_folder)
-    buffer_path = os.path.join(buffer_folder, str(uuid.uuid4()))
-  # Register before writing so the file is cleaned up even if the write fails.
-  _GARBAGE_COLLECTOR.register(buffer_path)
-
-  return write_to_buffer(dataframe, buffer_path, columns)
-
-
-def iter_shard_dataframe(df, rows_per_core=1000):
-  """Two way shard of a dataframe.
-
-  This function evenly shards a dataframe so that it can be mapped efficiently.
-  It yields lists of dataframes with length equal to the number of CPU cores
-  (capped at the number of rows), with each dataframe having rows_per_core
-  rows. (Except for the last batch which may have fewer rows in the
-  dataframes.) Passing vectorized inputs to a multiprocessing pool is much more
-  efficient than iterating through a dataframe in serial and passing a list of
-  inputs to the pool.
-
-  Args:
-    df: Pandas dataframe to be sharded.
-    rows_per_core: Number of rows in each shard.
-
-  Yields:
-    A list of dataframe shards, one list per block of
-    num_cores * rows_per_core rows. Nothing is yielded for an empty dataframe.
-  """
-  n = len(df)
-  if n == 0:
-    # With no rows num_cores would be 0 and the block computation below would
-    # divide by zero; there is simply nothing to shard.
-    return
-
-  num_cores = min([multiprocessing.cpu_count(), n])
-
-  num_blocks = int(np.ceil(n / num_cores / rows_per_core))
-  max_batch_size = num_cores * rows_per_core
-  for i in range(num_blocks):
-    min_index = i * max_batch_size
-    max_index = min([(i + 1) * max_batch_size, n])
-    df_shard = df[min_index:max_index]
-    n_shard = len(df_shard)
-    # Evenly spaced integer cut points that split this block into num_cores
-    # contiguous pieces.
-    boundaries = np.linspace(0, n_shard, num_cores + 1, dtype=np.int64)
-    yield [df_shard[boundaries[j]:boundaries[j+1]] for j in range(num_cores)]
-
-
-def _shard_dict_to_examples(shard_dict):
-  """Serializes a dict of column arrays into one Example string per row.
-
-  Args:
-    shard_dict: Dict mapping column name to an array. Integer ("i") columns
-      become int64 features and float ("f") columns become float features.
-      The row count is taken from the first array.
-
-  Returns:
-    A list with one serialized tf.train.Example per row.
-
-  Raises:
-    ValueError: If a column's dtype kind is neither "i" nor "f".
-  """
-  row_count = list(shard_dict.values())[0].shape[0]
-  per_row_features = [{} for _ in range(row_count)]
-
-  for column, values in shard_dict.items():
-    # Promote 1-D columns to (rows, 1) so every row is itself a sequence.
-    if len(values.shape) == 1:
-      values = np.reshape(values, values.shape + (1,))
-
-    kind = values.dtype.kind
-    if kind not in ("i", "f"):
-      raise ValueError("Invalid dtype")
-
-    for row, features in enumerate(per_row_features):
-      if kind == "i":
-        features[column] = tf.train.Feature(
-            int64_list=tf.train.Int64List(value=values[row]))
-      else:
-        features[column] = tf.train.Feature(
-            float_list=tf.train.FloatList(value=values[row]))
-
-  serialized = []
-  for features in per_row_features:
-    example = tf.train.Example(features=tf.train.Features(feature=features))
-    serialized.append(example.SerializeToString())
-  return serialized
-
-
-def _serialize_shards(df_shards, columns, pool, writer):
-  """Serializes dataframe shards in parallel and writes them out in order.
-
-  Args:
-    df_shards: A list of pandas dataframes. (Should be of similar size)
-    columns: The dataframe columns to be serialized.
-    pool: A multiprocessing pool to serialize in parallel.
-    writer: A TFRecordWriter to write the serialized shards.
-  """
-  # A pandas column of arrays is not stored as an nd array; np.stack turns
-  # each selected column into one.
-  map_inputs = []
-  for shard in df_shards:
-    map_inputs.append(
-        {c: np.stack(shard[c].values, axis=0) for c in columns})
-
-  # Errors raised inside pool workers are painful to debug, so validate every
-  # input here in the main process first.
-  for shard_arrays in map_inputs:
-    # All fields must agree on the number of rows.
-    row_counts = set([arr.shape[0] for arr in shard_arrays.values()])
-    assert len(row_counts) == 1
-    for arr in shard_arrays.values():
-      assert hasattr(arr, "dtype")
-      assert hasattr(arr.dtype, "kind")
-      assert arr.dtype.kind in ("i", "f")
-      assert len(arr.shape) in (1, 2)
-
-  for serialized_shard in pool.map(_shard_dict_to_examples, map_inputs):
-    for example in serialized_shard:
-      writer.write(example)
-
-
-def write_to_buffer(dataframe, buffer_path, columns, expected_size=None):
-  """Write a dataframe to a binary file for a dataset to consume.
-
-  A non-empty file already present at `buffer_path` is reused only when its
-  size equals `expected_size`. Otherwise it is deleted and rebuilt from
-  `dataframe`; with the default `expected_size=None` an existing non-empty
-  file is therefore always rebuilt.
-
-  Args:
-    dataframe: The pandas dataframe to be serialized.
-    buffer_path: The path where the serialized results will be written.
-    columns: The dataframe columns to be serialized.
-    expected_size: The size in bytes of the serialized results. This is used to
-      lazily construct the buffer.
-
-  Returns:
-    The path of the buffer.
-
-  Raises:
-    ValueError: If `dataframe` is None and no reusable buffer was found.
-  """
-  if tf.gfile.Exists(buffer_path) and tf.gfile.Stat(buffer_path).length > 0:
-    actual_size = tf.gfile.Stat(buffer_path).length
-    if expected_size == actual_size:
-      # Existing buffer has the expected size: reuse it without rewriting.
-      return buffer_path
-    tf.logging.warning(
-        "Existing buffer {} has size {}. Expected size {}. Deleting and "
-        "rebuilding buffer.".format(buffer_path, actual_size, expected_size))
-    tf.gfile.Remove(buffer_path)
-
-  if dataframe is None:
-    raise ValueError(
-        "dataframe was None but a valid existing buffer was not found.")
-
-  # Make sure the parent directory of the buffer exists before writing.
-  tf.gfile.MakeDirs(os.path.split(buffer_path)[0])
-
-  tf.logging.info("Constructing TFRecordDataset buffer: {}".format(buffer_path))
-
-  # Running total of rows handed to the writer, used for progress logging.
-  count = 0
-  pool = multiprocessing.Pool(multiprocessing.cpu_count())
-  try:
-    with tf.python_io.TFRecordWriter(buffer_path) as writer:
-      for df_shards in iter_shard_dataframe(df=dataframe,
-                                            rows_per_core=_ROWS_PER_CORE):
-        _serialize_shards(df_shards, columns, pool, writer)
-        count += sum([len(s) for s in df_shards])
-        tf.logging.info("{}/{} examples written."
-                        .format(str(count).ljust(8), len(dataframe)))
-  finally:
-    # Always stop the workers, including when serialization raised.
-    pool.terminate()
-
-  tf.logging.info("Buffer write complete.")
-  return buffer_path
--- a/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/data/file_io_test.py
+++ b/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/data/file_io_test.py
-# Copyright 2018 The TensorFlow Authors. All Rights Reserved.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-# ==============================================================================
-"""Tests for binary data file utilities."""
-
-from __future__ import absolute_import
-from __future__ import division
-from __future__ import print_function
-
-import contextlib
-import multiprocessing
-
-# pylint: disable=wrong-import-order
-import numpy as np
-import pandas as pd
-import tensorflow as tf
-# pylint: enable=wrong-import-order
-
-from official.utils.data import file_io
-
-
-# Column names of the dataframe built in BaseTest._serialize_deserialize.
-_RAW_ROW = "raw_row"
-_DUMMY_COL = "column_0"
-_DUMMY_VEC_COL = "column_1"
-# Length of each vector stored in _DUMMY_VEC_COL.
-_DUMMY_VEC_LEN = 4
-
-# rows_per_core value used by every sharding test case below.
-_ROWS_PER_CORE = 4
-# Each case gives the dataframe row count, the patched CPU count and the
-# expected result as blocks -> shards -> row values.
-_TEST_CASES = [
-    # One batch of one
-    dict(row_count=1, cpu_count=1, expected=[
-        [[0]]
-    ]),
-
-    dict(row_count=10, cpu_count=1, expected=[
-        [[0, 1, 2, 3]], [[4, 5, 6, 7]], [[8, 9]]
-    ]),
-
-    dict(row_count=21, cpu_count=1, expected=[
-        [[0, 1, 2, 3]], [[4, 5, 6, 7]], [[8, 9, 10, 11]],
-        [[12, 13, 14, 15]], [[16, 17, 18, 19]], [[20]]
-    ]),
-
-    dict(row_count=1, cpu_count=4, expected=[
-        [[0]]
-    ]),
-
-    dict(row_count=10, cpu_count=4, expected=[
-        [[0, 1], [2, 3, 4], [5, 6], [7, 8, 9]]
-    ]),
-
-    dict(row_count=21, cpu_count=4, expected=[
-        [[0, 1, 2, 3], [4, 5, 6, 7], [8, 9, 10, 11], [12, 13, 14, 15]],
-        [[16], [17], [18], [19, 20]]
-    ]),
-
-    dict(row_count=10, cpu_count=8, expected=[
-        [[0], [1], [2], [3, 4], [5], [6], [7], [8, 9]]
-    ]),
-
-    dict(row_count=40, cpu_count=8, expected=[
-        [[0, 1, 2, 3], [4, 5, 6, 7], [8, 9, 10, 11], [12, 13, 14, 15],
-         [16, 17, 18, 19], [20, 21, 22, 23], [24, 25, 26, 27],
-         [28, 29, 30, 31]],
-        [[32], [33], [34], [35], [36], [37], [38], [39]]
-    ]),
-]
-
-# Parsing spec handed to tf.parse_example when reading the buffer back.
-_FEATURE_MAP = {
-    _RAW_ROW: tf.FixedLenFeature([1], dtype=tf.int64),
-    _DUMMY_COL: tf.FixedLenFeature([1], dtype=tf.int64),
-    _DUMMY_VEC_COL: tf.FixedLenFeature([_DUMMY_VEC_LEN], dtype=tf.float32)
-}
-
-
-@contextlib.contextmanager
-def fixed_core_count(cpu_count):
-  """Override CPU count.
-
-  file_io.py uses the cpu_count function to scale to the size of the instance.
-  However, this is not desirable for testing because it can make the test flaky.
-  Instead, this context manager fixes the count for more robust testing.
-
-  The original multiprocessing.cpu_count is restored when the block exits,
-  including when the block raises.
-
-  Args:
-    cpu_count: How many cores multiprocessing claims to have.
-
-  Yields:
-    Nothing. (for context manager only)
-  """
-  old_count_fn = multiprocessing.cpu_count
-  multiprocessing.cpu_count = lambda: cpu_count
-  try:
-    yield
-  finally:
-    # Without the finally clause, a failing assertion inside the with block
-    # would leave the patched function in place for every later test.
-    multiprocessing.cpu_count = old_count_fn
-
-
-class BaseTest(tf.test.TestCase):
-  """Tests dataframe sharding and the TFRecord buffer round trip."""
-
-  def _test_sharding(self, row_count, cpu_count, expected):
-    """Shards a `row_count`-row dataframe and compares against `expected`."""
-    df = pd.DataFrame({_DUMMY_COL: list(range(row_count))})
-    with fixed_core_count(cpu_count):
-      shards = list(file_io.iter_shard_dataframe(df, _ROWS_PER_CORE))
-    result = [[j[_DUMMY_COL].tolist() for j in i] for i in shards]
-    self.assertAllEqual(expected, result)
-
-  def test_tiny_rows_low_core(self):
-    self._test_sharding(**_TEST_CASES[0])
-
-  def test_small_rows_low_core(self):
-    self._test_sharding(**_TEST_CASES[1])
-
-  def test_large_rows_low_core(self):
-    self._test_sharding(**_TEST_CASES[2])
-
-  def test_tiny_rows_medium_core(self):
-    self._test_sharding(**_TEST_CASES[3])
-
-  def test_small_rows_medium_core(self):
-    self._test_sharding(**_TEST_CASES[4])
-
-  def test_large_rows_medium_core(self):
-    self._test_sharding(**_TEST_CASES[5])
-
-  def test_small_rows_large_core(self):
-    self._test_sharding(**_TEST_CASES[6])
-
-  def test_large_rows_large_core(self):
-    self._test_sharding(**_TEST_CASES[7])
-
-  def _serialize_deserialize(self, num_cores=1, num_rows=20):
-    """Writes a random dataframe to a buffer and checks every row read back.
-
-    Args:
-      num_cores: CPU count reported to file_io while the buffer is written.
-      num_rows: Number of rows in the generated dataframe.
-    """
-    np.random.seed(1)
-    df = pd.DataFrame({
-        # Serialization order is only deterministic for num_cores=1. raw_row is
-        # used in validation after the deserialization.
-        _RAW_ROW: np.array(range(num_rows), dtype=np.int64),
-        _DUMMY_COL: np.random.randint(0, 35, size=(num_rows,)),
-        _DUMMY_VEC_COL: [
-            np.array([np.random.random() for _ in range(_DUMMY_VEC_LEN)])
-            for i in range(num_rows)  # pylint: disable=unused-variable
-        ]
-    })
-
-    with fixed_core_count(num_cores):
-      buffer_path = file_io.write_to_temp_buffer(
-          df, self.get_temp_dir(), [_RAW_ROW, _DUMMY_COL, _DUMMY_VEC_COL])
-
-    with self.test_session(graph=tf.Graph()) as sess:
-      dataset = tf.data.TFRecordDataset(buffer_path)
-      dataset = dataset.batch(1).map(
-          lambda x: tf.parse_example(x, _FEATURE_MAP))
-
-      data_iter = dataset.make_one_shot_iterator()
-      # Build the get_next op once; each sess.run on it advances the iterator.
-      # Calling get_next() inside the loop would add a new op per iteration.
-      row = data_iter.get_next()
-      seen_rows = set()
-      # Read a few steps past num_rows so that surplus rows are detected too.
-      for i in range(num_rows+5):
-        try:
-          row_id, val_0, val_1 = sess.run(
-              [row[_RAW_ROW], row[_DUMMY_COL], row[_DUMMY_VEC_COL]])
-          row_id, val_0, val_1 = row_id[0][0], val_0[0][0], val_1[0]
-          # unittest assertions rather than bare asserts, so the checks still
-          # run under `python -O`.
-          self.assertNotIn(row_id, seen_rows)
-          seen_rows.add(row_id)
-
-          self.assertEqual(val_0, df[_DUMMY_COL][row_id])
-          self.assertAllClose(val_1, df[_DUMMY_VEC_COL][row_id])
-
-          self.assertLess(i, num_rows, msg="Too many rows.")
-        except tf.errors.OutOfRangeError:
-          self.assertGreaterEqual(i, num_rows, msg="Too few rows.")
-
-    file_io._GARBAGE_COLLECTOR.purge()
-    self.assertFalse(tf.gfile.Exists(buffer_path))
-
-  def test_serialize_deserialize_0(self):
-    self._serialize_deserialize(num_cores=1)
-
-  def test_serialize_deserialize_1(self):
-    self._serialize_deserialize(num_cores=2)
-
-  def test_serialize_deserialize_2(self):
-    self._serialize_deserialize(num_cores=8)
-
-
-# Script entry point: hand control to the TensorFlow test runner.
-if __name__ == "__main__":
-  tf.test.main()
--- a/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/export/__init__.py
+++ b/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/export/__init__.py
--- a/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/export/export_test.py
+++ b/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/export/export_test.py
-# Copyright 2018 The TensorFlow Authors. All Rights Reserved.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-# ==============================================================================
-"""Tests for exporting utils."""
-
-from __future__ import absolute_import
-from __future__ import division
-from __future__ import print_function
-
-import tensorflow as tf  # pylint: disable=g-bad-import-order
-
-from official.utils.export import export
-
-
-class ExportUtilsTest(tf.test.TestCase):
-  """Tests for the ExportUtils."""
-
-  def _check_receiver(self, receiver, expected_shape, expected_dtype):
-    """Asserts the receiver's type, its features and its receiver tensors."""
-    self.assertIsInstance(
-        receiver, tf.estimator.export.TensorServingInputReceiver)
-
-    features = receiver.features
-    self.assertIsInstance(features, tf.Tensor)
-    self.assertEqual(features.shape, expected_shape)
-    self.assertEqual(features.dtype, expected_dtype)
-
-    self.assertIsInstance(receiver.receiver_tensors, dict)
-    # Note that Python 3 can no longer index .values() directly; cast to list.
-    first_tensor = list(receiver.receiver_tensors.values())[0]
-    self.assertEqual(first_tensor.shape, expected_shape)
-
-  def test_build_tensor_serving_input_receiver_fn(self):
-    receiver_fn = export.build_tensor_serving_input_receiver_fn(shape=[4, 5])
-    with tf.Graph().as_default():
-      self._check_receiver(
-          receiver_fn(),
-          expected_shape=tf.TensorShape([1, 4, 5]),
-          expected_dtype=tf.float32)
-
-  def test_build_tensor_serving_input_receiver_fn_batch_dtype(self):
-    receiver_fn = export.build_tensor_serving_input_receiver_fn(
-        shape=[4, 5], dtype=tf.int8, batch_size=10)
-
-    with tf.Graph().as_default():
-      self._check_receiver(
-          receiver_fn(),
-          expected_shape=tf.TensorShape([10, 4, 5]),
-          expected_dtype=tf.int8)
-
-
-# Script entry point: hand control to the TensorFlow test runner.
-if __name__ == "__main__":
-  tf.test.main()
--- a/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/flags/README.md
+++ b/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/flags/README.md
-# Adding Abseil (absl) flags quickstart
-## Defining a flag
-absl flag definitions are similar to argparse, although they are defined on a global namespace.
-
-For instance defining a string flag looks like:
-```$xslt
-from absl import flags
-flags.DEFINE_string(
-    name="my_flag",
-    default="a_sensible_default",
-    help="Here is what this flag does."
-)
-```
-
-All three arguments are required, but default may be `None`. A common optional argument is
-`short_name` for defining abbreviations. Certain `DEFINE_*` methods will have other required arguments.
-For instance `DEFINE_enum` requires the `enum_values` argument to be specified.
-
-## Key Flags
-absl has the concept of a key flag. Any flag defined in `__main__` is considered a key flag by
-default. Key flags are displayed in `--help`, others only appear in `--helpfull`. In order to
-handle key flags that are defined outside the module in question, absl provides the
-`flags.adopt_module_key_flags()` method. This adds the key flags of a different module to one's own
-key flags. For example:
-```$xslt
-File: flag_source.py
---------------------------------------
-
-from absl import flags
-flags.DEFINE_string(name="my_flag", default="abc", help="a flag.")
-```
-
-```$xslt
-File: my_module.py
---------------------------------------
-
-from absl import app as absl_app
-from absl import flags
-
-import flag_source
-
-flags.adopt_module_key_flags(flag_source)
-
-def main(_):
-  pass
-
-absl_app.run(main, [__file__, "-h"])
-```
-
-When `my_module.py` is run it will show the help text for `my_flag`. Because not all flags defined
-in a file are equally important, `official/utils/flags/core.py` (generally imported as flags_core)
-provides an abstraction for handling key flag declaration in an easy way through the
-`register_key_flags_in_core()` function, which allows a module to make a single
-`flags.adopt_module_key_flags(flags_core)` call when using the util flag declaration functions.
-
-## Validators
-Often the constraints on a flag are complicated. absl provides the validator decorator to allow
-one to mark a function as a flag validation function. Suppose we want users to provide a flag
-which is a palindrome.
-
-```$xslt
-from absl import flags
-
-flags.DEFINE_string(name="pal_flag", short_name="pf", default="", help="Give me a palindrome")
-
-@flags.validator("pal_flag")
-def _check_pal(provided_pal_flag):
-  return provided_pal_flag == provided_pal_flag[::-1]
-
-```
-
-Validators take the form that returning True (truthy) passes, and all others 
-(False, None, exception) fail.
-
-## Testing
-To test using absl, declare flags in the `setUpClass` method of TensorFlow's TestCase.
-
-```$xslt
-from absl import flags
-import tensorflow as tf
-
-def define_flags():
-  flags.DEFINE_string(name="test_flag", default="abc", help="an example flag")
-
-
-class BaseTester(tf.test.TestCase):
-
-  @classmethod
-  def setUpClass(cls):
-    super(BaseTester, cls).setUpClass()
-    define_flags()
-    
-  def test_trivial(self):
-    flags_core.parse_flags([__file__, "--test_flag", "def"])
-    self.assertEqual(flags.FLAGS.test_flag, "def")
-    
-```
--- a/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/flags/__init__.py
+++ b/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/flags/__init__.py
--- a/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/flags/_base.py
+++ b/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/flags/_base.py
-# Copyright 2018 The TensorFlow Authors. All Rights Reserved.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-# ==============================================================================
-"""Flags which will be nearly universal across models."""
-
-from __future__ import absolute_import
-from __future__ import division
-from __future__ import print_function
-
-from absl import flags
-import tensorflow as tf
-
-from official.utils.flags._conventions import help_wrap
-from official.utils.logs import hooks_helper
-
-
-def define_base(data_dir=True, model_dir=True, clean=True, train_epochs=True,
-                epochs_between_evals=True, stop_threshold=True, batch_size=True,
-                num_gpu=True, hooks=True, export_dir=True):
-  """Register base flags.
-
-  Args:
-    data_dir: Create a flag for specifying the input data directory.
-    model_dir: Create a flag for specifying the model file directory.
-    train_epochs: Create a flag to specify the number of training epochs.
-    epochs_between_evals: Create a flag to specify the frequency of testing.
-    stop_threshold: Create a flag to specify a threshold accuracy or other
-      eval metric which should trigger the end of training.
-    batch_size: Create a flag to specify the batch size.
-    num_gpu: Create a flag to specify the number of GPUs used.
-    hooks: Create a flag to specify hooks for logging.
-    export_dir: Create a flag to specify where a SavedModel should be exported.
-
-  Returns:
-    A list of flags for core.py to marks as key flags.
-  """
-  key_flags = []
-
-  if data_dir:
-    flags.DEFINE_string(
-        name="data_dir", short_name="dd", default="/tmp",
-        help=help_wrap("The location of the input data."))
-    key_flags.append("data_dir")
-
-  if model_dir:
-    flags.DEFINE_string(
-        name="model_dir", short_name="md", default="/tmp",
-        help=help_wrap("The location of the model checkpoint files."))
-    key_flags.append("model_dir")
-
-  if clean:
-    flags.DEFINE_boolean(
-        name="clean", default=False,
-        help=help_wrap("If set, model_dir will be removed if it exists."))
-    key_flags.append("clean")
-
-  if train_epochs:
-    flags.DEFINE_integer(
-        name="train_epochs", short_name="te", default=1,
-        help=help_wrap("The number of epochs used to train."))
-    key_flags.append("train_epochs")
-
-  if epochs_between_evals:
-    flags.DEFINE_integer(
-        name="epochs_between_evals", short_name="ebe", default=1,
-        help=help_wrap("The number of training epochs to run between "
-                       "evaluations."))
-    key_flags.append("epochs_between_evals")
-
-  if stop_threshold:
-    flags.DEFINE_float(
-        name="stop_threshold", short_name="st",
-        default=None,
-        help=help_wrap("If passed, training will stop at the earlier of "
-                       "train_epochs and when the evaluation metric is  "
-                       "greater than or equal to stop_threshold."))
-
-  if batch_size:
-    flags.DEFINE_integer(
-        name="batch_size", short_name="bs", default=32,
-        help=help_wrap("Batch size for training and evaluation. When using "
-                       "multiple gpus, this is the global batch size for "
-                       "all devices. For example, if the batch size is 32 "
-                       "and there are 4 GPUs, each GPU will get 8 examples on "
-                       "each step."))
-    key_flags.append("batch_size")
-
-  if num_gpu:
-    flags.DEFINE_integer(
-        name="num_gpus", short_name="ng",
-        default=1 if tf.test.is_gpu_available() else 0,
-        help=help_wrap(
-            "How many GPUs to use with the DistributionStrategies API. The "
-            "default is 1 if TensorFlow can detect a GPU, and 0 otherwise."))
-
-  if hooks:
-    # Construct a pretty summary of hooks.
-    hook_list_str = (
-        u"\ufeff  Hook:\n" + u"\n".join([u"\ufeff    {}".format(key) for key
-                                         in hooks_helper.HOOKS]))
-    flags.DEFINE_list(
-        name="hooks", short_name="hk", default="LoggingTensorHook",
-        help=help_wrap(
-            u"A list of (case insensitive) strings to specify the names of "
-            u"training hooks.\n{}\n\ufeff  Example: `--hooks ProfilerHook,"
-            u"ExamplesPerSecondHook`\n See official.utils.logs.hooks_helper "
-            u"for details.".format(hook_list_str))
-    )
-    key_flags.append("hooks")
-
-  if export_dir:
-    flags.DEFINE_string(
-        name="export_dir", short_name="ed", default=None,
-        help=help_wrap("If set, a SavedModel serialization of the model will "
-                       "be exported to this directory at the end of training. "
-                       "See the README for more details and relevant links.")
-    )
-    key_flags.append("export_dir")
-
-  return key_flags
-
-
-def get_num_gpus(flags_obj):
-  """Treat num_gpus=-1 as 'use all'."""
-  if flags_obj.num_gpus != -1:
-    return flags_obj.num_gpus
-
-  from tensorflow.python.client import device_lib  # pylint: disable=g-import-not-at-top
-  local_device_protos = device_lib.list_local_devices()
-  return sum([1 for d in local_device_protos if d.device_type == "GPU"])
--- a/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/flags/_benchmark.py
+++ b/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/flags/_benchmark.py
-# Copyright 2018 The TensorFlow Authors. All Rights Reserved.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-# ==============================================================================
-"""Flags for benchmarking models."""
-
-from __future__ import absolute_import
-from __future__ import division
-from __future__ import print_function
-
-from absl import flags
-
-from official.utils.flags._conventions import help_wrap
-
-
-def define_benchmark(benchmark_log_dir=True, bigquery_uploader=True):
-  """Register benchmarking flags.
-
-  Args:
-    benchmark_log_dir: Create a flag to specify location for benchmark logging.
-    bigquery_uploader: Create flags for uploading results to BigQuery.
-
-  Returns:
-    A list of flags for core.py to marks as key flags.
-  """
-
-  key_flags = []
-
-  flags.DEFINE_enum(
-      name="benchmark_logger_type", default="BaseBenchmarkLogger",
-      enum_values=["BaseBenchmarkLogger", "BenchmarkFileLogger",
-                   "BenchmarkBigQueryLogger"],
-      help=help_wrap("The type of benchmark logger to use. Defaults to using "
-                     "BaseBenchmarkLogger which logs to STDOUT. Different "
-                     "loggers will require other flags to be able to work."))
-  flags.DEFINE_string(
-      name="benchmark_test_id", short_name="bti", default=None,
-      help=help_wrap("The unique test ID of the benchmark run. It could be the "
-                     "combination of key parameters. It is hardware "
-                     "independent and could be used compare the performance "
-                     "between different test runs. This flag is designed for "
-                     "human consumption, and does not have any impact within "
-                     "the system."))
-
-  if benchmark_log_dir:
-    flags.DEFINE_string(
-        name="benchmark_log_dir", short_name="bld", default=None,
-        help=help_wrap("The location of the benchmark logging.")
-    )
-
-  if bigquery_uploader:
-    flags.DEFINE_string(
-        name="gcp_project", short_name="gp", default=None,
-        help=help_wrap(
-            "The GCP project name where the benchmark will be uploaded."))
-
-    flags.DEFINE_string(
-        name="bigquery_data_set", short_name="bds", default="test_benchmark",
-        help=help_wrap(
-            "The Bigquery dataset name where the benchmark will be uploaded."))
-
-    flags.DEFINE_string(
-        name="bigquery_run_table", short_name="brt", default="benchmark_run",
-        help=help_wrap("The Bigquery table name where the benchmark run "
-                       "information will be uploaded."))
-
-    flags.DEFINE_string(
-        name="bigquery_run_status_table", short_name="brst",
-        default="benchmark_run_status",
-        help=help_wrap("The Bigquery table name where the benchmark run "
-                       "status information will be uploaded."))
-
-    flags.DEFINE_string(
-        name="bigquery_metric_table", short_name="bmt",
-        default="benchmark_metric",
-        help=help_wrap("The Bigquery table name where the benchmark metric "
-                       "information will be uploaded."))
-
-  @flags.multi_flags_validator(
-      ["benchmark_logger_type", "benchmark_log_dir"],
-      message="--benchmark_logger_type=BenchmarkFileLogger will require "
-              "--benchmark_log_dir being set")
-  def _check_benchmark_log_dir(flags_dict):
-    benchmark_logger_type = flags_dict["benchmark_logger_type"]
-    if benchmark_logger_type == "BenchmarkFileLogger":
-      return flags_dict["benchmark_log_dir"]
-    return True
-
-  return key_flags
--- a/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/flags/_conventions.py
+++ b/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/flags/_conventions.py
-# Copyright 2018 The TensorFlow Authors. All Rights Reserved.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-# ==============================================================================
-"""Central location for shared arparse convention definitions."""
-
-from __future__ import absolute_import
-from __future__ import division
-from __future__ import print_function
-
-import codecs
-import functools
-
-from absl import app as absl_app
-from absl import flags
-
-
-# This codifies help string conventions and makes it easy to update them if
-# necessary. Currently the only major effect is that help bodies start on the
-# line after flags are listed. All flag definitions should wrap the text bodies
-# with help wrap when calling DEFINE_*.
-_help_wrap = functools.partial(flags.text_wrap, length=80, indent="",
-                               firstline_indent="\n")
-
-
-# Pretty formatting causes issues when utf-8 is not installed on a system.
-try:
-  codecs.lookup("utf-8")
-  help_wrap = _help_wrap
-except LookupError:
-  def help_wrap(text, *args, **kwargs):
-    return _help_wrap(text, *args, **kwargs).replace("\ufeff", "")
-
-
-# Replace None with h to also allow -h
-absl_app.HelpshortFlag.SHORT_NAME = "h"
--- a/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/flags/_device.py
+++ b/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/flags/_device.py
-# Copyright 2018 The TensorFlow Authors. All Rights Reserved.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-# ==============================================================================
-"""Flags for managing compute devices. Currently only contains TPU flags."""
-
-from __future__ import absolute_import
-from __future__ import division
-from __future__ import print_function
-
-from absl import flags
-import tensorflow as tf
-
-from official.utils.flags._conventions import help_wrap
-
-
-def require_cloud_storage(flag_names):
-  """Register a validator to check directory flags.
-  Args:
-    flag_names: An iterable of strings containing the names of flags to be
-      checked.
-  """
-  msg = "TPU requires GCS path for {}".format(", ".join(flag_names))
-  @flags.multi_flags_validator(["tpu"] + flag_names, message=msg)
-  def _path_check(flag_values):  # pylint: disable=missing-docstring
-    if flag_values["tpu"] is None:
-      return True
-
-    valid_flags = True
-    for key in flag_names:
-      if not flag_values[key].startswith("gs://"):
-        tf.logging.error("{} must be a GCS path.".format(key))
-        valid_flags = False
-
-    return valid_flags
-
-
-def define_device(tpu=True):
-  """Register device specific flags.
-  Args:
-    tpu: Create flags to specify TPU operation.
-  Returns:
-    A list of flags for core.py to marks as key flags.
-  """
-
-  key_flags = []
-
-  if tpu:
-    flags.DEFINE_string(
-        name="tpu", default=None,
-        help=help_wrap(
-            "The Cloud TPU to use for training. This should be either the name "
-            "used when creating the Cloud TPU, or a "
-            "grpc://ip.address.of.tpu:8470 url. Passing `local` will use the"
-            "CPU of the local instance instead. (Good for debugging.)"))
-    key_flags.append("tpu")
-
-    flags.DEFINE_string(
-        name="tpu_zone", default=None,
-        help=help_wrap(
-            "[Optional] GCE zone where the Cloud TPU is located in. If not "
-            "specified, we will attempt to automatically detect the GCE "
-            "project from metadata."))
-
-    flags.DEFINE_string(
-        name="tpu_gcp_project", default=None,
-        help=help_wrap(
-            "[Optional] Project name for the Cloud TPU-enabled project. If not "
-            "specified, we will attempt to automatically detect the GCE "
-            "project from metadata."))
-
-    flags.DEFINE_integer(name="num_tpu_shards", default=8,
-                         help=help_wrap("Number of shards (TPU chips)."))
-
-  return key_flags
--- a/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/flags/_performance.py
+++ b/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/flags/_performance.py
-# Copyright 2018 The TensorFlow Authors. All Rights Reserved.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-# ==============================================================================
-"""Register flags for optimizing performance."""
-
-from __future__ import absolute_import
-from __future__ import division
-from __future__ import print_function
-
-import multiprocessing
-
-from absl import flags    # pylint: disable=g-bad-import-order
-import tensorflow as tf   # pylint: disable=g-bad-import-order
-
-from official.utils.flags._conventions import help_wrap
-
-
-# Map string to (TensorFlow dtype, default loss scale)
-DTYPE_MAP = {
-    "fp16": (tf.float16, 128),
-    "fp32": (tf.float32, 1),
-}
-
-
-def get_tf_dtype(flags_obj):
-  return DTYPE_MAP[flags_obj.dtype][0]
-
-
-def get_loss_scale(flags_obj):
-  if flags_obj.loss_scale is not None:
-    return flags_obj.loss_scale
-  return DTYPE_MAP[flags_obj.dtype][1]
-
-
-def define_performance(num_parallel_calls=True, inter_op=True, intra_op=True,
-                       synthetic_data=True, max_train_steps=True, dtype=True,
-                       all_reduce_alg=True, tf_gpu_thread_mode=False,
-                       datasets_num_private_threads=False,
-                       datasets_num_parallel_batches=False):
-  """Register flags for specifying performance tuning arguments.
-
-  Args:
-    num_parallel_calls: Create a flag to specify parallelism of data loading.
-    inter_op: Create a flag to allow specification of inter op threads.
-    intra_op: Create a flag to allow specification of intra op threads.
-    synthetic_data: Create a flag to allow the use of synthetic data.
-    max_train_steps: Create a flags to allow specification of maximum number
-      of training steps
-    dtype: Create flags for specifying dtype.
-    all_reduce_alg: If set forces a specific algorithm for multi-gpu.
-    tf_gpu_thread_mode: gpu_private triggers us of private thread pool.
-    datasets_num_private_threads: Number of private threads for datasets.
-    datasets_num_parallel_batches: Determines how many batches to process in
-    parallel when using map and batch from tf.data.
-
-  Returns:
-    A list of flags for core.py to marks as key flags.
-  """
-
-  key_flags = []
-  if num_parallel_calls:
-    flags.DEFINE_integer(
-        name="num_parallel_calls", short_name="npc",
-        default=multiprocessing.cpu_count(),
-        help=help_wrap("The number of records that are  processed in parallel "
-                       "during input processing. This can be optimized per "
-                       "data set but for generally homogeneous data sets, "
-                       "should be approximately the number of available CPU "
-                       "cores. (default behavior)"))
-
-  if inter_op:
-    flags.DEFINE_integer(
-        name="inter_op_parallelism_threads", short_name="inter", default=0,
-        help=help_wrap("Number of inter_op_parallelism_threads to use for CPU. "
-                       "See TensorFlow config.proto for details.")
-    )
-
-  if intra_op:
-    flags.DEFINE_integer(
-        name="intra_op_parallelism_threads", short_name="intra", default=0,
-        help=help_wrap("Number of intra_op_parallelism_threads to use for CPU. "
-                       "See TensorFlow config.proto for details."))
-
-  if synthetic_data:
-    flags.DEFINE_bool(
-        name="use_synthetic_data", short_name="synth", default=False,
-        help=help_wrap(
-            "If set, use fake data (zeroes) instead of a real dataset. "
-            "This mode is useful for performance debugging, as it removes "
-            "input processing steps, but will not learn anything."))
-
-  if max_train_steps:
-    flags.DEFINE_integer(
-        name="max_train_steps", short_name="mts", default=None, help=help_wrap(
-            "The model will stop training if the global_step reaches this "
-            "value. If not set, training will run until the specified number "
-            "of epochs have run as usual. It is generally recommended to set "
-            "--train_epochs=1 when using this flag."
-        ))
-
-  if dtype:
-    flags.DEFINE_enum(
-        name="dtype", short_name="dt", default="fp32",
-        enum_values=DTYPE_MAP.keys(),
-        help=help_wrap("The TensorFlow datatype used for calculations. "
-                       "Variables may be cast to a higher precision on a "
-                       "case-by-case basis for numerical stability."))
-
-    flags.DEFINE_integer(
-        name="loss_scale", short_name="ls", default=None,
-        help=help_wrap(
-            "The amount to scale the loss by when the model is run. Before "
-            "gradients are computed, the loss is multiplied by the loss scale, "
-            "making all gradients loss_scale times larger. To adjust for this, "
-            "gradients are divided by the loss scale before being applied to "
-            "variables. This is mathematically equivalent to training without "
-            "a loss scale, but the loss scale helps avoid some intermediate "
-            "gradients from underflowing to zero. If not provided the default "
-            "for fp16 is 128 and 1 for all other dtypes."))
-
-    loss_scale_val_msg = "loss_scale should be a positive integer."
-    @flags.validator(flag_name="loss_scale", message=loss_scale_val_msg)
-    def _check_loss_scale(loss_scale):  # pylint: disable=unused-variable
-      if loss_scale is None:
-        return True  # null case is handled in get_loss_scale()
-
-      return loss_scale > 0
-
-  if all_reduce_alg:
-    flags.DEFINE_string(
-        name="all_reduce_alg", short_name="ara", default=None,
-        help=help_wrap("Defines the algorithm to use for performing all-reduce."
-                       "See tf.contrib.distribute.AllReduceCrossTowerOps for "
-                       "more details and available options."))
-
-  if tf_gpu_thread_mode:
-    flags.DEFINE_string(
-        name="tf_gpu_thread_mode", short_name="gt_mode", default=None,
-        help=help_wrap(
-            "Whether and how the GPU device uses its own threadpool.")
-    )
-
-  if datasets_num_private_threads:
-    flags.DEFINE_integer(
-        name="datasets_num_private_threads",
-        default=None,
-        help=help_wrap(
-            "Number of threads for a private threadpool created for all"
-            "datasets computation..")
-    )
-
-  if datasets_num_parallel_batches:
-    flags.DEFINE_integer(
-        name="datasets_num_parallel_batches",
-        default=None,
-        help=help_wrap(
-            "Determines how many batches to process in parallel when using "
-            "map and batch from tf.data.")
-    )
-
-  return key_flags
--- a/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/flags/core.py
+++ b/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/flags/core.py
-# Copyright 2018 The TensorFlow Authors. All Rights Reserved.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-# ==============================================================================
-"""Public interface for flag definition.
-
-See _example.py for detailed instructions on defining flags.
-"""
-
-from __future__ import absolute_import
-from __future__ import division
-from __future__ import print_function
-
-import functools
-import sys
-
-from absl import app as absl_app
-from absl import flags
-
-from official.utils.flags import _base
-from official.utils.flags import _benchmark
-from official.utils.flags import _conventions
-from official.utils.flags import _device
-from official.utils.flags import _misc
-from official.utils.flags import _performance
-
-
-def set_defaults(**kwargs):
-  for key, value in kwargs.items():
-    flags.FLAGS.set_default(name=key, value=value)
-
-
-def parse_flags(argv=None):
-  """Reset flags and reparse. Currently only used in testing."""
-  flags.FLAGS.unparse_flags()
-  absl_app.parse_flags_with_usage(argv or sys.argv)
-
-
-def register_key_flags_in_core(f):
-  """Defines a function in core.py, and registers its key flags.
-
-  absl uses the location of a flags.declare_key_flag() to determine the context
-  in which a flag is key. By making all declares in core, this allows model
-  main functions to call flags.adopt_module_key_flags() on core and correctly
-  chain key flags.
-
-  Args:
-    f:  The function to be wrapped
-
-  Returns:
-    The "core-defined" version of the input function.
-  """
-
-  def core_fn(*args, **kwargs):
-    key_flags = f(*args, **kwargs)
-    [flags.declare_key_flag(fl) for fl in key_flags]  # pylint: disable=expression-not-assigned
-  return core_fn
-
-
-define_base = register_key_flags_in_core(_base.define_base)
-# Remove options not relevant for Eager from define_base().
-define_base_eager = register_key_flags_in_core(functools.partial(
-    _base.define_base, epochs_between_evals=False, stop_threshold=False,
-    hooks=False))
-define_benchmark = register_key_flags_in_core(_benchmark.define_benchmark)
-define_device = register_key_flags_in_core(_device.define_device)
-define_image = register_key_flags_in_core(_misc.define_image)
-define_performance = register_key_flags_in_core(_performance.define_performance)
-
-
-help_wrap = _conventions.help_wrap
-
-
-get_num_gpus = _base.get_num_gpus
-get_tf_dtype = _performance.get_tf_dtype
-get_loss_scale = _performance.get_loss_scale
-DTYPE_MAP = _performance.DTYPE_MAP
-require_cloud_storage = _device.require_cloud_storage
--- a/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/flags/flags_test.py
+++ b/TensorFlow/ComputeVision/Accuracy_Validation/ResNet50_Official/official/utils/flags/flags_test.py
-# Copyright 2018 The TensorFlow Authors. All Rights Reserved.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-# ==============================================================================
-
-import unittest
-
-from absl import flags
-import tensorflow as tf
-
-from official.utils.flags import core as flags_core  # pylint: disable=g-bad-import-order
-
-
-def define_flags():
-  flags_core.define_base(num_gpu=False)
-  flags_core.define_performance()
-  flags_core.define_image()
-  flags_core.define_benchmark()
-
-
-class BaseTester(unittest.TestCase):
-
-  @classmethod
-  def setUpClass(cls):
-    super(BaseTester, cls).setUpClass()
-    define_flags()
-
-  def test_default_setting(self):
-    """Test to ensure fields exist and defaults can be set.
-    """
-
-    defaults = dict(
-        data_dir="dfgasf",
-        model_dir="dfsdkjgbs",
-        train_epochs=534,
-        epochs_between_evals=15,
-        batch_size=256,
-        hooks=["LoggingTensorHook"],
-        num_parallel_calls=18,
-        inter_op_parallelism_threads=5,
-        intra_op_parallelism_threads=10,
-        data_format="channels_first"
-    )
-
-    flags_core.set_defaults(**defaults)
-    flags_core.parse_flags()
-
-    for key, value in defaults.items():
-      assert flags.FLAGS.get_flag_value(name=key, default=None) == value
-
-  def test_benchmark_setting(self):
-    defaults = dict(
-        hooks=["LoggingMetricHook"],
-        benchmark_log_dir="/tmp/12345",
-        gcp_project="project_abc",
-    )
-
-    flags_core.set_defaults(**defaults)
-    flags_core.parse_flags()
-
-    for key, value in defaults.items():
-      assert flags.FLAGS.get_flag_value(name=key, default=None) == value
-
-  def test_booleans(self):
-    """Test to ensure boolean flags trigger as expected.
-    """
-
-    flags_core.parse_flags([__file__, "--use_synthetic_data"])
-
-    assert flags.FLAGS.use_synthetic_data
-
-  def test_parse_dtype_info(self):
-    for dtype_str, tf_dtype, loss_scale in [["fp16", tf.float16, 128],
-                                            ["fp32", tf.float32, 1]]:
-      flags_core.parse_flags([__file__, "--dtype", dtype_str])
-
-      self.assertEqual(flags_core.get_tf_dtype(flags.FLAGS), tf_dtype)
-      self.assertEqual(flags_core.get_loss_scale(flags.FLAGS), loss_scale)
-
-      flags_core.parse_flags(
-          [__file__, "--dtype", dtype_str, "--loss_scale", "5"])
-
-      self.assertEqual(flags_core.get_loss_scale(flags.FLAGS), 5)
-
-    with self.assertRaises(SystemExit):
-      flags_core.parse_flags([__file__, "--dtype", "int8"])
-
-
-if __name__ == "__main__":
-  unittest.main()