Commit a90e36a4 authored by A. Unique TensorFlower's avatar A. Unique TensorFlower
Browse files

Internal change

PiperOrigin-RevId: 371640518
parent 8454dedc
...@@ -65,10 +65,10 @@ def _filter_and_allreduce_gradients(grads_and_vars, ...@@ -65,10 +65,10 @@ def _filter_and_allreduce_gradients(grads_and_vars,
(grads, variables) = zip(*filtered_grads_and_vars) (grads, variables) = zip(*filtered_grads_and_vars)
if allreduce_precision == "float16": if allreduce_precision == "float16":
grads = [tf.cast(grad, "float16") for grad in grads] grads = [tf.cast(grad, "float16") for grad in grads]
hints = tf.distribute.experimental.CollectiveHints( hints = tf.distribute.experimental.CommunicationOptions(
bytes_per_pack=bytes_per_pack) bytes_per_pack=bytes_per_pack)
allreduced_grads = tf.distribute.get_replica_context().all_reduce( allreduced_grads = tf.distribute.get_strategy( # pylint: disable=protected-access
tf.distribute.ReduceOp.SUM, grads, hints) ).extended._replica_ctx_all_reduce(tf.distribute.ReduceOp.SUM, grads, hints)
if allreduce_precision == "float16": if allreduce_precision == "float16":
allreduced_grads = [tf.cast(grad, "float32") for grad in allreduced_grads] allreduced_grads = [tf.cast(grad, "float32") for grad in allreduced_grads]
return allreduced_grads, variables return allreduced_grads, variables
......
...@@ -97,8 +97,7 @@ def run(flags_obj): ...@@ -97,8 +97,7 @@ def run(flags_obj):
Returns: Returns:
Dictionary of training and eval stats. Dictionary of training and eval stats.
""" """
keras_utils.set_session_config( keras_utils.set_session_config()
enable_xla=flags_obj.enable_xla)
performance.set_mixed_precision_policy(flags_core.get_tf_dtype(flags_obj)) performance.set_mixed_precision_policy(flags_core.get_tf_dtype(flags_obj))
if tf.config.list_physical_devices('GPU'): if tf.config.list_physical_devices('GPU'):
......
...@@ -167,7 +167,8 @@ class ResnetRunnable(orbit.StandardTrainer, orbit.StandardEvaluator): ...@@ -167,7 +167,8 @@ class ResnetRunnable(orbit.StandardTrainer, orbit.StandardEvaluator):
tape, self.optimizer, loss, self.model.trainable_variables) tape, self.optimizer, loss, self.model.trainable_variables)
self.train_loss.update_state(loss) self.train_loss.update_state(loss)
self.train_accuracy.update_state(labels, logits) self.train_accuracy.update_state(labels, logits)
if self.flags_obj.enable_xla:
step_fn = tf.function(step_fn, jit_compile=True)
self.strategy.run(step_fn, args=(next(iterator),)) self.strategy.run(step_fn, args=(next(iterator),))
def train_loop_end(self): def train_loop_end(self):
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment