"git@developer.sourcefind.cn:lacacy/qwen_lmdeploy.git" did not exist on "902a3e16f937d4f142968dea265c9e03c8559bb8"
Commit 89dd9a4e authored by Zongwei Zhou, committed by A. Unique TensorFlower
Browse files

Internal change

PiperOrigin-RevId: 296767846
parent c25d7711
......@@ -137,10 +137,16 @@ class AdamWeightDecay(tf.keras.optimizers.Adam):
use_locking=self._use_locking)
return tf.no_op()
def apply_gradients(self,
                    grads_and_vars,
                    name=None,
                    all_reduce_sum_gradients=True):
  """Applies gradients after clipping them to a global norm of 1.0.

  Resolves the diff residue: the old single-argument signature and the
  bare `super().apply_gradients(zip(...))` call are replaced by the new
  form that forwards `name` and `all_reduce_sum_gradients` to the base
  Adam optimizer, keeping the signature backward compatible (both new
  parameters have defaults).

  Args:
    grads_and_vars: Iterable of (gradient, variable) pairs.
    name: Optional name for the returned apply operation; forwarded to
      the base class.
    all_reduce_sum_gradients: Whether gradients should be summed across
      replicas before being applied; forwarded to the base class.
      Defaults to True, matching the base optimizer's behavior.

  Returns:
    The operation returned by the base class's `apply_gradients`.
  """
  grads, tvars = list(zip(*grads_and_vars))
  # clip_norm=1.0 is hard-coded: gradients are rescaled whenever their
  # combined global norm exceeds 1.0 (standard BERT training practice).
  (grads, _) = tf.clip_by_global_norm(grads, clip_norm=1.0)
  return super(AdamWeightDecay, self).apply_gradients(
      zip(grads, tvars),
      name=name,
      all_reduce_sum_gradients=all_reduce_sum_gradients)
def _get_lr(self, var_device, var_dtype, apply_state):
"""Retrieves the learning rate with the given state."""
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment