Commit 80c91145 authored by Lawrence McAfee
Browse files

added timing for count-zeros & inner-step.

parent e858d338
...@@ -435,11 +435,15 @@ class MixedPrecisionOptimizer(MegatronOptimizer): ...@@ -435,11 +435,15 @@ class MixedPrecisionOptimizer(MegatronOptimizer):
timers('optimizer-clip-main-grad').stop() timers('optimizer-clip-main-grad').stop()
# count the zeros in the grads # count the zeros in the grads
timers('optimizer-count-zeros').start()
num_zeros_in_grad = self.count_zeros() if \ num_zeros_in_grad = self.count_zeros() if \
self.log_num_zeros_in_grad else None self.log_num_zeros_in_grad else None
timers('optimizer-count-zeros').stop()
# Step the optimizer. # Step the optimizer.
timers('optimizer-inner-step').start()
self.optimizer.step() self.optimizer.step()
timers('optimizer-inner-step').stop()
# Update params from main params. # Update params from main params.
timers('optimizer-copy-main-to-model-params').start() timers('optimizer-copy-main-to-model-params').start()
......
...@@ -523,6 +523,8 @@ def training_log(loss_dict, total_loss_dict, learning_rate, iteration, ...@@ -523,6 +523,8 @@ def training_log(loss_dict, total_loss_dict, learning_rate, iteration,
add_to_logging('optimizer-copy-to-main-grad') add_to_logging('optimizer-copy-to-main-grad')
add_to_logging('optimizer-unscale-and-check-inf') add_to_logging('optimizer-unscale-and-check-inf')
add_to_logging('optimizer-clip-main-grad') add_to_logging('optimizer-clip-main-grad')
add_to_logging('optimizer-count-zeros')
add_to_logging('optimizer-inner-step')
add_to_logging('optimizer-copy-main-to-model-params') add_to_logging('optimizer-copy-main-to-model-params')
add_to_logging('optimizer') add_to_logging('optimizer')
add_to_logging('batch-generator') add_to_logging('batch-generator')
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment