Commit b6188fc4 authored by Deyu Fu
Browse files

address comment

parent d665ab90
......@@ -100,10 +100,7 @@ class FusedAdam(torch.optim.Optimizer):
if clip > 1:
combined_scale = clip * scale
# set bias correction for this group
bias_correction = 0
if group['bias_correction']:
bias_correction = 1
bias_correction = 1 if group['bias_correction'] else 0
for p, grad, output_param in zip(group['params'], grads_this_group, output_params_this_group):
#note: p.grad should not ever be set for correct operation of mixed precision optimizer that sometimes sends None gradients
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment