OpenDAS / apex, commit e6925e6c

Authored May 30, 2020 by Thor Johnsen
Parent: 8ed8eaac

Bug fix
Showing 1 changed file with 3 additions and 3 deletions.

apex/contrib/optimizers/distributed_fused_lamb.py (+3, -3)
@@ -71,7 +71,7 @@ class DistributedFusedLAMB(torch.optim.Optimizer):
                  dwu_group_size=0, dwu_num_blocks=4, dwu_num_chunks=4,
                  dwu_num_rs_pg=1, dwu_num_ar_pg=4, dwu_num_ag_pg=0,
                  e5m2_allgather=False):
-        global fused_adam_cuda
+        global distributed_lamb_cuda
         distributed_lamb_cuda = importlib.import_module("distributed_lamb_cuda")
         self._amp_scale_adjustment = amp_scale_adjustment
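
A note on why the first hunk is a fix (my reading of the diff, not stated in the commit message): __init__ assigns distributed_lamb_cuda via importlib, so the global statement must name that variable; declaring global fused_adam_cuda instead would leave the assignment bound to a function-local name and the module-level distributed_lamb_cuda unset. A minimal standalone sketch of the scoping rule, using a hypothetical _backend name rather than the optimizer's actual globals:

    # Hypothetical module-level handle, standing in for distributed_lamb_cuda.
    _backend = None

    def init_without_global():
        # No 'global' statement: this assignment creates a local variable,
        # and the module-level _backend stays None (the buggy pattern).
        _backend = "loaded"

    def init_with_global():
        global _backend      # declare that we rebind the module-level name
        _backend = "loaded"  # now the module-level handle is actually set

    init_without_global()
    print(_backend)   # prints: None
    init_with_global()
    print(_backend)   # prints: loaded
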
@@ -286,8 +286,8 @@ class DistributedFusedLAMB(torch.optim.Optimizer):
         if self._contrib_min_param_i < 0: self._contrib_min_param_i = param_i
         self._contrib_max_param_i = param_i
         self._contrib_model_param_for_norm_num = len(self._contrib_model_param_for_norm_is_fp16)
-        if len(self._contrib_model_param_for_norm_fp16) == 0: len(self._contrib_model_param_for_norm_fp16 = None
-        if len(self._contrib_model_param_for_norm_fp32) == 0: len(self._contrib_model_param_for_norm_fp32 = None
+        if len(self._contrib_model_param_for_norm_fp16) == 0: self._contrib_model_param_for_norm_fp16 = None
+        if len(self._contrib_model_param_for_norm_fp32) == 0: self._contrib_model_param_for_norm_fp32 = None
         self._contrib_model_param_for_norm_is_fp16 = torch.tensor([is_fp16 for is_fp16 in self._contrib_model_param_for_norm_is_fp16], dtype=torch.bool, device='cuda')
         self._contrib_model_param_for_norm_is_fp32 = torch.tensor([not is_fp16 for is_fp16 in self._contrib_model_param_for_norm_is_fp16], dtype=torch.bool, device='cuda')
         self._contrib_model_param_for_norm_is_fp16 = None
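
The second hunk drops a stray "len(" that made the two assignments invalid; the intent, as far as the diff shows, is to replace an empty fp16 or fp32 parameter list with None once the norm bookkeeping is built, so later code can recognize an absent dtype group. A minimal sketch of the corrected pattern, using hypothetical params_fp16 / params_fp32 stand-ins for the _contrib_model_param_for_norm_* attributes:

    # Hypothetical stand-ins for self._contrib_model_param_for_norm_fp16 / _fp32.
    params_fp16 = []            # e.g. the model registered no fp16 params
    params_fp32 = [0.5, 1.5]    # some fp32 params

    # The old lines read "len(params_fp16 = None", which is not valid Python.
    # The fix assigns None to the list itself when it is empty:
    if len(params_fp16) == 0: params_fp16 = None
    if len(params_fp32) == 0: params_fp32 = None

    # Downstream code can then skip an absent dtype group with a None check:
    for name, group in (("fp16", params_fp16), ("fp32", params_fp32)):
        if group is None:
            continue                          # nothing to norm for this dtype
        print(name, "group size:", len(group))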