Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
OpenDAS
Megatron-LM
Commits
e0a12fe1
Commit
e0a12fe1
authored
Nov 08, 2022
by
Jared Casper
Browse files
Fix merge error.
parent
d3a416cd
Changes
1
Show whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
4 additions
and
4 deletions
+4
-4
megatron/model/transformer.py
megatron/model/transformer.py
+4
-4
No files found.
megatron/model/transformer.py
View file @
e0a12fe1
...
...
@@ -738,7 +738,7 @@ class NoopTransformerLayer(MegatronModule):
def
_get_num_layers
(
args
,
is_encoder_and_decoder_model
,
is_decoder
=
False
):
"""Compute the number of transformer layers resident on the current rank."""
if
get_pipeline_model_parallel_world_size
()
>
1
:
if
mpu
.
get_pipeline_model_parallel_world_size
()
>
1
:
if
is_encoder_and_decoder_model
:
assert
args
.
pipeline_model_parallel_split_rank
is
not
None
...
...
@@ -756,11 +756,11 @@ def _get_num_layers(args, is_encoder_and_decoder_model, is_decoder=False):
'encoder_num_layers (%d) must be divisible by number of ranks given to encoder (%d)'
%
(
args
.
encoder_num_layers
,
num_ranks_in_encoder
)
assert
args
.
decoder_num_layers
%
num_ranks_in_decoder
==
0
,
\
'decoder_num_layers (%d) must be divisible by number of ranks given to decoder (%d)'
%
(
args
.
decoder_num_layers
,
num_ranks_in_decoder
)
if
is_pipeline_stage_before_split
():
if
mpu
.
is_pipeline_stage_before_split
():
num_layers
=
(
0
if
args
.
standalone_embedding_stage
and
get_pipeline_model_parallel_rank
()
==
0
else
and
mpu
.
get_pipeline_model_parallel_rank
()
==
0
else
args
.
encoder_num_layers
//
num_ranks_in_encoder
)
else
:
...
...
@@ -777,7 +777,7 @@ def _get_num_layers(args, is_encoder_and_decoder_model, is_decoder=False):
num_layers
=
(
0
if
args
.
standalone_embedding_stage
and
get_pipeline_model_parallel_rank
()
==
0
else
and
mpu
.
get_pipeline_model_parallel_rank
()
==
0
else
args
.
num_layers
//
args
.
transformer_pipeline_model_parallel_size
)
else
:
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment