Commit c0cfcc47 authored by Rick Ho
Browse files

fix rank of megatron dp

parent 593feab2
...@@ -84,7 +84,10 @@ class MegatronMLP(FMoETransformerMLP): ...@@ -84,7 +84,10 @@ class MegatronMLP(FMoETransformerMLP):
world_size=world_size, mp_group=group, world_size=world_size, mp_group=group,
expert_dp_comm='none' if args.distributed_experts else 'dp') expert_dp_comm='none' if args.distributed_experts else 'dp')
self.hidden_size = args.hidden_size self.hidden_size = args.hidden_size
self.rank = args.rank if args.distributed_experts:
self.rank = args.rank
else:
self.rank = 0
self.sigma = args.init_method_std self.sigma = args.init_method_std
self.num_layers = args.num_layers self.num_layers = args.num_layers
self.reset_parameters() self.reset_parameters()
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment