Unverified commit e92f1195, authored by Vasilis Vryniotis and committed by GitHub
Browse files

Add barrier() after init_process_group() (#5475)

parent 55a8300b
......@@ -274,6 +274,7 @@ def init_distributed_mode(args):
torch.distributed.init_process_group(
backend=args.dist_backend, init_method=args.dist_url, world_size=args.world_size, rank=args.rank
)
torch.distributed.barrier()
setup_for_distributed(args.rank == 0)
......
......@@ -267,6 +267,7 @@ def setup_ddp(args):
world_size=args.world_size,
init_method=args.dist_url,
)
torch.distributed.barrier()
def reduce_across_processes(val):
......
......@@ -291,4 +291,5 @@ def init_distributed_mode(args):
torch.distributed.init_process_group(
backend=args.dist_backend, init_method=args.dist_url, world_size=args.world_size, rank=args.rank
)
torch.distributed.barrier()
setup_for_distributed(args.rank == 0)
......@@ -250,4 +250,5 @@ def init_distributed_mode(args):
torch.distributed.init_process_group(
backend=args.dist_backend, init_method=args.dist_url, world_size=args.world_size, rank=args.rank
)
torch.distributed.barrier()
setup_for_distributed(args.rank == 0)
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment