Skip to content

Commit e92f119

Browse files
authored
Add barrier() after init_process_group() (#5475)
1 parent 55a8300 commit e92f119

File tree

4 files changed

+4
-0
lines changed

4 files changed

+4
-0
lines changed

references/classification/utils.py

+1
Original file line number | Diff line number | Diff line change
@@ -274,6 +274,7 @@ def init_distributed_mode(args):
274 274       torch.distributed.init_process_group(
275 275           backend=args.dist_backend, init_method=args.dist_url, world_size=args.world_size, rank=args.rank
276 276       )
    277 +     torch.distributed.barrier()
277 278       setup_for_distributed(args.rank == 0)
278 279
279 280

references/optical_flow/utils.py

+1
Original file line number | Diff line number | Diff line change
@@ -267,6 +267,7 @@ def setup_ddp(args):
267 267           world_size=args.world_size,
268 268           init_method=args.dist_url,
269 269       )
    270 +     torch.distributed.barrier()
270 271
271 272
272 273   def reduce_across_processes(val):

references/segmentation/utils.py

+1
Original file line number | Diff line number | Diff line change
@@ -291,4 +291,5 @@ def init_distributed_mode(args):
291 291       torch.distributed.init_process_group(
292 292           backend=args.dist_backend, init_method=args.dist_url, world_size=args.world_size, rank=args.rank
293 293       )
    294 +     torch.distributed.barrier()
294 295       setup_for_distributed(args.rank == 0)

references/video_classification/utils.py

+1
Original file line number | Diff line number | Diff line change
@@ -250,4 +250,5 @@ def init_distributed_mode(args):
250 250       torch.distributed.init_process_group(
251 251           backend=args.dist_backend, init_method=args.dist_url, world_size=args.world_size, rank=args.rank
252 252       )
    253 +     torch.distributed.barrier()
253 254       setup_for_distributed(args.rank == 0)

0 commit comments

Comments
 (0)