# constants.py
1
2
3
'''
Copyright 2020 The Microsoft DeepSpeed Team
'''
4
from datetime import timedelta
5
6
7
8
9

#############################################
# Torch distributed constants
#############################################
TORCH_DISTRIBUTED_DEFAULT_PORT = 29500
10
11
12
13
14
15
16

# Default process group wide timeout, if applicable.
# This only applies to the gloo and nccl backends
# (only if NCCL_BLOCKING_WAIT or NCCL_ASYNC_ERROR_HANDLING is set to 1).
# To make an attempt at backwards compatibility with THD, we use an
# extraordinarily high default timeout, given that THD did not have timeouts.
default_pg_timeout = timedelta(minutes=30)