__init__.py 3.18 KB
Newer Older
Jared Casper's avatar
Jared Casper committed
1
# Copyright (c) 2022, NVIDIA CORPORATION. All rights reserved.
2
3
4
5
6
7
8

"""Model parallel utility interface."""

from .cross_entropy import vocab_parallel_cross_entropy

from .data import broadcast_data

9
from .initialize import is_unitialized
10
11
12
13
from .initialize import destroy_model_parallel
from .initialize import get_data_parallel_group
from .initialize import get_data_parallel_rank
from .initialize import get_data_parallel_world_size
14
from .initialize import get_embedding_group
Vijay Korthikanti's avatar
Vijay Korthikanti committed
15
from .initialize import get_position_embedding_group
16
from .initialize import get_model_parallel_group
17
18
19
20
21
from .initialize import get_tensor_model_parallel_group
from .initialize import get_pipeline_model_parallel_group
from .initialize import get_tensor_model_parallel_rank, set_tensor_model_parallel_rank
from .initialize import get_pipeline_model_parallel_rank, set_pipeline_model_parallel_rank
from .initialize import is_pipeline_first_stage, is_pipeline_last_stage
22
from .initialize import is_rank_in_embedding_group
Vijay Korthikanti's avatar
Vijay Korthikanti committed
23
from .initialize import is_rank_in_position_embedding_group
24
25
26
from .initialize import is_pipeline_stage_before_split, is_pipeline_stage_after_split
from .initialize import is_pipeline_stage_at_split
from .initialize import get_num_layers
27
from .initialize import get_tensor_model_parallel_src_rank
28
from .initialize import get_data_parallel_src_rank
29
30
from .initialize import get_pipeline_model_parallel_first_rank
from .initialize import get_pipeline_model_parallel_last_rank
31
32
from .initialize import get_pipeline_model_parallel_next_rank
from .initialize import get_pipeline_model_parallel_prev_rank
33
34
from .initialize import get_tensor_model_parallel_world_size, set_tensor_model_parallel_world_size
from .initialize import get_pipeline_model_parallel_world_size, set_pipeline_model_parallel_world_size
35
from .initialize import get_virtual_pipeline_model_parallel_rank, set_virtual_pipeline_model_parallel_rank
36
37
38
from .initialize import initialize_model_parallel
from .initialize import model_parallel_is_initialized

Vijay Korthikanti's avatar
Vijay Korthikanti committed
39
from .layers import LinearWithGradAccumulationAndAsyncCommunication
40
41
42
from .layers import ColumnParallelLinear
from .layers import RowParallelLinear
from .layers import VocabParallelEmbedding
43
44
from .layers import (set_tensor_model_parallel_attributes,
                     set_defaults_if_not_set_tensor_model_parallel_attributes,
mohammad's avatar
mohammad committed
45
                     copy_tensor_model_parallel_attributes)
46
47
48
 
from .mappings import  copy_to_tensor_model_parallel_region
from .mappings import  reduce_from_tensor_model_parallel_region
49
50
51
from .mappings import  scatter_to_tensor_model_parallel_region
from .mappings import  gather_from_tensor_model_parallel_region
from .mappings import  scatter_to_sequence_parallel_region
52
from .mappings import  gather_from_sequence_parallel_region
53
from .mappings import  reduce_scatter_to_sequence_parallel_region
54
55
56

from .random import checkpoint
from .random import get_cuda_rng_tracker
57
from .random import model_parallel_cuda_manual_seed
58
59
from .random import gather_split_1d_tensor
from .random import split_tensor_into_1d_equal_chunks
Lawrence McAfee's avatar
Lawrence McAfee committed
60
61
62
from .random import make_viewless_tensor
from .random import assert_viewless_tensor
from .random import safely_set_viewless_tensor_data
63

64
65
from .utils import divide
from .utils import split_tensor_along_last_dim