|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
"""Model parallel utility interface.""" |
|
|
|
from .cross_entropy import vocab_parallel_cross_entropy |
|
|
|
from .data import broadcast_data |
|
|
|
from .initialize import is_unitialized |
|
from .initialize import destroy_model_parallel |
|
from .initialize import get_data_parallel_group |
|
from .initialize import get_data_parallel_rank |
|
from .initialize import get_data_parallel_world_size |
|
from .initialize import get_embedding_group |
|
from .initialize import get_position_embedding_group |
|
from .initialize import get_model_parallel_group |
|
from .initialize import get_tensor_model_parallel_group |
|
from .initialize import get_pipeline_model_parallel_group |
|
from .initialize import get_tensor_model_parallel_rank, set_tensor_model_parallel_rank |
|
from .initialize import get_pipeline_model_parallel_rank, set_pipeline_model_parallel_rank |
|
from .initialize import is_pipeline_first_stage, is_pipeline_last_stage |
|
from .initialize import is_rank_in_embedding_group |
|
from .initialize import is_rank_in_position_embedding_group |
|
from .initialize import is_pipeline_stage_before_split, is_pipeline_stage_after_split |
|
from .initialize import is_pipeline_stage_at_split |
|
from .initialize import get_num_layers |
|
from .initialize import get_num_layers_decoder |
|
from .initialize import get_tensor_model_parallel_src_rank |
|
from .initialize import get_data_parallel_src_rank |
|
from .initialize import get_pipeline_model_parallel_first_rank |
|
from .initialize import get_pipeline_model_parallel_last_rank |
|
from .initialize import get_pipeline_model_parallel_next_rank |
|
from .initialize import get_pipeline_model_parallel_prev_rank |
|
from .initialize import get_tensor_model_parallel_world_size, set_tensor_model_parallel_world_size |
|
from .initialize import get_pipeline_model_parallel_world_size, set_pipeline_model_parallel_world_size |
|
from .initialize import get_virtual_pipeline_model_parallel_rank, set_virtual_pipeline_model_parallel_rank |
|
from .initialize import initialize_model_parallel |
|
from .initialize import model_parallel_is_initialized |
|
|
|
from .layers import LinearWithGradAccumulationAndAsyncCommunication |
|
from .layers import ColumnParallelLinear |
|
from .layers import RowParallelLinear |
|
from .layers import VocabParallelEmbedding |
|
from .layers import (set_tensor_model_parallel_attributes, |
|
set_defaults_if_not_set_tensor_model_parallel_attributes, |
|
copy_tensor_model_parallel_attributes) |
|
|
|
from .mappings import copy_to_tensor_model_parallel_region |
|
from .mappings import reduce_from_tensor_model_parallel_region |
|
from .mappings import scatter_to_tensor_model_parallel_region |
|
from .mappings import gather_from_tensor_model_parallel_region |
|
from .mappings import scatter_to_sequence_parallel_region |
|
from .mappings import gather_from_sequence_parallel_region |
|
from .mappings import reduce_scatter_to_sequence_parallel_region |
|
|
|
from .random import checkpoint |
|
from .random import get_cuda_rng_tracker |
|
from .random import model_parallel_cuda_manual_seed |
|
from .random import gather_split_1d_tensor |
|
from .random import split_tensor_into_1d_equal_chunks |
|
from .random import make_viewless_tensor |
|
from .random import assert_viewless_tensor |
|
from .random import safely_set_viewless_tensor_data |
|
|
|
from .utils import divide |
|
from .utils import split_tensor_along_last_dim |
|
|