-
Notifications
You must be signed in to change notification settings - Fork 163
Expand file tree
/
Copy path__init__.py
More file actions
105 lines (101 loc) · 3.24 KB
/
__init__.py
File metadata and controls
105 lines (101 loc) · 3.24 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
# Copyright 2025 Bytedance Ltd. and/or its affiliates
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
from .async_ulysses import (
async_ulysses_output_projection,
async_ulysses_qkv_projection,
divide_qkv_linear_bias,
divide_qkv_linear_weight,
)
from .comm import (
get_context_parallel_group,
get_context_parallel_rank,
get_context_parallel_world_size,
get_data_parallel_group,
get_data_parallel_rank,
get_ulysses_sequence_parallel_group,
get_ulysses_sequence_parallel_rank,
get_ulysses_sequence_parallel_world_size,
get_unified_sequence_parallel_group,
get_unified_sequence_parallel_rank,
get_unified_sequence_parallel_world_size,
init_sequence_parallel,
set_context_parallel_group,
set_data_parallel_group,
set_ulysses_sequence_parallel_group,
set_unified_sequence_parallel_group,
)
from .data import (
gather_outputs,
sequence_parallel_preprocess,
slice_input_tensor,
slice_input_tensor_scale_grad,
slice_position_embedding,
sp_pad_and_slice,
)
from .loss import reduce_sequence_parallel_loss
from .ulysses import (
all_to_all_images,
gather_heads_scatter_seq,
gather_seq_scatter_heads,
)
from .utils import pad_tensor, unpad_tensor, vlm_images_a2a_meta
from .vision_dp import (
assign_images_to_dp_ranks,
create_dp_vision_forward,
gather_vision_embeddings,
get_image_embedding_counts,
get_image_patch_counts,
prepare_local_vision_inputs,
)
# Public API of this package: the names bound by `from <package> import *`.
# Each entry is re-exported from one of the sibling submodules imported in
# this file; the comments below say which submodule each run of names comes
# from. Keep this a plain list literal of strings so that linters and type
# checkers can read it statically, and add a matching entry whenever a new
# name is imported here for re-export.
__all__ = [
# --- from .comm: initialisation plus setters/getters for the data-parallel,
# --- Ulysses, context-parallel and unified sequence-parallel groups
"init_sequence_parallel",
"set_data_parallel_group",
"get_data_parallel_group",
"get_data_parallel_rank",
"set_ulysses_sequence_parallel_group",
"get_ulysses_sequence_parallel_world_size",
"get_ulysses_sequence_parallel_rank",
"get_ulysses_sequence_parallel_group",
"set_context_parallel_group",
"get_context_parallel_group",
"get_context_parallel_rank",
"get_context_parallel_world_size",
"set_unified_sequence_parallel_group",
"get_unified_sequence_parallel_group",
"get_unified_sequence_parallel_rank",
"get_unified_sequence_parallel_world_size",
# --- from .data
"slice_input_tensor",
"slice_input_tensor_scale_grad",
"slice_position_embedding",
"sp_pad_and_slice",
"sequence_parallel_preprocess",
# --- from .ulysses
"gather_heads_scatter_seq",
"gather_seq_scatter_heads",
"all_to_all_images",
# --- from .data (listed apart from the other .data names above)
"gather_outputs",
# --- from .utils
"vlm_images_a2a_meta",
"pad_tensor",
"unpad_tensor",
# --- from .loss
"reduce_sequence_parallel_loss",
# --- from .async_ulysses
"async_ulysses_qkv_projection",
"async_ulysses_output_projection",
"divide_qkv_linear_weight",
"divide_qkv_linear_bias",
# --- from .vision_dp
"get_image_patch_counts",
"get_image_embedding_counts",
"assign_images_to_dp_ranks",
"prepare_local_vision_inputs",
"gather_vision_embeddings",
"create_dp_vision_forward",
]