Skip to content

Commit 9379cbd

Browse files
authored
[release] update version (#6195)

* [release] update version
* fix test
* fix test
1 parent 24dee8f commit 9379cbd

File tree

4 files changed: 14 additions (+14) and 25 deletions (-25)

tests/kit/model_zoo/transformers/__init__.py

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,6 @@
55
from .chatglm2 import *
66
from .command import *
77
from .deepseek import *
8-
from .deepseek_v3 import *
98
from .falcon import *
109
from .gpt import *
1110
from .gptj import *

tests/kit/model_zoo/transformers/deepseek_v3.py

Lines changed: 0 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -5,8 +5,6 @@
55
import transformers
66
from transformers import AutoConfig
77

8-
from ..registry import ModelAttribute, model_zoo
9-
108
# ===============================
119
# Register single-sentence Mixtral
1210
# ===============================
@@ -75,13 +73,3 @@ def init_deepseek():
7573
if m.__class__.__name__ == "DeepseekV3MoE":
7674
m.moe_infer = MethodType(m.moe_infer.__wrapped__, m)
7775
return model
78-
79-
80-
model_zoo.register(
81-
name="transformers_deepseek_v3",
82-
model_fn=init_deepseek,
83-
data_gen_fn=data_gen_for_lm,
84-
output_transform_fn=output_transform_fn,
85-
loss_fn=loss_fn_for_lm,
86-
model_attribute=ModelAttribute(has_control_flow=True),
87-
)

tests/test_shardformer/test_model/test_shard_deepseek_v3.py

Lines changed: 13 additions & 11 deletions
Original file line numberDiff line numberDiff line change
@@ -11,7 +11,12 @@
1111
from colossalai.booster.plugin.moe_hybrid_parallel_plugin import MoeHybridParallelPlugin
1212
from colossalai.testing import parameterize, rerun_if_address_is_in_use, spawn
1313
from colossalai.testing.random import seed_all
14-
from tests.kit.model_zoo import model_zoo
14+
from tests.kit.model_zoo.transformers.deepseek_v3 import (
15+
data_gen_for_lm,
16+
init_deepseek,
17+
loss_fn_for_lm,
18+
output_transform_fn,
19+
)
1520
from tests.test_shardformer.test_model._utils import (
1621
build_model_from_hybrid_plugin,
1722
run_forward_backward_with_hybrid_plugin,
@@ -74,16 +79,13 @@ def run_deepseek_v3_test(config: Tuple[int, ...]):
7479
find_unused_parameters=True,
7580
)
7681

77-
sub_model_zoo = model_zoo.get_sub_registry("transformers_deepseek_v3")
78-
for name, (model_fn, data_gen_fn, output_transform_fn, loss_fn, _) in sub_model_zoo.items():
79-
80-
check_forward_backward(
81-
model_fn,
82-
data_gen_fn,
83-
output_transform_fn,
84-
loss_fn,
85-
plugin_config,
86-
)
82+
check_forward_backward(
83+
init_deepseek,
84+
data_gen_for_lm,
85+
output_transform_fn,
86+
loss_fn_for_lm,
87+
plugin_config,
88+
)
8789

8890

8991
def check_deepseek_v3(rank, world_size, port):

version.txt

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1 +1 @@
1-
0.4.7
1+
0.4.8

0 commit comments

Comments (0)