Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 0 additions & 1 deletion tests/kit/model_zoo/transformers/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,6 @@
from .chatglm2 import *
from .command import *
from .deepseek import *
from .deepseek_v3 import *
from .falcon import *
from .gpt import *
from .gptj import *
Expand Down
12 changes: 0 additions & 12 deletions tests/kit/model_zoo/transformers/deepseek_v3.py
Original file line number Diff line number Diff line change
Expand Up @@ -5,8 +5,6 @@
import transformers
from transformers import AutoConfig

from ..registry import ModelAttribute, model_zoo

# ===============================
# Register single-sentence DeepSeek-V3
# ===============================
Expand Down Expand Up @@ -75,13 +73,3 @@ def init_deepseek():
if m.__class__.__name__ == "DeepseekV3MoE":
m.moe_infer = MethodType(m.moe_infer.__wrapped__, m)
return model


model_zoo.register(
name="transformers_deepseek_v3",
model_fn=init_deepseek,
data_gen_fn=data_gen_for_lm,
output_transform_fn=output_transform_fn,
loss_fn=loss_fn_for_lm,
model_attribute=ModelAttribute(has_control_flow=True),
)
24 changes: 13 additions & 11 deletions tests/test_shardformer/test_model/test_shard_deepseek_v3.py
Original file line number Diff line number Diff line change
Expand Up @@ -11,7 +11,12 @@
from colossalai.booster.plugin.moe_hybrid_parallel_plugin import MoeHybridParallelPlugin
from colossalai.testing import parameterize, rerun_if_address_is_in_use, spawn
from colossalai.testing.random import seed_all
from tests.kit.model_zoo import model_zoo
from tests.kit.model_zoo.transformers.deepseek_v3 import (
data_gen_for_lm,
init_deepseek,
loss_fn_for_lm,
output_transform_fn,
)
from tests.test_shardformer.test_model._utils import (
build_model_from_hybrid_plugin,
run_forward_backward_with_hybrid_plugin,
Expand Down Expand Up @@ -74,16 +79,13 @@ def run_deepseek_v3_test(config: Tuple[int, ...]):
find_unused_parameters=True,
)

sub_model_zoo = model_zoo.get_sub_registry("transformers_deepseek_v3")
for name, (model_fn, data_gen_fn, output_transform_fn, loss_fn, _) in sub_model_zoo.items():

check_forward_backward(
model_fn,
data_gen_fn,
output_transform_fn,
loss_fn,
plugin_config,
)
check_forward_backward(
init_deepseek,
data_gen_for_lm,
output_transform_fn,
loss_fn_for_lm,
plugin_config,
)


def check_deepseek_v3(rank, world_size, port):
Expand Down
2 changes: 1 addition & 1 deletion version.txt
Original file line number Diff line number Diff line change
@@ -1 +1 @@
0.4.7
0.4.8
Loading