From 9c7aa67126c6914436c3152047d111a9561a8ab5 Mon Sep 17 00:00:00 2001 From: ver217 Date: Tue, 18 Feb 2025 14:51:08 +0800 Subject: [PATCH 1/3] [release] update version --- version.txt | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/version.txt b/version.txt index f90568270955..cb498ab2c89f 100644 --- a/version.txt +++ b/version.txt @@ -1 +1 @@ -0.4.7 +0.4.8 From 2fa095202df7b2a7bc7d5dd3b5b0c7c9742fc2d3 Mon Sep 17 00:00:00 2001 From: ver217 Date: Wed, 19 Feb 2025 09:46:01 +0800 Subject: [PATCH 2/3] fix test --- tests/kit/model_zoo/transformers/__init__.py | 1 - .../test_model/test_shard_deepseek_v3.py | 24 ++++++++++--------- 2 files changed, 13 insertions(+), 12 deletions(-) diff --git a/tests/kit/model_zoo/transformers/__init__.py b/tests/kit/model_zoo/transformers/__init__.py index a075cdac1bca..4adc386192d3 100644 --- a/tests/kit/model_zoo/transformers/__init__.py +++ b/tests/kit/model_zoo/transformers/__init__.py @@ -5,7 +5,6 @@ from .chatglm2 import * from .command import * from .deepseek import * -from .deepseek_v3 import * from .falcon import * from .gpt import * from .gptj import * diff --git a/tests/test_shardformer/test_model/test_shard_deepseek_v3.py b/tests/test_shardformer/test_model/test_shard_deepseek_v3.py index aeded5466095..52cb8365d03e 100644 --- a/tests/test_shardformer/test_model/test_shard_deepseek_v3.py +++ b/tests/test_shardformer/test_model/test_shard_deepseek_v3.py @@ -11,7 +11,12 @@ from colossalai.booster.plugin.moe_hybrid_parallel_plugin import MoeHybridParallelPlugin from colossalai.testing import parameterize, rerun_if_address_is_in_use, spawn from colossalai.testing.random import seed_all -from tests.kit.model_zoo import model_zoo +from tests.kit.model_zoo.transformers.deepseek_v3 import ( + data_gen_for_lm, + init_deepseek, + loss_fn_for_lm, + output_transform_fn, +) from tests.test_shardformer.test_model._utils import ( build_model_from_hybrid_plugin, run_forward_backward_with_hybrid_plugin, @@ -74,16 +79,13 @@ def run_deepseek_v3_test(config: Tuple[int, ...]): find_unused_parameters=True, ) - sub_model_zoo = model_zoo.get_sub_registry("transformers_deepseek_v3") - for name, (model_fn, data_gen_fn, output_transform_fn, loss_fn, _) in sub_model_zoo.items(): - - check_forward_backward( - model_fn, - data_gen_fn, - output_transform_fn, - loss_fn, - plugin_config, - ) + check_forward_backward( + init_deepseek, + data_gen_for_lm, + output_transform_fn, + loss_fn_for_lm, + plugin_config, + ) def check_deepseek_v3(rank, world_size, port): From 07438b37249751229ebbf4115f3c0dafdeddb393 Mon Sep 17 00:00:00 2001 From: ver217 Date: Wed, 19 Feb 2025 16:54:28 +0800 Subject: [PATCH 3/3] fix test --- tests/kit/model_zoo/transformers/deepseek_v3.py | 12 ------------ 1 file changed, 12 deletions(-) diff --git a/tests/kit/model_zoo/transformers/deepseek_v3.py b/tests/kit/model_zoo/transformers/deepseek_v3.py index ffd71d95c601..ba15be3c8400 100644 --- a/tests/kit/model_zoo/transformers/deepseek_v3.py +++ b/tests/kit/model_zoo/transformers/deepseek_v3.py @@ -5,8 +5,6 @@ import transformers from transformers import AutoConfig -from ..registry import ModelAttribute, model_zoo - # =============================== # Register single-sentence Mixtral # =============================== @@ -75,13 +73,3 @@ def init_deepseek(): if m.__class__.__name__ == "DeepseekV3MoE": m.moe_infer = MethodType(m.moe_infer.__wrapped__, m) return model - - -model_zoo.register( - name="transformers_deepseek_v3", - model_fn=init_deepseek, - data_gen_fn=data_gen_for_lm, - output_transform_fn=output_transform_fn, - loss_fn=loss_fn_for_lm, - model_attribute=ModelAttribute(has_control_flow=True), -)