Skip to content

Commit 82e213c

Browse files
committed
reorg structure of model implementations
1 parent 74ebfe2 commit 82e213c

33 files changed: +365 -343 lines changed

internlm/checkpoint/checkpoint_manager.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -16,8 +16,8 @@
1616
auto_resume_sanity_check,
1717
ckpt_info_sanity_check,
1818
)
19-
from internlm.model.base_model import BaseModel
20-
from internlm.model.registry import model_initializer
19+
from internlm.model_implementations.registry import model_initializer
20+
from internlm.model_implementations.transformers.base_model import BaseModel
2121
from internlm.monitor import send_alert_message
2222
from internlm.solver.optimizer import HybridZeroOptimizer, HybridZeroOptimizer_v2
2323
from internlm.utils.common import get_current_device

internlm/checkpoint/load_funcs.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -1,8 +1,8 @@
11
# Copyright (c) InternLM. All rights reserved.
22

3-
from internlm.model.modeling_internlm import InternLM1
4-
from internlm.model.modeling_internlm2 import InternLM2
5-
from internlm.model.modeling_llama import Llama2
3+
from internlm.model_implementations.transformers.modeling_internlm import InternLM1
4+
from internlm.model_implementations.transformers.modeling_internlm2 import InternLM2
5+
from internlm.model_implementations.transformers.modeling_llama import Llama2
66
from internlm.utils.logger import get_logger
77

88
logger = get_logger(__file__)

internlm/core/trainer_builder.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -19,12 +19,12 @@
1919
from internlm.initialize.initialize_trainer import initialize_trainer
2020
from internlm.model.losses.ce_loss import InternLoss
2121
from internlm.model.metrics import AccPerplex
22+
from internlm.model_inject.inject import inject_model
2223
from internlm.monitor.monitor import send_alert_message
2324
from internlm.train.pipeline import (
2425
get_scheduler_hooks,
2526
initialize_llm_profile,
2627
initialize_optimizer,
27-
inject_model,
2828
load_new_batch,
2929
record_current_batch_training_metrics,
3030
)

internlm/model_implementations/__init__.py

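Whitespace-only changes.

(Note: the header of the next changed file is missing from this extract; the diff that follows belongs to a different file, not to `__init__.py`.)
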
Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -6,12 +6,12 @@
66
from internlm.core.context import ParallelMode
77
from internlm.core.context import global_context as gpc
88
from internlm.core.parallel.shard import pipeline_parallel_sharding_wrapper
9-
from internlm.model.base_model import BaseModel
109
from internlm.model.modules.linear import (
1110
ParallelLinearWithCommExt,
1211
ScaleColumnParallelLinear,
1312
)
14-
from internlm.model.registry import model_initializer
13+
from internlm.model_implementations.registry import model_initializer
14+
from internlm.model_implementations.transformers.base_model import BaseModel
1515
from internlm.utils.common import get_current_device
1616
from internlm.utils.lazy import LazyObject
1717
from internlm.utils.logger import get_logger

internlm/model/registry.py renamed to internlm/model_implementations/registry.py

Lines changed: 10 additions & 10 deletions
Original file line number | Diff line number | Diff line change
@@ -4,16 +4,16 @@
44

55
from typing import Callable
66

7-
from internlm.model.modeling_baichuan2 import Baichuan2
8-
from internlm.model.modeling_gemma import Gemma
9-
from internlm.model.modeling_internlm import InternLM1
10-
from internlm.model.modeling_internlm2 import InternLM2
11-
from internlm.model.modeling_llama import Llama2
12-
from internlm.model.modeling_llava import Llava
13-
from internlm.model.modeling_mixtral import MixtralMoE
14-
from internlm.model.modeling_moe import Internlm1MoE
15-
from internlm.model.modeling_qwen2 import Qwen2
16-
from internlm.model.modeling_qwen2_moe import Qwen2Moe
7+
from internlm.model_implementations.transformers.modeling_baichuan2 import Baichuan2
8+
from internlm.model_implementations.transformers.modeling_gemma import Gemma
9+
from internlm.model_implementations.transformers.modeling_internlm import InternLM1
10+
from internlm.model_implementations.transformers.modeling_internlm2 import InternLM2
11+
from internlm.model_implementations.transformers.modeling_llama import Llama2
12+
from internlm.model_implementations.transformers.modeling_llava import Llava
13+
from internlm.model_implementations.transformers.modeling_mixtral import MixtralMoE
14+
from internlm.model_implementations.transformers.modeling_moe import Internlm1MoE
15+
from internlm.model_implementations.transformers.modeling_qwen2 import Qwen2
16+
from internlm.model_implementations.transformers.modeling_qwen2_moe import Qwen2Moe
1717
from internlm.utils.common import SingletonMeta
1818
from internlm.utils.utils import ModelType
1919

internlm/model_implementations/transformers/__init__.py

Whitespace-only changes.

internlm/model/base_model.py renamed to internlm/model_implementations/transformers/base_model.py

File renamed without changes.

internlm/model/modeling_baichuan2.py renamed to internlm/model_implementations/transformers/modeling_baichuan2.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -17,7 +17,6 @@
1717
scaled_init_method_uniform,
1818
uniform_,
1919
)
20-
from internlm.model.base_model import BaseModel
2120
from internlm.model.modules.embedding import Embedding1D
2221
from internlm.model.modules.linear import new_linear
2322
from internlm.model.modules.mha import MHA
@@ -27,6 +26,7 @@
2726
convert_attn_args_to_kwargs,
2827
convert_attn_kwargs_to_args,
2928
)
29+
from internlm.model_implementations.transformers.base_model import BaseModel
3030
from internlm.solver.activation_checkpoint import activation_checkpoint
3131
from internlm.utils.logger import get_logger
3232
from internlm.utils.storage_manager import get_fns, llm_load, llm_save

internlm/model/modeling_gemma.py renamed to internlm/model_implementations/transformers/modeling_gemma.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -16,7 +16,6 @@
1616
scaled_init_method_uniform,
1717
uniform_,
1818
)
19-
from internlm.model.base_model import BaseModel
2019
from internlm.model.modules.embedding import Embedding1D
2120
from internlm.model.modules.linear import new_linear
2221
from internlm.model.modules.mha import GQA
@@ -26,6 +25,7 @@
2625
convert_attn_args_to_kwargs,
2726
convert_attn_kwargs_to_args,
2827
)
28+
from internlm.model_implementations.transformers.base_model import BaseModel
2929
from internlm.solver.activation_checkpoint import activation_checkpoint
3030
from internlm.utils.logger import get_logger
3131
from internlm.utils.storage_manager import get_fns, llm_load, llm_save

0 commit comments

Comments
 (0)