Skip to content

Commit 82e213c

Browse files
committed
reorg structure of model implementations
1 parent 74ebfe2 commit 82e213c

33 files changed

+365
-343
lines changed

internlm/checkpoint/checkpoint_manager.py

+2-2
Original file line number | Diff line number | Diff line change
@@ -16,8 +16,8 @@
1616
auto_resume_sanity_check,
1717
ckpt_info_sanity_check,
1818
)
19-
from internlm.model.base_model import BaseModel
20-
from internlm.model.registry import model_initializer
19+
from internlm.model_implementations.registry import model_initializer
20+
from internlm.model_implementations.transformers.base_model import BaseModel
2121
from internlm.monitor import send_alert_message
2222
from internlm.solver.optimizer import HybridZeroOptimizer, HybridZeroOptimizer_v2
2323
from internlm.utils.common import get_current_device

internlm/checkpoint/load_funcs.py

+3-3
Original file line number | Diff line number | Diff line change
@@ -1,8 +1,8 @@
11
# Copyright (c) InternLM. All rights reserved.
22

3-
from internlm.model.modeling_internlm import InternLM1
4-
from internlm.model.modeling_internlm2 import InternLM2
5-
from internlm.model.modeling_llama import Llama2
3+
from internlm.model_implementations.transformers.modeling_internlm import InternLM1
4+
from internlm.model_implementations.transformers.modeling_internlm2 import InternLM2
5+
from internlm.model_implementations.transformers.modeling_llama import Llama2
66
from internlm.utils.logger import get_logger
77

88
logger = get_logger(__file__)

internlm/core/trainer_builder.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -19,12 +19,12 @@
1919
from internlm.initialize.initialize_trainer import initialize_trainer
2020
from internlm.model.losses.ce_loss import InternLoss
2121
from internlm.model.metrics import AccPerplex
22+
from internlm.model_inject.inject import inject_model
2223
from internlm.monitor.monitor import send_alert_message
2324
from internlm.train.pipeline import (
2425
get_scheduler_hooks,
2526
initialize_llm_profile,
2627
initialize_optimizer,
27-
inject_model,
2828
load_new_batch,
2929
record_current_batch_training_metrics,
3030
)

internlm/model_implementations/__init__.py

Whitespace-only changes.

internlm/model/builder.py → internlm/model_implementations/builder.py

+2-2
Original file line number | Diff line number | Diff line change
@@ -6,12 +6,12 @@
66
from internlm.core.context import ParallelMode
77
from internlm.core.context import global_context as gpc
88
from internlm.core.parallel.shard import pipeline_parallel_sharding_wrapper
9-
from internlm.model.base_model import BaseModel
109
from internlm.model.modules.linear import (
1110
ParallelLinearWithCommExt,
1211
ScaleColumnParallelLinear,
1312
)
14-
from internlm.model.registry import model_initializer
13+
from internlm.model_implementations.registry import model_initializer
14+
from internlm.model_implementations.transformers.base_model import BaseModel
1515
from internlm.utils.common import get_current_device
1616
from internlm.utils.lazy import LazyObject
1717
from internlm.utils.logger import get_logger

internlm/model/registry.py → internlm/model_implementations/registry.py

+10-10
Original file line number | Diff line number | Diff line change
@@ -4,16 +4,16 @@
44

55
from typing import Callable
66

7-
from internlm.model.modeling_baichuan2 import Baichuan2
8-
from internlm.model.modeling_gemma import Gemma
9-
from internlm.model.modeling_internlm import InternLM1
10-
from internlm.model.modeling_internlm2 import InternLM2
11-
from internlm.model.modeling_llama import Llama2
12-
from internlm.model.modeling_llava import Llava
13-
from internlm.model.modeling_mixtral import MixtralMoE
14-
from internlm.model.modeling_moe import Internlm1MoE
15-
from internlm.model.modeling_qwen2 import Qwen2
16-
from internlm.model.modeling_qwen2_moe import Qwen2Moe
7+
from internlm.model_implementations.transformers.modeling_baichuan2 import Baichuan2
8+
from internlm.model_implementations.transformers.modeling_gemma import Gemma
9+
from internlm.model_implementations.transformers.modeling_internlm import InternLM1
10+
from internlm.model_implementations.transformers.modeling_internlm2 import InternLM2
11+
from internlm.model_implementations.transformers.modeling_llama import Llama2
12+
from internlm.model_implementations.transformers.modeling_llava import Llava
13+
from internlm.model_implementations.transformers.modeling_mixtral import MixtralMoE
14+
from internlm.model_implementations.transformers.modeling_moe import Internlm1MoE
15+
from internlm.model_implementations.transformers.modeling_qwen2 import Qwen2
16+
from internlm.model_implementations.transformers.modeling_qwen2_moe import Qwen2Moe
1717
from internlm.utils.common import SingletonMeta
1818
from internlm.utils.utils import ModelType
1919

internlm/model_implementations/transformers/__init__.py

Whitespace-only changes.

internlm/model/modeling_baichuan2.py → internlm/model_implementations/transformers/modeling_baichuan2.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -17,7 +17,6 @@
1717
scaled_init_method_uniform,
1818
uniform_,
1919
)
20-
from internlm.model.base_model import BaseModel
2120
from internlm.model.modules.embedding import Embedding1D
2221
from internlm.model.modules.linear import new_linear
2322
from internlm.model.modules.mha import MHA
@@ -27,6 +26,7 @@
2726
convert_attn_args_to_kwargs,
2827
convert_attn_kwargs_to_args,
2928
)
29+
from internlm.model_implementations.transformers.base_model import BaseModel
3030
from internlm.solver.activation_checkpoint import activation_checkpoint
3131
from internlm.utils.logger import get_logger
3232
from internlm.utils.storage_manager import get_fns, llm_load, llm_save

internlm/model/modeling_gemma.py → internlm/model_implementations/transformers/modeling_gemma.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -16,7 +16,6 @@
1616
scaled_init_method_uniform,
1717
uniform_,
1818
)
19-
from internlm.model.base_model import BaseModel
2019
from internlm.model.modules.embedding import Embedding1D
2120
from internlm.model.modules.linear import new_linear
2221
from internlm.model.modules.mha import GQA
@@ -26,6 +25,7 @@
2625
convert_attn_args_to_kwargs,
2726
convert_attn_kwargs_to_args,
2827
)
28+
from internlm.model_implementations.transformers.base_model import BaseModel
2929
from internlm.solver.activation_checkpoint import activation_checkpoint
3030
from internlm.utils.logger import get_logger
3131
from internlm.utils.storage_manager import get_fns, llm_load, llm_save

internlm/model/modeling_internlm.py → internlm/model_implementations/transformers/modeling_internlm.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -15,7 +15,6 @@
1515
from internlm.core.naive_amp import set_output_attr_to_module
1616
from internlm.core.parallel.shard import partition_uniform
1717
from internlm.initialize.initialize_tensor import normal_, scaled_init_method_normal
18-
from internlm.model.base_model import BaseModel
1918
from internlm.model.modules.embedding import Embedding1D
2019
from internlm.model.modules.linear import new_linear
2120
from internlm.model.modules.mha import MHA
@@ -27,6 +26,7 @@
2726
internlm1_mha_pre_load_convert,
2827
internlm1_mha_save_convert,
2928
)
29+
from internlm.model_implementations.transformers.base_model import BaseModel
3030
from internlm.solver.activation_checkpoint import activation_checkpoint
3131
from internlm.utils.logger import get_logger
3232
from internlm.utils.storage_manager import get_fns, llm_load, llm_save

internlm/model/modeling_internlm2.py → internlm/model_implementations/transformers/modeling_internlm2.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -18,7 +18,6 @@
1818
scaled_init_method_uniform,
1919
uniform_,
2020
)
21-
from internlm.model.base_model import BaseModel
2221
from internlm.model.modules.embedding import Embedding1D
2322
from internlm.model.modules.linear import new_linear
2423
from internlm.model.modules.mha import GQA
@@ -29,6 +28,7 @@
2928
convert_attn_kwargs_to_args,
3029
get_parallel_size_from_file,
3130
)
31+
from internlm.model_implementations.transformers.base_model import BaseModel
3232
from internlm.solver.activation_checkpoint import activation_checkpoint
3333
from internlm.utils.logger import get_logger
3434
from internlm.utils.storage_manager import get_fns, llm_load, llm_save

internlm/model/modeling_llama.py → internlm/model_implementations/transformers/modeling_llama.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -16,7 +16,6 @@
1616
scaled_init_method_uniform,
1717
uniform_,
1818
)
19-
from internlm.model.base_model import BaseModel
2019
from internlm.model.modules.embedding import Embedding1D
2120
from internlm.model.modules.linear import new_linear
2221
from internlm.model.modules.mha import GQA
@@ -26,6 +25,7 @@
2625
convert_attn_args_to_kwargs,
2726
convert_attn_kwargs_to_args,
2827
)
28+
from internlm.model_implementations.transformers.base_model import BaseModel
2929
from internlm.solver.activation_checkpoint import activation_checkpoint
3030
from internlm.utils.logger import get_logger
3131
from internlm.utils.storage_manager import get_fns, llm_load, llm_save

internlm/model/modeling_llava.py → internlm/model_implementations/transformers/modeling_llava.py

+2-2
Original file line number | Diff line number | Diff line change
@@ -7,13 +7,13 @@
77
from internlm.core.context.parallel_context import global_context as gpc
88
from internlm.core.naive_amp import set_output_attr_to_module
99
from internlm.initialize.initialize_tensor import normal_, uniform_
10-
from internlm.model.base_model import BaseModel
1110
from internlm.model.llava.clip_builder import build_vision_tower
1211
from internlm.model.llava.projector_builder import build_vision_projector
13-
from internlm.model.modeling_llama import Llama2Decoder
1412
from internlm.model.modules.embedding import Embedding1D
1513
from internlm.model.modules.linear import new_linear
1614
from internlm.model.modules.norm import new_layer_norm
15+
from internlm.model_implementations.transformers.base_model import BaseModel
16+
from internlm.model_implementations.transformers.modeling_llama import Llama2Decoder
1717
from internlm.utils.logger import get_logger
1818

1919
logger = get_logger(__file__)

internlm/model/modeling_mixtral.py → internlm/model_implementations/transformers/modeling_mixtral.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -10,7 +10,6 @@
1010
from internlm.core.context import ParallelMode
1111
from internlm.core.context.parallel_context import global_context as gpc
1212
from internlm.initialize.initialize_tensor import normal_, scaled_init_method_normal
13-
from internlm.model.base_model import BaseModel
1413
from internlm.model.modules.embedding import Embedding1D
1514
from internlm.model.modules.linear import new_linear
1615
from internlm.model.modules.mha import SWA
@@ -21,6 +20,7 @@
2120
convert_attn_args_to_kwargs,
2221
convert_attn_kwargs_to_args,
2322
)
23+
from internlm.model_implementations.transformers.base_model import BaseModel
2424
from internlm.solver.activation_checkpoint import activation_checkpoint
2525
from internlm.utils.logger import get_logger
2626

internlm/model/modeling_moe.py → internlm/model_implementations/transformers/modeling_moe.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -10,7 +10,6 @@
1010
from internlm.core.context import ParallelMode
1111
from internlm.core.context.parallel_context import global_context as gpc
1212
from internlm.initialize.initialize_tensor import normal_, scaled_init_method_normal
13-
from internlm.model.base_model import BaseModel
1413
from internlm.model.modules.embedding import Embedding1D
1514
from internlm.model.modules.linear import new_linear
1615
from internlm.model.modules.mha import MHA
@@ -23,6 +22,7 @@
2322
internlm1_mha_pre_load_convert,
2423
internlm1_mha_save_convert,
2524
)
25+
from internlm.model_implementations.transformers.base_model import BaseModel
2626
from internlm.solver.activation_checkpoint import activation_checkpoint
2727
from internlm.utils.logger import get_logger
2828

internlm/model/modeling_qwen2.py → internlm/model_implementations/transformers/modeling_qwen2.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -16,7 +16,6 @@
1616
scaled_init_method_uniform,
1717
uniform_,
1818
)
19-
from internlm.model.base_model import BaseModel
2019
from internlm.model.modules.embedding import Embedding1D
2120
from internlm.model.modules.linear import new_linear
2221
from internlm.model.modules.mha import SWA
@@ -26,6 +25,7 @@
2625
convert_attn_args_to_kwargs,
2726
convert_attn_kwargs_to_args,
2827
)
28+
from internlm.model_implementations.transformers.base_model import BaseModel
2929
from internlm.solver.activation_checkpoint import activation_checkpoint
3030
from internlm.utils.logger import get_logger
3131
from internlm.utils.storage_manager import get_fns, llm_load, llm_save

internlm/model/modeling_qwen2_moe.py → internlm/model_implementations/transformers/modeling_qwen2_moe.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -14,7 +14,6 @@
1414
scaled_init_method_uniform,
1515
uniform_,
1616
)
17-
from internlm.model.base_model import BaseModel
1817
from internlm.model.modules.embedding import Embedding1D
1918
from internlm.model.modules.linear import new_linear
2019
from internlm.model.modules.mha import SWA
@@ -25,6 +24,7 @@
2524
convert_attn_args_to_kwargs,
2625
convert_attn_kwargs_to_args,
2726
)
27+
from internlm.model_implementations.transformers.base_model import BaseModel
2828
from internlm.solver.activation_checkpoint import activation_checkpoint
2929
from internlm.utils.logger import get_logger
3030

internlm/model_inject/__init__.py

Whitespace-only changes.

0 commit comments

Comments
 (0)