Skip to content

Commit 6075d1e

Browse files
committed
reorg structure of model implementations
1 parent 74ebfe2 commit 6075d1e

33 files changed

+365 -343 lines changed

internlm/checkpoint/checkpoint_manager.py

+2-2
Original file line number | Diff line number | Diff line change
@@ -16,8 +16,8 @@
1616
auto_resume_sanity_check,
1717
ckpt_info_sanity_check,
1818
)
19-
from internlm.model.base_model import BaseModel
20-
from internlm.model.registry import model_initializer
19+
from internlm.model_implementations.registry import model_initializer
20+
from internlm.model_implementations.transformers.base_model import BaseModel
2121
from internlm.monitor import send_alert_message
2222
from internlm.solver.optimizer import HybridZeroOptimizer, HybridZeroOptimizer_v2
2323
from internlm.utils.common import get_current_device

internlm/checkpoint/load_funcs.py

+3-3
Original file line number | Diff line number | Diff line change
@@ -1,8 +1,8 @@
11
# Copyright (c) InternLM. All rights reserved.
22

3-
from internlm.model.modeling_internlm import InternLM1
4-
from internlm.model.modeling_internlm2 import InternLM2
5-
from internlm.model.modeling_llama import Llama2
3+
from internlm.model_implementations.transformers.modeling_internlm import InternLM1
4+
from internlm.model_implementations.transformers.modeling_internlm2 import InternLM2
5+
from internlm.model_implementations.transformers.modeling_llama import Llama2
66
from internlm.utils.logger import get_logger
77

88
logger = get_logger(__file__)

internlm/core/trainer_builder.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -17,14 +17,14 @@
1717
from internlm.data.train_state import get_train_state
1818
from internlm.eval.evaluation import evaluate_on_val_dls
1919
from internlm.initialize.initialize_trainer import initialize_trainer
20+
from internlm.model_inject.inject import inject_model
2021
from internlm.model.losses.ce_loss import InternLoss
2122
from internlm.model.metrics import AccPerplex
2223
from internlm.monitor.monitor import send_alert_message
2324
from internlm.train.pipeline import (
2425
get_scheduler_hooks,
2526
initialize_llm_profile,
2627
initialize_optimizer,
27-
inject_model,
2828
load_new_batch,
2929
record_current_batch_training_metrics,
3030
)

internlm/model_implementations/__init__.py

Whitespace-only changes.

internlm/model/builder.py → internlm/model_implementations/builder.py

+2-2
Original file line number | Diff line number | Diff line change
@@ -6,12 +6,12 @@
66
from internlm.core.context import ParallelMode
77
from internlm.core.context import global_context as gpc
88
from internlm.core.parallel.shard import pipeline_parallel_sharding_wrapper
9-
from internlm.model.base_model import BaseModel
9+
from internlm.model_implementations.transformers.base_model import BaseModel
1010
from internlm.model.modules.linear import (
1111
ParallelLinearWithCommExt,
1212
ScaleColumnParallelLinear,
1313
)
14-
from internlm.model.registry import model_initializer
14+
from internlm.model_implementations.registry import model_initializer
1515
from internlm.utils.common import get_current_device
1616
from internlm.utils.lazy import LazyObject
1717
from internlm.utils.logger import get_logger

internlm/model/registry.py → internlm/model_implementations/registry.py

+10-10
Original file line number | Diff line number | Diff line change
@@ -4,16 +4,16 @@
44

55
from typing import Callable
66

7-
from internlm.model.modeling_baichuan2 import Baichuan2
8-
from internlm.model.modeling_gemma import Gemma
9-
from internlm.model.modeling_internlm import InternLM1
10-
from internlm.model.modeling_internlm2 import InternLM2
11-
from internlm.model.modeling_llama import Llama2
12-
from internlm.model.modeling_llava import Llava
13-
from internlm.model.modeling_mixtral import MixtralMoE
14-
from internlm.model.modeling_moe import Internlm1MoE
15-
from internlm.model.modeling_qwen2 import Qwen2
16-
from internlm.model.modeling_qwen2_moe import Qwen2Moe
7+
from internlm.model_implementations.transformers.modeling_baichuan2 import Baichuan2
8+
from internlm.model_implementations.transformers.modeling_gemma import Gemma
9+
from internlm.model_implementations.transformers.modeling_internlm import InternLM1
10+
from internlm.model_implementations.transformers.modeling_internlm2 import InternLM2
11+
from internlm.model_implementations.transformers.modeling_llama import Llama2
12+
from internlm.model_implementations.transformers.modeling_llava import Llava
13+
from internlm.model_implementations.transformers.modeling_mixtral import MixtralMoE
14+
from internlm.model_implementations.transformers.modeling_moe import Internlm1MoE
15+
from internlm.model_implementations.transformers.modeling_qwen2 import Qwen2
16+
from internlm.model_implementations.transformers.modeling_qwen2_moe import Qwen2Moe
1717
from internlm.utils.common import SingletonMeta
1818
from internlm.utils.utils import ModelType
1919

internlm/model_implementations/transformers/__init__.py

Whitespace-only changes.

internlm/model/modeling_baichuan2.py → internlm/model_implementations/transformers/modeling_baichuan2.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -17,7 +17,7 @@
1717
scaled_init_method_uniform,
1818
uniform_,
1919
)
20-
from internlm.model.base_model import BaseModel
20+
from internlm.model_implementations.transformers.base_model import BaseModel
2121
from internlm.model.modules.embedding import Embedding1D
2222
from internlm.model.modules.linear import new_linear
2323
from internlm.model.modules.mha import MHA

internlm/model/modeling_gemma.py → internlm/model_implementations/transformers/modeling_gemma.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -16,7 +16,7 @@
1616
scaled_init_method_uniform,
1717
uniform_,
1818
)
19-
from internlm.model.base_model import BaseModel
19+
from internlm.model_implementations.transformers.base_model import BaseModel
2020
from internlm.model.modules.embedding import Embedding1D
2121
from internlm.model.modules.linear import new_linear
2222
from internlm.model.modules.mha import GQA

internlm/model/modeling_internlm.py → internlm/model_implementations/transformers/modeling_internlm.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -15,7 +15,7 @@
1515
from internlm.core.naive_amp import set_output_attr_to_module
1616
from internlm.core.parallel.shard import partition_uniform
1717
from internlm.initialize.initialize_tensor import normal_, scaled_init_method_normal
18-
from internlm.model.base_model import BaseModel
18+
from internlm.model_implementations.transformers.base_model import BaseModel
1919
from internlm.model.modules.embedding import Embedding1D
2020
from internlm.model.modules.linear import new_linear
2121
from internlm.model.modules.mha import MHA

internlm/model/modeling_internlm2.py → internlm/model_implementations/transformers/modeling_internlm2.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -18,7 +18,7 @@
1818
scaled_init_method_uniform,
1919
uniform_,
2020
)
21-
from internlm.model.base_model import BaseModel
21+
from internlm.model_implementations.transformers.base_model import BaseModel
2222
from internlm.model.modules.embedding import Embedding1D
2323
from internlm.model.modules.linear import new_linear
2424
from internlm.model.modules.mha import GQA

internlm/model/modeling_llama.py → internlm/model_implementations/transformers/modeling_llama.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -16,7 +16,7 @@
1616
scaled_init_method_uniform,
1717
uniform_,
1818
)
19-
from internlm.model.base_model import BaseModel
19+
from internlm.model_implementations.transformers.base_model import BaseModel
2020
from internlm.model.modules.embedding import Embedding1D
2121
from internlm.model.modules.linear import new_linear
2222
from internlm.model.modules.mha import GQA

internlm/model/modeling_llava.py → internlm/model_implementations/transformers/modeling_llava.py

+2-2
Original file line number | Diff line number | Diff line change
@@ -7,10 +7,10 @@
77
from internlm.core.context.parallel_context import global_context as gpc
88
from internlm.core.naive_amp import set_output_attr_to_module
99
from internlm.initialize.initialize_tensor import normal_, uniform_
10-
from internlm.model.base_model import BaseModel
10+
from internlm.model_implementations.transformers.base_model import BaseModel
1111
from internlm.model.llava.clip_builder import build_vision_tower
1212
from internlm.model.llava.projector_builder import build_vision_projector
13-
from internlm.model.modeling_llama import Llama2Decoder
13+
from internlm.model_implementations.transformers.modeling_llama import Llama2Decoder
1414
from internlm.model.modules.embedding import Embedding1D
1515
from internlm.model.modules.linear import new_linear
1616
from internlm.model.modules.norm import new_layer_norm

internlm/model/modeling_mixtral.py → internlm/model_implementations/transformers/modeling_mixtral.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -10,7 +10,7 @@
1010
from internlm.core.context import ParallelMode
1111
from internlm.core.context.parallel_context import global_context as gpc
1212
from internlm.initialize.initialize_tensor import normal_, scaled_init_method_normal
13-
from internlm.model.base_model import BaseModel
13+
from internlm.model_implementations.transformers.base_model import BaseModel
1414
from internlm.model.modules.embedding import Embedding1D
1515
from internlm.model.modules.linear import new_linear
1616
from internlm.model.modules.mha import SWA

internlm/model/modeling_moe.py → internlm/model_implementations/transformers/modeling_moe.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -10,7 +10,7 @@
1010
from internlm.core.context import ParallelMode
1111
from internlm.core.context.parallel_context import global_context as gpc
1212
from internlm.initialize.initialize_tensor import normal_, scaled_init_method_normal
13-
from internlm.model.base_model import BaseModel
13+
from internlm.model_implementations.transformers.base_model import BaseModel
1414
from internlm.model.modules.embedding import Embedding1D
1515
from internlm.model.modules.linear import new_linear
1616
from internlm.model.modules.mha import MHA

internlm/model/modeling_qwen2.py → internlm/model_implementations/transformers/modeling_qwen2.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -16,7 +16,7 @@
1616
scaled_init_method_uniform,
1717
uniform_,
1818
)
19-
from internlm.model.base_model import BaseModel
19+
from internlm.model_implementations.transformers.base_model import BaseModel
2020
from internlm.model.modules.embedding import Embedding1D
2121
from internlm.model.modules.linear import new_linear
2222
from internlm.model.modules.mha import SWA

internlm/model/modeling_qwen2_moe.py → internlm/model_implementations/transformers/modeling_qwen2_moe.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -14,7 +14,7 @@
1414
scaled_init_method_uniform,
1515
uniform_,
1616
)
17-
from internlm.model.base_model import BaseModel
17+
from internlm.model_implementations.transformers.base_model import BaseModel
1818
from internlm.model.modules.embedding import Embedding1D
1919
from internlm.model.modules.linear import new_linear
2020
from internlm.model.modules.mha import SWA

internlm/model_inject/__init__.py

Whitespace-only changes.

0 commit comments

Comments
 (0)