Skip to content

Commit 5a2e996

Browse files
committed
fix ci
1 parent 6075d1e commit 5a2e996

12 files changed

+13 -13 lines changed

internlm/core/trainer_builder.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -17,9 +17,9 @@
1717
from internlm.data.train_state import get_train_state
1818
from internlm.eval.evaluation import evaluate_on_val_dls
1919
from internlm.initialize.initialize_trainer import initialize_trainer
20-
from internlm.model_inject.inject import inject_model
2120
from internlm.model.losses.ce_loss import InternLoss
2221
from internlm.model.metrics import AccPerplex
22+
from internlm.model_inject.inject import inject_model
2323
from internlm.monitor.monitor import send_alert_message
2424
from internlm.train.pipeline import (
2525
get_scheduler_hooks,

internlm/model_implementations/builder.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -6,12 +6,12 @@
66
from internlm.core.context import ParallelMode
77
from internlm.core.context import global_context as gpc
88
from internlm.core.parallel.shard import pipeline_parallel_sharding_wrapper
9-
from internlm.model_implementations.transformers.base_model import BaseModel
109
from internlm.model.modules.linear import (
1110
ParallelLinearWithCommExt,
1211
ScaleColumnParallelLinear,
1312
)
1413
from internlm.model_implementations.registry import model_initializer
14+
from internlm.model_implementations.transformers.base_model import BaseModel
1515
from internlm.utils.common import get_current_device
1616
from internlm.utils.lazy import LazyObject
1717
from internlm.utils.logger import get_logger

internlm/model_implementations/transformers/modeling_baichuan2.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -17,7 +17,6 @@
1717
scaled_init_method_uniform,
1818
uniform_,
1919
)
20-
from internlm.model_implementations.transformers.base_model import BaseModel
2120
from internlm.model.modules.embedding import Embedding1D
2221
from internlm.model.modules.linear import new_linear
2322
from internlm.model.modules.mha import MHA
@@ -27,6 +26,7 @@
2726
convert_attn_args_to_kwargs,
2827
convert_attn_kwargs_to_args,
2928
)
29+
from internlm.model_implementations.transformers.base_model import BaseModel
3030
from internlm.solver.activation_checkpoint import activation_checkpoint
3131
from internlm.utils.logger import get_logger
3232
from internlm.utils.storage_manager import get_fns, llm_load, llm_save

internlm/model_implementations/transformers/modeling_gemma.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -16,7 +16,6 @@
1616
scaled_init_method_uniform,
1717
uniform_,
1818
)
19-
from internlm.model_implementations.transformers.base_model import BaseModel
2019
from internlm.model.modules.embedding import Embedding1D
2120
from internlm.model.modules.linear import new_linear
2221
from internlm.model.modules.mha import GQA
@@ -26,6 +25,7 @@
2625
convert_attn_args_to_kwargs,
2726
convert_attn_kwargs_to_args,
2827
)
28+
from internlm.model_implementations.transformers.base_model import BaseModel
2929
from internlm.solver.activation_checkpoint import activation_checkpoint
3030
from internlm.utils.logger import get_logger
3131
from internlm.utils.storage_manager import get_fns, llm_load, llm_save

internlm/model_implementations/transformers/modeling_internlm.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -15,7 +15,6 @@
1515
from internlm.core.naive_amp import set_output_attr_to_module
1616
from internlm.core.parallel.shard import partition_uniform
1717
from internlm.initialize.initialize_tensor import normal_, scaled_init_method_normal
18-
from internlm.model_implementations.transformers.base_model import BaseModel
1918
from internlm.model.modules.embedding import Embedding1D
2019
from internlm.model.modules.linear import new_linear
2120
from internlm.model.modules.mha import MHA
@@ -27,6 +26,7 @@
2726
internlm1_mha_pre_load_convert,
2827
internlm1_mha_save_convert,
2928
)
29+
from internlm.model_implementations.transformers.base_model import BaseModel
3030
from internlm.solver.activation_checkpoint import activation_checkpoint
3131
from internlm.utils.logger import get_logger
3232
from internlm.utils.storage_manager import get_fns, llm_load, llm_save

internlm/model_implementations/transformers/modeling_internlm2.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -18,7 +18,6 @@
1818
scaled_init_method_uniform,
1919
uniform_,
2020
)
21-
from internlm.model_implementations.transformers.base_model import BaseModel
2221
from internlm.model.modules.embedding import Embedding1D
2322
from internlm.model.modules.linear import new_linear
2423
from internlm.model.modules.mha import GQA
@@ -29,6 +28,7 @@
2928
convert_attn_kwargs_to_args,
3029
get_parallel_size_from_file,
3130
)
31+
from internlm.model_implementations.transformers.base_model import BaseModel
3232
from internlm.solver.activation_checkpoint import activation_checkpoint
3333
from internlm.utils.logger import get_logger
3434
from internlm.utils.storage_manager import get_fns, llm_load, llm_save

internlm/model_implementations/transformers/modeling_llama.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -16,7 +16,6 @@
1616
scaled_init_method_uniform,
1717
uniform_,
1818
)
19-
from internlm.model_implementations.transformers.base_model import BaseModel
2019
from internlm.model.modules.embedding import Embedding1D
2120
from internlm.model.modules.linear import new_linear
2221
from internlm.model.modules.mha import GQA
@@ -26,6 +25,7 @@
2625
convert_attn_args_to_kwargs,
2726
convert_attn_kwargs_to_args,
2827
)
28+
from internlm.model_implementations.transformers.base_model import BaseModel
2929
from internlm.solver.activation_checkpoint import activation_checkpoint
3030
from internlm.utils.logger import get_logger
3131
from internlm.utils.storage_manager import get_fns, llm_load, llm_save

internlm/model_implementations/transformers/modeling_llava.py

+2-2
Original file line number | Diff line number | Diff line change
@@ -7,13 +7,13 @@
77
from internlm.core.context.parallel_context import global_context as gpc
88
from internlm.core.naive_amp import set_output_attr_to_module
99
from internlm.initialize.initialize_tensor import normal_, uniform_
10-
from internlm.model_implementations.transformers.base_model import BaseModel
1110
from internlm.model.llava.clip_builder import build_vision_tower
1211
from internlm.model.llava.projector_builder import build_vision_projector
13-
from internlm.model_implementations.transformers.modeling_llama import Llama2Decoder
1412
from internlm.model.modules.embedding import Embedding1D
1513
from internlm.model.modules.linear import new_linear
1614
from internlm.model.modules.norm import new_layer_norm
15+
from internlm.model_implementations.transformers.base_model import BaseModel
16+
from internlm.model_implementations.transformers.modeling_llama import Llama2Decoder
1717
from internlm.utils.logger import get_logger
1818

1919
logger = get_logger(__file__)

internlm/model_implementations/transformers/modeling_mixtral.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -10,7 +10,6 @@
1010
from internlm.core.context import ParallelMode
1111
from internlm.core.context.parallel_context import global_context as gpc
1212
from internlm.initialize.initialize_tensor import normal_, scaled_init_method_normal
13-
from internlm.model_implementations.transformers.base_model import BaseModel
1413
from internlm.model.modules.embedding import Embedding1D
1514
from internlm.model.modules.linear import new_linear
1615
from internlm.model.modules.mha import SWA
@@ -21,6 +20,7 @@
2120
convert_attn_args_to_kwargs,
2221
convert_attn_kwargs_to_args,
2322
)
23+
from internlm.model_implementations.transformers.base_model import BaseModel
2424
from internlm.solver.activation_checkpoint import activation_checkpoint
2525
from internlm.utils.logger import get_logger
2626

internlm/model_implementations/transformers/modeling_moe.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -10,7 +10,6 @@
1010
from internlm.core.context import ParallelMode
1111
from internlm.core.context.parallel_context import global_context as gpc
1212
from internlm.initialize.initialize_tensor import normal_, scaled_init_method_normal
13-
from internlm.model_implementations.transformers.base_model import BaseModel
1413
from internlm.model.modules.embedding import Embedding1D
1514
from internlm.model.modules.linear import new_linear
1615
from internlm.model.modules.mha import MHA
@@ -23,6 +22,7 @@
2322
internlm1_mha_pre_load_convert,
2423
internlm1_mha_save_convert,
2524
)
25+
from internlm.model_implementations.transformers.base_model import BaseModel
2626
from internlm.solver.activation_checkpoint import activation_checkpoint
2727
from internlm.utils.logger import get_logger
2828

internlm/model_implementations/transformers/modeling_qwen2.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -16,7 +16,6 @@
1616
scaled_init_method_uniform,
1717
uniform_,
1818
)
19-
from internlm.model_implementations.transformers.base_model import BaseModel
2019
from internlm.model.modules.embedding import Embedding1D
2120
from internlm.model.modules.linear import new_linear
2221
from internlm.model.modules.mha import SWA
@@ -26,6 +25,7 @@
2625
convert_attn_args_to_kwargs,
2726
convert_attn_kwargs_to_args,
2827
)
28+
from internlm.model_implementations.transformers.base_model import BaseModel
2929
from internlm.solver.activation_checkpoint import activation_checkpoint
3030
from internlm.utils.logger import get_logger
3131
from internlm.utils.storage_manager import get_fns, llm_load, llm_save

internlm/model_implementations/transformers/modeling_qwen2_moe.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -14,7 +14,6 @@
1414
scaled_init_method_uniform,
1515
uniform_,
1616
)
17-
from internlm.model_implementations.transformers.base_model import BaseModel
1817
from internlm.model.modules.embedding import Embedding1D
1918
from internlm.model.modules.linear import new_linear
2019
from internlm.model.modules.mha import SWA
@@ -25,6 +24,7 @@
2524
convert_attn_args_to_kwargs,
2625
convert_attn_kwargs_to_args,
2726
)
27+
from internlm.model_implementations.transformers.base_model import BaseModel
2828
from internlm.solver.activation_checkpoint import activation_checkpoint
2929
from internlm.utils.logger import get_logger
3030

0 commit comments

Comments (0)