Skip to content
Binary file not shown.
8 changes: 8 additions & 0 deletions flagscale/train/megatron/nemo_bridge/__init__.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,8 @@
# Copyright (c) 2025, BAAI. All rights reserved.
Copy link
Copy Markdown
Collaborator

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

NeMo Megatron-Bridge can be installed with pip (see https://pypi.org/project/megatron-bridge/),
so please remove the copied source code.

Copy link
Copy Markdown
Collaborator

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Rename flagscale/train/megatron/nemo_bridge to flagscale/train/megatron/bridge so that it matches the `megatron.bridge` import pattern.

#
# Mainly adapted from: https://github.com/NVIDIA-NeMo/Megatron-Bridge
"""Megatron Bridge - A component of the Megatron ecosystem."""

from megatron.nemo_bridge.models.conversion.auto_bridge import AutoBridge

# Public names of this package: only AutoBridge, imported above, is exported
# by a wildcard import.
__all__ = ["AutoBridge"]
99 changes: 99 additions & 0 deletions flagscale/train/megatron/nemo_bridge/models/__init__.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,99 @@
# Copyright (c) 2025, BAAI. All rights reserved.
#
# Copied from: https://github.com/NVIDIA-NeMo/Megatron-Bridge

from megatron.nemo_bridge.models.conversion.auto_bridge import AutoBridge
from megatron.nemo_bridge.models.conversion.mapping_registry import MegatronMappingRegistry
from megatron.nemo_bridge.models.conversion.model_bridge import MegatronModelBridge
from megatron.nemo_bridge.models.conversion.param_mapping import (
AutoMapping,
ColumnParallelMapping,
GatedMLPMapping,
MegatronParamMapping,
QKVMapping,
ReplicatedMapping,
RowParallelMapping,
)
from megatron.nemo_bridge.models.deepseek import (
DeepSeekModelProvider,
DeepSeekProvider,
DeepSeekV2LiteModelProvider,
DeepSeekV2LiteProvider,
DeepSeekV2ModelProvider,
DeepSeekV2Provider,
DeepSeekV3ModelProvider,
DeepSeekV3Provider,
MoonlightModelProvider16B,
MoonlightProvider,
)
from megatron.nemo_bridge.models.gpt_provider import GPTModelProvider
from megatron.nemo_bridge.models.qwen import (
Qwen2ModelProvider,
Qwen2ModelProvider1P5B,
Qwen2ModelProvider7B,
Qwen2ModelProvider72B,
Qwen2ModelProvider500M,
Qwen3ModelProvider,
Qwen3ModelProvider1P7B,
Qwen3ModelProvider4B,
Qwen3ModelProvider8B,
Qwen3ModelProvider14B,
Qwen3ModelProvider32B,
Qwen3ModelProvider600M,
Qwen3MoEModelProvider,
Qwen3MoEModelProvider30B_A3B,
Qwen3MoEModelProvider235B_A22B,
Qwen25ModelProvider1P5B,
Qwen25ModelProvider3B,
Qwen25ModelProvider7B,
Qwen25ModelProvider14B,
Qwen25ModelProvider32B,
Qwen25ModelProvider72B,
Qwen25ModelProvider500M,
)

# Names exported by a wildcard import of this package. Every entry is
# imported at the top of this module; the groups below follow the
# submodule each name comes from.
__all__ = [
# From the conversion subpackage (auto_bridge, mapping_registry,
# model_bridge, param_mapping).
"AutoBridge",
"MegatronMappingRegistry",
"MegatronModelBridge",
"ColumnParallelMapping",
"GatedMLPMapping",
"MegatronParamMapping",
"QKVMapping",
"ReplicatedMapping",
"RowParallelMapping",
"AutoMapping",
# From gpt_provider.
"GPTModelProvider",
# From the qwen subpackage: Qwen2*, Qwen25*, Qwen3* and Qwen3MoE* providers.
"Qwen2ModelProvider",
"Qwen2ModelProvider500M",
"Qwen2ModelProvider1P5B",
"Qwen2ModelProvider7B",
"Qwen2ModelProvider72B",
"Qwen25ModelProvider500M",
"Qwen25ModelProvider1P5B",
"Qwen25ModelProvider3B",
"Qwen25ModelProvider7B",
"Qwen25ModelProvider14B",
"Qwen25ModelProvider32B",
"Qwen25ModelProvider72B",
"Qwen3ModelProvider",
"Qwen3ModelProvider600M",
"Qwen3ModelProvider1P7B",
"Qwen3ModelProvider4B",
"Qwen3ModelProvider8B",
"Qwen3ModelProvider14B",
"Qwen3ModelProvider32B",
"Qwen3MoEModelProvider",
"Qwen3MoEModelProvider30B_A3B",
"Qwen3MoEModelProvider235B_A22B",
# From the deepseek subpackage (this import also supplies the Moonlight
# providers).
"DeepSeekModelProvider",
"DeepSeekProvider",
"DeepSeekV2LiteModelProvider",
"DeepSeekV2LiteProvider",
"DeepSeekV2ModelProvider",
"DeepSeekV2Provider",
"DeepSeekV3ModelProvider",
"DeepSeekV3Provider",
"MoonlightModelProvider16B",
"MoonlightProvider",
]
Loading
Loading