Skip to content
Open
Show file tree
Hide file tree
Changes from 1 commit
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Binary file not shown.
8 changes: 8 additions & 0 deletions flagscale/train/megatron/nemo_bridge/__init__.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,8 @@
# Copyright (c) 2025, BAAI. All rights reserved.
Copy link
Collaborator

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

NeMo Megatron-Bridge can be installed with pip (see https://pypi.org/project/megatron-bridge/).
Please remove the source code from this PR.

Copy link
Collaborator

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Rename flagscale/train/megatron/nemo_bridge to flagscale/train/megatron/bridge so that imports match the upstream `from megatron.bridge import ...` pattern.

#
# Mainly adapted from: https://github.com/NVIDIA-NeMo/Megatron-Bridge
"""Megatron Bridge - A component of the Megatron ecosystem."""

from megatron.nemo_bridge.models.conversion.auto_bridge import AutoBridge

# Names exported by `from <package> import *`; only AutoBridge is re-exported here.
__all__ = ["AutoBridge"]
99 changes: 99 additions & 0 deletions flagscale/train/megatron/nemo_bridge/models/__init__.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,99 @@
# Copyright (c) 2025, BAAI. All rights reserved.
#
# Copied from: https://github.com/NVIDIA-NeMo/Megatron-Bridge

from megatron.nemo_bridge.models.conversion.auto_bridge import AutoBridge
from megatron.nemo_bridge.models.conversion.mapping_registry import MegatronMappingRegistry
from megatron.nemo_bridge.models.conversion.model_bridge import MegatronModelBridge
from megatron.nemo_bridge.models.conversion.param_mapping import (
AutoMapping,
ColumnParallelMapping,
GatedMLPMapping,
MegatronParamMapping,
QKVMapping,
ReplicatedMapping,
RowParallelMapping,
)
from megatron.nemo_bridge.models.deepseek import (
DeepSeekModelProvider,
DeepSeekProvider,
DeepSeekV2LiteModelProvider,
DeepSeekV2LiteProvider,
DeepSeekV2ModelProvider,
DeepSeekV2Provider,
DeepSeekV3ModelProvider,
DeepSeekV3Provider,
MoonlightModelProvider16B,
MoonlightProvider,
)
from megatron.nemo_bridge.models.gpt_provider import GPTModelProvider
from megatron.nemo_bridge.models.qwen import (
Qwen2ModelProvider,
Qwen2ModelProvider1P5B,
Qwen2ModelProvider7B,
Qwen2ModelProvider72B,
Qwen2ModelProvider500M,
Qwen3ModelProvider,
Qwen3ModelProvider1P7B,
Qwen3ModelProvider4B,
Qwen3ModelProvider8B,
Qwen3ModelProvider14B,
Qwen3ModelProvider32B,
Qwen3ModelProvider600M,
Qwen3MoEModelProvider,
Qwen3MoEModelProvider30B_A3B,
Qwen3MoEModelProvider235B_A22B,
Qwen25ModelProvider1P5B,
Qwen25ModelProvider3B,
Qwen25ModelProvider7B,
Qwen25ModelProvider14B,
Qwen25ModelProvider32B,
Qwen25ModelProvider72B,
Qwen25ModelProvider500M,
)

# Names exported by `from <package> import *`. Every entry corresponds to a
# name imported at the top of this module; entries are grouped below by the
# submodule they are imported from.
__all__ = [
# Conversion entry points (models.conversion.auto_bridge / mapping_registry / model_bridge).
"AutoBridge",
"MegatronMappingRegistry",
"MegatronModelBridge",
# Parameter mapping classes (models.conversion.param_mapping).
"ColumnParallelMapping",
"GatedMLPMapping",
"MegatronParamMapping",
"QKVMapping",
"ReplicatedMapping",
"RowParallelMapping",
"AutoMapping",
# Provider imported from models.gpt_provider.
"GPTModelProvider",
# Providers imported from models.qwen.
"Qwen2ModelProvider",
"Qwen2ModelProvider500M",
"Qwen2ModelProvider1P5B",
"Qwen2ModelProvider7B",
"Qwen2ModelProvider72B",
"Qwen25ModelProvider500M",
"Qwen25ModelProvider1P5B",
"Qwen25ModelProvider3B",
"Qwen25ModelProvider7B",
"Qwen25ModelProvider14B",
"Qwen25ModelProvider32B",
"Qwen25ModelProvider72B",
"Qwen3ModelProvider",
"Qwen3ModelProvider600M",
"Qwen3ModelProvider1P7B",
"Qwen3ModelProvider4B",
"Qwen3ModelProvider8B",
"Qwen3ModelProvider14B",
"Qwen3ModelProvider32B",
"Qwen3MoEModelProvider",
"Qwen3MoEModelProvider30B_A3B",
"Qwen3MoEModelProvider235B_A22B",
# Providers imported from models.deepseek (this import also supplies the Moonlight names).
"DeepSeekModelProvider",
"DeepSeekProvider",
"DeepSeekV2LiteModelProvider",
"DeepSeekV2LiteProvider",
"DeepSeekV2ModelProvider",
"DeepSeekV2Provider",
"DeepSeekV3ModelProvider",
"DeepSeekV3Provider",
"MoonlightModelProvider16B",
"MoonlightProvider",
]
Loading
Loading