Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 0 additions & 1 deletion .github/workflows/cicd-main.yml
Original file line number Diff line number Diff line change
Expand Up @@ -399,7 +399,6 @@ jobs:
- script: L2_Launch_recipes_llama_1b
- script: L2_Launch_recipes_llama_3b
- script: L2_Launch_recipes_llama_distill
- script: L2_Launch_recipes_mamba
- script: L2_Launch_recipes_nemotronh
- script: L2_Launch_recipes_qwen
- script: L2_Launch_data
Expand Down
2 changes: 1 addition & 1 deletion docs/nemo2-migration-guide.md
Original file line number Diff line number Diff line change
Expand Up @@ -26,7 +26,7 @@ Megatron Bridge offers model providers that directly map to NeMo 2.0 model confi
### Supported Model Families

Megatron Bridge supports the following model families with preset providers:
- - **Base Models**: `GPTModelProvider`, `T5ModelProvider`, `MambaProvider`
+ - **Base Models**: `GPTModelProvider`, `T5ModelProvider`, `MambaModelProvider`
- **Llama**: Llama2, Llama3, Llama3.1, Llama3.2, CodeLlama, Llama4
- **Qwen**: Qwen2, Qwen2.5, Qwen3, Qwen3MoE, Qwen2.5VL
- **DeepSeek**: DeepSeek, DeepSeekV2, DeepSeekV2Lite, DeepSeekV3, Moonlight
Expand Down
34 changes: 1 addition & 33 deletions src/megatron/bridge/models/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -105,24 +105,7 @@
LlamaNemotronBridge,
LlamaNemotronHeterogeneousProvider,
)
- from megatron.bridge.models.mamba.mamba_provider import (
- MambaModelProvider,
- MambaModelProvider1P3B,
- MambaModelProvider2P7B,
- MambaModelProvider130M,
- MambaModelProvider370M,
- MambaModelProvider780M,
- MambaProvider,
- MambaProvider1_3B,
- MambaProvider2_7B,
- MambaProvider130M,
- MambaProvider370M,
- MambaProvider780M,
- NVIDIAMambaHybridModelProvider8B,
- NVIDIAMambaHybridProvider8B,
- NVIDIAMambaModelProvider8B,
- NVIDIAMambaProvider8B,
- )
+ from megatron.bridge.models.mamba.mamba_provider import MambaModelProvider
from megatron.bridge.models.ministral3 import (
Ministral3Bridge,
Ministral3Model,
Expand Down Expand Up @@ -327,21 +310,6 @@
"NemotronNano9Bv2Provider",
"NemotronNano12Bv2Provider",
"MambaModelProvider",
- "MambaModelProvider1P3B",
- "MambaModelProvider2P7B",
- "MambaModelProvider130M",
- "MambaModelProvider370M",
- "MambaModelProvider780M",
- "NVIDIAMambaHybridModelProvider8B",
- "NVIDIAMambaModelProvider8B",
- "MambaProvider",
- "MambaProvider1_3B",
- "MambaProvider2_7B",
- "MambaProvider130M",
- "MambaProvider370M",
- "MambaProvider780M",
- "NVIDIAMambaHybridProvider8B",
- "NVIDIAMambaProvider8B",
# Nemotron Models
"NemotronBridge",
"NemotronModelProvider",
Expand Down
34 changes: 1 addition & 33 deletions src/megatron/bridge/models/mamba/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -12,41 +12,9 @@
# See the License for the specific language governing permissions and
# limitations under the License.

- from megatron.bridge.models.mamba.mamba_provider import (
- MambaModelProvider,
- MambaModelProvider1P3B,
- MambaModelProvider2P7B,
- MambaModelProvider130M,
- MambaModelProvider370M,
- MambaModelProvider780M,
- MambaProvider,
- MambaProvider1_3B,
- MambaProvider2_7B,
- MambaProvider130M,
- MambaProvider370M,
- MambaProvider780M,
- NVIDIAMambaHybridModelProvider8B,
- NVIDIAMambaHybridProvider8B,
- NVIDIAMambaModelProvider8B,
- NVIDIAMambaProvider8B,
- )
+ from megatron.bridge.models.mamba.mamba_provider import MambaModelProvider


__all__ = [
"MambaModelProvider",
- "MambaModelProvider1P3B",
- "MambaModelProvider2P7B",
- "MambaModelProvider130M",
- "MambaModelProvider370M",
- "MambaModelProvider780M",
- "NVIDIAMambaHybridModelProvider8B",
- "NVIDIAMambaModelProvider8B",
- "MambaProvider",
- "MambaProvider1_3B",
- "MambaProvider2_7B",
- "MambaProvider130M",
- "MambaProvider370M",
- "MambaProvider780M",
- "NVIDIAMambaHybridProvider8B",
- "NVIDIAMambaProvider8B",
]
Loading
Loading