Commit 6fa2609
Submodule Megatron-Bridge updated 78 files
- .github/workflows/_update_dependencies.yml+3-3
- .github/workflows/build-test-publish-wheel.yml+1-1
- .github/workflows/config/.secrets.baseline+10-1
- .main.commit+1-1
- 3rdparty/Megatron-LM+1-1
- AGENTS.md+96
- README.md+3-1
- docker/Dockerfile.fw_final+1-1
- docs/index.md+1
- docs/modelopt/quantization.md+1-1
- docs/releases/README.md+1
- docs/releases/release-process.md+85
- docs/training/peft.md+4-4
- examples/conversion/hf_megatron_roundtrip_multi_gpu.py+70-12
- examples/evaluation/utils/executors.py+12-1
- examples/models/bailing/README.md+72
- examples/models/bailing/conversion.sh+43
- examples/models/bailing/inference.sh+42
- examples/quantization/conf/quantized_llama3_8b_pretrain_override_example.yaml+2-1
- examples/quantization/quantize.py+9-1
- pyproject.toml+4-2
- ruff.toml+2
- scripts/performance/README.md+42-1
- scripts/performance/argument_parser.py+16-1
- scripts/performance/configs/llama/llama3_workload_base_configs.py+8-2
- scripts/performance/configs/nemotronh/nemotron_3_llm_pretrain.py+16-6
- scripts/performance/configs/nemotronh/nemotron_3_workload_base_configs.py+18-44
- scripts/performance/configs/nemotronh/te_quant.cfg+35
- scripts/performance/configs/qwen/qwen3_llm_pretrain.py+15-21
- scripts/performance/configs/qwen/qwen3_workload_base_configs.py+29-29
- scripts/performance/perf_plugins.py+20-9
- scripts/performance/setup_experiment.py+53-16
- scripts/performance/utils/executors.py+20-10
- scripts/performance/utils/overrides.py+9-6
- skills/adding-model-support/recipe-patterns.md+4-7
- src/megatron/bridge/__init__.py+1
- src/megatron/bridge/inference/vlm/base.py+16-13
- src/megatron/bridge/inference/vlm/qwenvl_inference_wrapper.py+43-9
- src/megatron/bridge/inference/vlm/vlm_engine.py+2-2
- src/megatron/bridge/inference/vlm/vlm_inference_controller.py+24-15
- src/megatron/bridge/models/__init__.py+4
- src/megatron/bridge/models/bailing/__init__.py+21
- src/megatron/bridge/models/bailing/bailing_moe2_bridge.py+229
- src/megatron/bridge/models/bailing/configuration_bailing_moe_v2.py+113
- src/megatron/bridge/models/bailing/modeling_bailing_moe_v2.py+1.6k
- src/megatron/bridge/models/conversion/auto_bridge.py+5-8
- src/megatron/bridge/models/gpt_oss/gpt_oss_bridge.py+2-10
- src/megatron/bridge/models/kimi_vl/kimi_k25_vl_bridge.py+6-1
- src/megatron/bridge/models/kimi_vl/utils.py+5-4
- src/megatron/bridge/package_info.py+19-1
- src/megatron/bridge/training/callbacks.py+12
- src/megatron/bridge/training/checkpointing.py+1-5
- src/megatron/bridge/training/config.py+9
- src/megatron/bridge/training/initialize.py+1
- src/megatron/bridge/training/post_training/checkpointing.py+1-1
- src/megatron/bridge/training/pretrain.py+1-1
- src/megatron/bridge/training/setup.py+19
- src/megatron/bridge/training/state.py+28-4
- src/megatron/bridge/training/train.py+1
- src/megatron/bridge/training/utils/train_utils.py+5-1
- tests/functional_tests/inference/test_vlm_inference.py+81
- tests/functional_tests/launch_scripts/active/L0_Launch_models_bailing.sh+23
- tests/functional_tests/launch_scripts/active/L0_Launch_vlm_inference.sh+24
- tests/functional_tests/test_groups/models/bailing/__init__.py+13
- tests/functional_tests/test_groups/models/bailing/test_bailing_moe2_conversion.py+201
- tests/functional_tests/test_groups/models/gpt_oss/test_gpt_oss_conversion.py+10
- tests/functional_tests/test_groups/recipes/test_gpt_oss_recipes_finetune.py+8
- tests/functional_tests/test_groups/recipes/test_perf_config_integration.py+10
- tests/unit_tests/inference/vlm/test_base.py+19-1
- tests/unit_tests/inference/vlm/test_qwenvl_inference_wrapper.py+37-2
- tests/unit_tests/models/test_auto_bridge.py+9-7
- tests/unit_tests/scripts/performance/test_executors.py+68
- tests/unit_tests/scripts/test_performance_offline_mode.py+203
- tests/unit_tests/training/test_callbacks.py+2
- tests/unit_tests/training/test_checkpointing.py+1
- tests/unit_tests/training/test_state.py+12-7
- tests/unit_tests/training/utils/test_train_utils.py+108
- uv.lock+622-224
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
56 | 56 | | |
57 | 57 | | |
58 | 58 | | |
59 | | - | |
| 59 | + | |
60 | 60 | | |
61 | 61 | | |
62 | 62 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
497 | 497 | | |
498 | 498 | | |
499 | 499 | | |
500 | | - | |
| 500 | + | |
501 | 501 | | |
502 | 502 | | |
503 | 503 | | |
| |||
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.
0 commit comments