Commit 0030d5d
- nemo/collections/audio/modules/transforms.py+173-8
- nemo/collections/llm/api.py+5
- nemo/collections/llm/gpt/data/core.py+1-1
- nemo/collections/llm/gpt/model/hyena.py+44-2
- nemo/collections/llm/gpt/model/llama_embedding.py+12
- nemo/collections/llm/gpt/model/megatron/hyena/hyena_layer_specs.py+52-62
- nemo/collections/llm/gpt/model/megatron/hyena/hyena_mixer.py+8-32
- nemo/collections/llm/gpt/model/megatron/hyena/hyena_utils.py+64-23
- nemo/collections/llm/gpt/model/megatron/hyena/te_compat.py+162
- nemo/collections/nlp/data/language_modeling/megatron/gpt_sft_dataset.py+4-1
- nemo/collections/vlm/inference/base.py+68-12
- nemo/collections/vlm/inference/qwenvl_inference_wrapper.py+87
- nemo/collections/vlm/inference/vlm_inference_controller.py+40
- nemo/lightning/pytorch/plugins/data_sampler.py+55-1
- nemo/lightning/pytorch/strategies/megatron_strategy.py+33-3
- nemo/lightning/resume.py+5-4
- nemo/utils/sequence_packing_utils.py+1-1
- requirements/manifest.json+2-2
- scripts/llm/ptq.py+4
- scripts/nlp_language_modeling/t0/merge_train_tasks.py-133
- scripts/nlp_language_modeling/t0/t0_dataset_preproc.py-179
- scripts/nlp_language_modeling/t0/tasks_splits_and_features.py-8.1k
- scripts/performance/argument_parser.py+14
- scripts/performance/diffusion/pretrain_flux_12b.py+2
- scripts/performance/helpers.py+9
- scripts/performance/llm/finetune_deepseek_v3.py+2
- scripts/performance/llm/finetune_llama31_405b.py+2
- scripts/performance/llm/finetune_llama3_70b.py+2
- scripts/performance/llm/finetune_llama3_8b.py+2
- scripts/performance/llm/finetune_llama4_e128.py+2
- scripts/performance/llm/pretrain_deepseek_v3.py+2
- scripts/performance/llm/pretrain_gpt3_175b.py+2
- scripts/performance/llm/pretrain_llama31_405b.py+2
- scripts/performance/llm/pretrain_llama3_70b.py+2
- scripts/performance/llm/pretrain_llama3_8b.py+2
- scripts/performance/llm/pretrain_llama4_e128.py+2
- scripts/performance/llm/pretrain_llama4_e16.py+2
- scripts/performance/llm/pretrain_mixtral_8x22b.py+2
- scripts/performance/llm/pretrain_mixtral_8x7b.py+2
- scripts/performance/llm/pretrain_nemotronh_47b.py+2
- scripts/performance/llm/pretrain_nemotronh_56b.py+2
- scripts/performance/llm/pretrain_nemotronh_8b.py+2
- scripts/performance/llm/pretrain_qwen3_235b_a22b.py+2
- scripts/performance/llm/pretrain_qwen3_30b_a3b.py+2
- scripts/performance/recommended_model_configs/model_configs_b200.csv+2-2
- scripts/performance/recommended_model_configs/model_configs_gb200.csv+2-2
- scripts/performance/recommended_model_configs/model_configs_h100.csv+2-2
- scripts/performance/vlm/finetune_qwen25vl_32b.py+2
- scripts/performance/vlm/finetune_qwen25vl_7b.py+2
- scripts/performance/vlm/pretrain_vlm_llama4_e128.py+2
- scripts/performance/vlm/pretrain_vlm_llama4_e16.py+2
- scripts/vlm/qwen25vl_generate.py+42-45
- tests/collections/audio/test_audio_modules_transforms.py+86
- tests/collections/llm/gpt/model/test_evo2.py+3-3
- tests/collections/llm/gpt/model/test_hyena_mixer_kernel.py+118
- tests/collections/vlm/inference/__init__.py+13
- tests/collections/vlm/inference/test_base.py+669
- tests/collections/vlm/inference/test_qwenvl_inference_wrapper.py+285
- tests/collections/vlm/inference/test_vlm_inference_controller.py+286
0 commit comments