LICENSE
README.md
pyproject.toml
nemo_automodel/__init__.py
nemo_automodel/package_info.py
nemo_automodel.egg-info/PKG-INFO
nemo_automodel.egg-info/SOURCES.txt
nemo_automodel.egg-info/dependency_links.txt
nemo_automodel.egg-info/entry_points.txt
nemo_automodel.egg-info/requires.txt
nemo_automodel.egg-info/top_level.txt
nemo_automodel/_cli/app.py
nemo_automodel/_diffusers/__init__.py
nemo_automodel/_diffusers/auto_diffusion_pipeline.py
nemo_automodel/_transformers/__init__.py
nemo_automodel/_transformers/auto_model.py
nemo_automodel/_transformers/auto_tokenizer.py
nemo_automodel/_transformers/infrastructure.py
nemo_automodel/_transformers/kernel_patches.py
nemo_automodel/_transformers/model_init.py
nemo_automodel/_transformers/registry.py
nemo_automodel/_transformers/utils.py
nemo_automodel/_transformers/tokenization/nemo_auto_tokenizer.py
nemo_automodel/_transformers/tokenization/registry.py
nemo_automodel/_transformers/tokenization/tokenization_mistral_common.py
nemo_automodel/autonvtx/__init__.py
nemo_automodel/components/__init__.py
nemo_automodel/components/_peft/__init__.py
nemo_automodel/components/_peft/lora.py
nemo_automodel/components/_peft/lora_kernel.py
nemo_automodel/components/_peft/lora_moe.py
nemo_automodel/components/_peft/module_matcher.py
nemo_automodel/components/attention/__init__.py
nemo_automodel/components/attention/flex_attention.py
nemo_automodel/components/attention/utils.py
nemo_automodel/components/checkpoint/__init__.py
nemo_automodel/components/checkpoint/_torch_backports.py
nemo_automodel/components/checkpoint/addons.py
nemo_automodel/components/checkpoint/checkpointing.py
nemo_automodel/components/checkpoint/conversion_mapping.py
nemo_automodel/components/checkpoint/state_dict_adapter.py
nemo_automodel/components/checkpoint/stateful_wrappers.py
nemo_automodel/components/checkpoint/utils.py
nemo_automodel/components/checkpoint/_backports/__init__.py
nemo_automodel/components/checkpoint/_backports/_fsspec_filesystem.py
nemo_automodel/components/checkpoint/_backports/_version.py
nemo_automodel/components/checkpoint/_backports/consolidate_hf_safetensors.py
nemo_automodel/components/checkpoint/_backports/default_planner.py
nemo_automodel/components/checkpoint/_backports/filesystem.py
nemo_automodel/components/checkpoint/_backports/hf_storage.py
nemo_automodel/components/checkpoint/_backports/hf_utils.py
nemo_automodel/components/checkpoint/_backports/planner_helpers.py
nemo_automodel/components/config/__init__.py
nemo_automodel/components/config/_arg_parser.py
nemo_automodel/components/config/loader.py
nemo_automodel/components/datasets/__init__.py
nemo_automodel/components/datasets/reservoir_sampler.py
nemo_automodel/components/datasets/utils.py
nemo_automodel/components/datasets/llm/__init__.py
nemo_automodel/components/datasets/llm/chat_dataset.py
nemo_automodel/components/datasets/llm/column_mapped_text_instruction_dataset.py
nemo_automodel/components/datasets/llm/column_mapped_text_instruction_iterable_dataset.py
nemo_automodel/components/datasets/llm/delta_lake_dataset.py
nemo_automodel/components/datasets/llm/formatting_utils.py
nemo_automodel/components/datasets/llm/hellaswag.py
nemo_automodel/components/datasets/llm/megatron_dataset.py
nemo_automodel/components/datasets/llm/mock.py
nemo_automodel/components/datasets/llm/mock_iterable_dataset.py
nemo_automodel/components/datasets/llm/mock_packed.py
nemo_automodel/components/datasets/llm/nanogpt_dataset.py
nemo_automodel/components/datasets/llm/packed_sequence.py
nemo_automodel/components/datasets/llm/retrieval_collator.py
nemo_automodel/components/datasets/llm/retrieval_dataset.py
nemo_automodel/components/datasets/llm/retrieval_dataset_inline.py
nemo_automodel/components/datasets/llm/seq_cls.py
nemo_automodel/components/datasets/llm/squad.py
nemo_automodel/components/datasets/llm/xlam.py
nemo_automodel/components/datasets/llm/megatron/Makefile
nemo_automodel/components/datasets/llm/megatron/__init__.py
nemo_automodel/components/datasets/llm/megatron/builder.py
nemo_automodel/components/datasets/llm/megatron/gpt_dataset.py
nemo_automodel/components/datasets/llm/megatron/helpers.py
nemo_automodel/components/datasets/llm/megatron/indexed_dataset.py
nemo_automodel/components/datasets/llm/megatron/megatron_utils.py
nemo_automodel/components/datasets/llm/megatron/sampler.py
nemo_automodel/components/datasets/vlm/__init__.py
nemo_automodel/components/datasets/vlm/collate_fns.py
nemo_automodel/components/datasets/vlm/datasets.py
nemo_automodel/components/datasets/vlm/utils.py
nemo_automodel/components/distributed/__init__.py
nemo_automodel/components/distributed/config.py
nemo_automodel/components/distributed/cp_utils.py
nemo_automodel/components/distributed/ddp.py
nemo_automodel/components/distributed/fsdp2.py
nemo_automodel/components/distributed/grad_utils.py
nemo_automodel/components/distributed/init_utils.py
nemo_automodel/components/distributed/megatron_fsdp.py
nemo_automodel/components/distributed/mesh.py
nemo_automodel/components/distributed/mesh_utils.py
nemo_automodel/components/distributed/optimized_tp_plans.py
nemo_automodel/components/distributed/parallel_styles.py
nemo_automodel/components/distributed/parallelizer.py
nemo_automodel/components/distributed/parallelizer_utils.py
nemo_automodel/components/distributed/tensor_utils.py
nemo_automodel/components/distributed/thd_utils.py
nemo_automodel/components/distributed/utils.py
nemo_automodel/components/distributed/pipelining/__init__.py
nemo_automodel/components/distributed/pipelining/autopipeline.py
nemo_automodel/components/distributed/pipelining/config.py
nemo_automodel/components/distributed/pipelining/functional.py
nemo_automodel/components/distributed/pipelining/hf_utils.py
nemo_automodel/components/launcher/__init__.py
nemo_automodel/components/launcher/slurm/config.py
nemo_automodel/components/launcher/slurm/template.py
nemo_automodel/components/launcher/slurm/utils.py
nemo_automodel/components/loggers/__init__.py
nemo_automodel/components/loggers/log_utils.py
nemo_automodel/components/loggers/metric_logger.py
nemo_automodel/components/loggers/mlflow_utils.py
nemo_automodel/components/loggers/wandb_utils.py
nemo_automodel/components/loss/__init__.py
nemo_automodel/components/loss/chunked_ce.py
nemo_automodel/components/loss/kd_loss.py
nemo_automodel/components/loss/linear_ce.py
nemo_automodel/components/loss/masked_ce.py
nemo_automodel/components/loss/te_parallel_ce.py
nemo_automodel/components/loss/triton/te_cross_entropy.py
nemo_automodel/components/models/__init__.py
nemo_automodel/components/models/gpt2.py
nemo_automodel/components/models/biencoder/__init__.py
nemo_automodel/components/models/biencoder/biencoder_model.py
nemo_automodel/components/models/biencoder/llama_bidirectional_model.py
nemo_automodel/components/models/biencoder/state_dict_adapter.py
nemo_automodel/components/models/common/__init__.py
nemo_automodel/components/models/common/hf_checkpointing_mixin.py
nemo_automodel/components/models/common/utils.py
nemo_automodel/components/models/common/combined_projection/__init__.py
nemo_automodel/components/models/common/combined_projection/combined_mlp.py
nemo_automodel/components/models/common/combined_projection/combined_qkv.py
nemo_automodel/components/models/common/combined_projection/state_dict_adapter.py
nemo_automodel/components/models/deepseek_v3/__init__.py
nemo_automodel/components/models/deepseek_v3/layers.py
nemo_automodel/components/models/deepseek_v3/model.py
nemo_automodel/components/models/deepseek_v3/rope_utils.py
nemo_automodel/components/models/deepseek_v3/state_dict_adapter.py
nemo_automodel/components/models/deepseek_v32/__init__.py
nemo_automodel/components/models/deepseek_v32/config.py
nemo_automodel/components/models/deepseek_v32/layers.py
nemo_automodel/components/models/deepseek_v32/model.py
nemo_automodel/components/models/deepseek_v32/state_dict_adapter.py
nemo_automodel/components/models/glm4_moe/__init__.py
nemo_automodel/components/models/glm4_moe/layers.py
nemo_automodel/components/models/glm4_moe/model.py
nemo_automodel/components/models/glm4_moe/state_dict_adapter.py
nemo_automodel/components/models/gpt_oss/__init__.py
nemo_automodel/components/models/gpt_oss/layers.py
nemo_automodel/components/models/gpt_oss/model.py
nemo_automodel/components/models/gpt_oss/rope_utils.py
nemo_automodel/components/models/gpt_oss/state_dict_adapter.py
nemo_automodel/components/models/kimi_k25_vl/__init__.py
nemo_automodel/components/models/kimi_k25_vl/model.py
nemo_automodel/components/models/kimi_k25_vl/state_dict_adapter.py
nemo_automodel/components/models/kimivl/__init__.py
nemo_automodel/components/models/kimivl/model.py
nemo_automodel/components/models/llama/__init__.py
nemo_automodel/components/models/llama/model.py
nemo_automodel/components/models/llama/rope_utils.py
nemo_automodel/components/models/llama/state_dict_adapter.py
nemo_automodel/components/models/minimax_m2/__init__.py
nemo_automodel/components/models/minimax_m2/layers.py
nemo_automodel/components/models/minimax_m2/model.py
nemo_automodel/components/models/minimax_m2/state_dict_adapter.py
nemo_automodel/components/models/mistral3/__init__.py
nemo_automodel/components/models/mistral3/model.py
nemo_automodel/components/models/nemotron_parse/__init__.py
nemo_automodel/components/models/nemotron_parse/model.py
nemo_automodel/components/models/nemotron_parse/nemotron_parse_loss.py
nemo_automodel/components/models/nemotron_v3/__init__.py
nemo_automodel/components/models/nemotron_v3/layers.py
nemo_automodel/components/models/nemotron_v3/model.py
nemo_automodel/components/models/nemotron_v3/state_dict_adapter.py
nemo_automodel/components/models/qwen2/__init__.py
nemo_automodel/components/models/qwen2/model.py
nemo_automodel/components/models/qwen2/state_dict_adapter.py
nemo_automodel/components/models/qwen3_moe/__init__.py
nemo_automodel/components/models/qwen3_moe/layers.py
nemo_automodel/components/models/qwen3_moe/model.py
nemo_automodel/components/models/qwen3_moe/state_dict_adapter.py
nemo_automodel/components/models/qwen3_next/__init__.py
nemo_automodel/components/models/qwen3_next/layers.py
nemo_automodel/components/models/qwen3_next/model.py
nemo_automodel/components/models/qwen3_next/state_dict_adapter.py
nemo_automodel/components/models/qwen3_omni_moe/__init__.py
nemo_automodel/components/models/qwen3_omni_moe/model.py
nemo_automodel/components/models/qwen3_omni_moe/state_dict_adapter.py
nemo_automodel/components/models/qwen3_vl_moe/__init__.py
nemo_automodel/components/models/qwen3_vl_moe/model.py
nemo_automodel/components/models/qwen3_vl_moe/state_dict_adapter.py
nemo_automodel/components/models/step3p5/__init__.py
nemo_automodel/components/models/step3p5/layers.py
nemo_automodel/components/models/step3p5/model.py
nemo_automodel/components/models/step3p5/state_dict_adapter.py
nemo_automodel/components/moe/__init__.py
nemo_automodel/components/moe/config.py
nemo_automodel/components/moe/experts.py
nemo_automodel/components/moe/fsdp_mixin.py
nemo_automodel/components/moe/layers.py
nemo_automodel/components/moe/parallelizer.py
nemo_automodel/components/moe/state_dict_mixin.py
nemo_automodel/components/moe/state_dict_utils.py
nemo_automodel/components/moe/megatron/__init__.py
nemo_automodel/components/moe/megatron/fused_a2a.py
nemo_automodel/components/moe/megatron/fused_indices_converter.py
nemo_automodel/components/moe/megatron/moe_utils.py
nemo_automodel/components/moe/megatron/token_dispatcher.py
nemo_automodel/components/optim/__init__.py
nemo_automodel/components/optim/scheduler.py
nemo_automodel/components/optim/utils.py
nemo_automodel/components/quantization/__init__.py
nemo_automodel/components/quantization/fp8.py
nemo_automodel/components/quantization/qat.py
nemo_automodel/components/quantization/qlora.py
nemo_automodel/components/training/__init__.py
nemo_automodel/components/training/model_output_utils.py
nemo_automodel/components/training/rng.py
nemo_automodel/components/training/signal_handler.py
nemo_automodel/components/training/step_scheduler.py
nemo_automodel/components/training/timers.py
nemo_automodel/components/training/utils.py
nemo_automodel/components/utils/__init__.py
nemo_automodel/components/utils/compile_utils.py
nemo_automodel/components/utils/flops_utils.py
nemo_automodel/components/utils/model_utils.py
nemo_automodel/components/utils/yaml_utils.py
nemo_automodel/recipes/_dist_setup.py
nemo_automodel/recipes/base_recipe.py
nemo_automodel/recipes/biencoder/__init__.py
nemo_automodel/recipes/biencoder/mine_hard_negatives.py
nemo_automodel/recipes/biencoder/train_biencoder.py
nemo_automodel/recipes/llm/benchmark.py
nemo_automodel/recipes/llm/kd.py
nemo_automodel/recipes/llm/train_ft.py
nemo_automodel/recipes/llm/train_seq_cls.py
nemo_automodel/recipes/vlm/finetune.py
nemo_automodel/shared/__init__.py
nemo_automodel/shared/import_utils.py
nemo_automodel/shared/torch_patches.py
nemo_automodel/shared/utils.py