README.md
pyproject.toml
setup.py
src/xlm/__init__.py
src/xlm/__main__.py
src/xlm/datamodule.py
src/xlm/external_models.py
src/xlm/flags.py
src/xlm/generative_perplexity.py
src/xlm/harness.py
src/xlm/log_predictions.py
src/xlm/metrics.py
src/xlm/model.py
src/xlm/noise.py
src/xlm/py.typed
src/xlm/version.py
src/xlm/commands/__init__.py
src/xlm/commands/cli_demo.py
src/xlm/commands/extract_model_state_dict.py
src/xlm/commands/generate_star_graphs.py
src/xlm/commands/hydra_callbacks.py
src/xlm/commands/lightning_eval.py
src/xlm/commands/lightning_generate.py
src/xlm/commands/lightning_main.py
src/xlm/commands/lightning_prepare_data.py
src/xlm/commands/lightning_train.py
src/xlm/commands/push_to_hub.py
src/xlm/commands/scaffold_model.py
src/xlm/commands/split_owt.py
src/xlm/commands/train_tokenizer.py
src/xlm/configs/common/cluster/unity_default.yaml
src/xlm/configs/common/cluster/unity_gypsum.yaml
src/xlm/configs/common/hydra/default.yaml
src/xlm/configs/common/hydra/callbacks/dynamic_help.yaml
src/xlm/configs/common/hydra/help/xlm.yaml
src/xlm/configs/common/paths/default.yaml
src/xlm/configs/lightning_train/config.yaml
src/xlm/configs/lightning_train/callbacks/checkpoint_every_n_steps_with_thinning.yaml
src/xlm/configs/lightning_train/callbacks/checkpoint_monitor.yaml
src/xlm/configs/lightning_train/callbacks/debug.yaml
src/xlm/configs/lightning_train/callbacks/debug_small_data.yaml
src/xlm/configs/lightning_train/callbacks/debug_v2.yaml
src/xlm/configs/lightning_train/callbacks/default.yaml
src/xlm/configs/lightning_train/callbacks/default_v2.yaml
src/xlm/configs/lightning_train/callbacks/ema.yaml
src/xlm/configs/lightning_train/callbacks/file_friendly_progress_bar.yaml
src/xlm/configs/lightning_train/callbacks/learning_rate_monitor.yaml
src/xlm/configs/lightning_train/callbacks/log_gradients_to_tensorboard.yaml
src/xlm/configs/lightning_train/callbacks/on_exception_checkpoint.yaml
src/xlm/configs/lightning_train/callbacks/print_batch.yaml
src/xlm/configs/lightning_train/callbacks/print_batch_v2.yaml
src/xlm/configs/lightning_train/callbacks/speed_monitor.yaml
src/xlm/configs/lightning_train/callbacks/unconditional_samples.yaml
src/xlm/configs/lightning_train/datamodule/default.yaml
src/xlm/configs/lightning_train/datamodule/lm1b.yaml
src/xlm/configs/lightning_train/datamodule/owt.yaml
src/xlm/configs/lightning_train/datasets/default_text.yaml
src/xlm/configs/lightning_train/datasets/lm1b_test.yaml
src/xlm/configs/lightning_train/datasets/lm1b_train.yaml
src/xlm/configs/lightning_train/datasets/owt_test.yaml
src/xlm/configs/lightning_train/datasets/owt_train.yaml
src/xlm/configs/lightning_train/datasets/owt_val.yaml
src/xlm/configs/lightning_train/datasets/star.yaml
src/xlm/configs/lightning_train/datasets/star_easy_test.yaml
src/xlm/configs/lightning_train/datasets/star_easy_test_pred.yaml
src/xlm/configs/lightning_train/datasets/star_easy_train.yaml
src/xlm/configs/lightning_train/datasets/star_easy_val.yaml
src/xlm/configs/lightning_train/datasets/star_easy_val_pred.yaml
src/xlm/configs/lightning_train/datasets/star_hard_test.yaml
src/xlm/configs/lightning_train/datasets/star_hard_test_pred.yaml
src/xlm/configs/lightning_train/datasets/star_hard_train.yaml
src/xlm/configs/lightning_train/datasets/star_hard_val.yaml
src/xlm/configs/lightning_train/datasets/star_hard_val_pred.yaml
src/xlm/configs/lightning_train/datasets/star_medium_test.yaml
src/xlm/configs/lightning_train/datasets/star_medium_test_pred.yaml
src/xlm/configs/lightning_train/datasets/star_medium_train.yaml
src/xlm/configs/lightning_train/datasets/star_medium_val.yaml
src/xlm/configs/lightning_train/datasets/star_medium_val_pred.yaml
src/xlm/configs/lightning_train/datasets/sudoku_train.yaml
src/xlm/configs/lightning_train/datasets/sudoku_val.yaml
src/xlm/configs/lightning_train/datasets/sudoku_val_pred.yaml
src/xlm/configs/lightning_train/datasets/text_uncoditional_prediction.yaml
src/xlm/configs/lightning_train/debug/eval_unconditional_preds.yaml
src/xlm/configs/lightning_train/debug/multinode.yaml
src/xlm/configs/lightning_train/debug/no_dl_workers.yaml
src/xlm/configs/lightning_train/debug/overfit.yaml
src/xlm/configs/lightning_train/debug/print_predictions.yaml
src/xlm/configs/lightning_train/debug/profile_single_node.yaml
src/xlm/configs/lightning_train/debug/small_data.yaml
src/xlm/configs/lightning_train/experiment/gpt2_generative_perplexity.yaml
src/xlm/configs/lightning_train/generative_perplexity/gpt2-large.yaml
src/xlm/configs/lightning_train/generative_perplexity/gpt2-small.yaml
src/xlm/configs/lightning_train/generative_perplexity/llama3_3B.yaml
src/xlm/configs/lightning_train/loggers/debug.yaml
src/xlm/configs/lightning_train/loggers/default.yaml
src/xlm/configs/lightning_train/loggers/tensorboard.yaml
src/xlm/configs/lightning_train/loggers/wandb.yaml
src/xlm/configs/lightning_train/metrics/accumulated_loss.yaml
src/xlm/configs/lightning_train/metrics/exact_match.yaml
src/xlm/configs/lightning_train/metrics/seq2seq_exact_match.yaml
src/xlm/configs/lightning_train/metrics/seq2seq_length_loss.yaml
src/xlm/configs/lightning_train/metrics/seq2seq_token_accuracy.yaml
src/xlm/configs/lightning_train/metrics/seq2seq_token_ce.yaml
src/xlm/configs/lightning_train/metrics/token_accuracy.yaml
src/xlm/configs/lightning_train/model/rotary_transformer.yaml
src/xlm/configs/lightning_train/model/rotary_transformer_xtiny2.yaml
src/xlm/configs/lightning_train/noise_schedule/dummy.yaml
src/xlm/configs/lightning_train/trainer_strategy/cpu.yaml
src/xlm/configs/lightning_train/trainer_strategy/ddp.yaml
src/xlm/configs/lightning_train/trainer_strategy/ddp_multinode.yaml
src/xlm/configs/lightning_train/trainer_strategy/ddp_multinode_no_hooks.yaml
src/xlm/configs/lightning_train/trainer_strategy/single_device.yaml
src/xlm/configs/slurm/generate_sbatch.yaml
src/xlm/configs/slurm/train_sbatch.yaml
src/xlm/configs/slurm/hardware/1_node_1_gpu.yaml
src/xlm/configs/slurm/hardware/ddp_2_node_1_gpu_debug.yaml
src/xlm/configs/slurm/hardware/ddp_4_node_1_gpu.yaml
src/xlm/configs/slurm/hardware/ddp_8_node_1_gpu.yaml
src/xlm/modules/__init__.py
src/xlm/modules/ddit_simple.py
src/xlm/modules/ddit_simple_v2.py
src/xlm/modules/encoder.py
src/xlm/modules/gpt2_transformer.py
src/xlm/modules/position.py
src/xlm/modules/rotary_transformer.py
src/xlm/tasks/__init__.py
src/xlm/tasks/lm1b.py
src/xlm/tasks/owt.py
src/xlm/tasks/star.py
src/xlm/tasks/star_old.py
src/xlm/tasks/sudoku.py
src/xlm/utils/__init__.py
src/xlm/utils/batch_size.py
src/xlm/utils/checkpoint_with_thinning.py
src/xlm/utils/data.py
src/xlm/utils/ddp.py
src/xlm/utils/debug.py
src/xlm/utils/ema.py
src/xlm/utils/file_friendly_progress_callback.py
src/xlm/utils/imports.py
src/xlm/utils/nn.py
src/xlm/utils/omegaconf_resolvers.py
src/xlm/utils/on_exception_checkpoint.py
src/xlm/utils/os.py
src/xlm/utils/rank_zero.py
src/xlm/utils/rich_utils.py
src/xlm/utils/saving_utils.py
src/xlm/utils/seed.py
src/xlm/utils/signal.py
src/xlm/utils/slurm.py
src/xlm/utils/speed_monitor_callback.py
src/xlm/utils/tqdm.py
src/xlm/utils/wandb.py
src/xlm_core.egg-info/PKG-INFO
src/xlm_core.egg-info/SOURCES.txt
src/xlm_core.egg-info/dependency_links.txt
src/xlm_core.egg-info/entry_points.txt
src/xlm_core.egg-info/requires.txt
src/xlm_core.egg-info/top_level.txt