configs/__init__.py,sha256=JPftAl0UOmUEW7_01z1Ldy367-6HDQymLUtb4cB-Os0,41
configs/deepspeed/zero3_config_gpu1.json,sha256=QqbMEMySxJk1rlRXJEKzZQOMSCa-pHVbPWE2uqYtjBs,874
configs/deepspeed/zero3_config_gpu2.json,sha256=I5OWZYO3P8nJVW4u0ybNvhDDw3Gg5TRZQPGTuAEnrnM,874
configs/deepspeed/zero3_config_gpu4.json,sha256=DDYFcRPWRqW6RvavfCkz_jf9RTa7WXKM1KUnRlp4UIQ,874
configs/deepspeed/zero3_config_gpu8.json,sha256=H1AVY0lk03QSGHcfmak1zyzNNjR5DULCrcGVDCuhKk4,875
configs/evaluation/mmlu/llama3_3B_recipe.yaml,sha256=9tmiD9Scm4Alr3xxt5UtPynXXiWol3d2w2Nl9ebVDPM,851
configs/inference/llama3_3B_recipe.yaml,sha256=rzi5mD_d_pgeJf66E6KDyi6XcngEMfp67CIfyLvHtAw,2619
configs/training/dpo/llama3_3B_full_recipe.yaml,sha256=B2C55x1ttL2dfmnY0PO6dszkixA0cqtNQUaIjj7ZMPI,1464
configs/training/dpo/llama3_3B_lora_recipe.yaml,sha256=rYqG-qqUGbwu81XbKnmFOguGv0X1u0sDCb8GLkLKe98,1939
configs/training/dpo/llama3_3B_qlora_recipe.yaml,sha256=VYFAgxV8bnLSRGYWVjq4ud50LNjMWW0bj2bebQZ8qMU,2334
configs/training/grpo/llama3_3B_full_recipe.yaml,sha256=x-Gbsp4ZCT6aNV3YdYa2TKnRmm1BfkgctjSI8GZlYN4,1372
configs/training/grpo/llama3_3B_lora_recipe.yaml,sha256=1iOSMqybdFOFvQ89cDPunKl6WA1FTpfiqCX0JsZPypY,1842
configs/training/gspo/llama3_3B_full_recipe.yaml,sha256=nFBTdk1Muh4vYDUYFw3o8vSa7RCLzN_Yqvy9ghj1c-A,1896
configs/training/gspo/llama3_3B_lora_recipe.yaml,sha256=1USGxBk3TMohplGWWsteZIkx3ziANFpJvkSL8-rbrwo,2366
configs/training/ppo/llama3_3B_full_recipe.yaml,sha256=mLBL2Ab75W9EcribV4F-i69PexmdZf99M-I0bjafoSA,1757
configs/training/ppo/llama3_3B_lora_recipe.yaml,sha256=E0jyWFayKrkaEO1VN-Jf4SxLhubOeWHpBWOBJdc3Ujg,2069
configs/training/ppo/llama3_3B_qlora_recipe.yaml,sha256=NskgPhEOV6PS41-Q3EX7SANH8N2WjLCdPrpj69wt3p0,2464
configs/training/sft/llama3_3B_full_recipe.yaml,sha256=2DZI8BKGfB2r9mV0tAaLKb0I_aqSqsu5rDeyHAgVOiQ,1972
configs/training/sft/llama3_3B_lora_recipe.yaml,sha256=5B_AaGdMHj1pwPkUvQ2-KmZbfI9K5sUGyxvrp2da60Y,2440
configs/training/sft/llama3_3B_qlora_recipe.yaml,sha256=DVPLFPO2Z2arYOOgNuL2xeudy26xQdV8E1uNK73e73E,2834
core/__init__.py,sha256=ZLoFWQbRZmA7N3sNO4jhtFWK4XK39WsL9E7SGGXTbPQ,503
core/config.py,sha256=e_7j4yqdA7KYoamUBBUQBALGMhE6-GiEePkeeDVH-ko,10973
core/model_utils.py,sha256=U-LCHfJg5vp8eJg7lX6aRmtgddB-ojB9g29lwkjdQUo,5270
core/trainer_base.py,sha256=j1WLm5smbgU2IaF1rA1Sg5udbc-_a_MN5HmCQmjMw-w,10177
evaluations/README.md,sha256=4iDwuRVrcBjh6HdfsHG7qwsuYe1shFKGIkY5Ox8zeXU,2886
evaluations/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
evaluations/eval.py,sha256=rUTx7fUFEJGf2ZwFGxOdh3IcNybFCVS4I69zDGvBTvs,18345
inference/README.md,sha256=s6ZayJQ5tvbOxRxynsX04HhEsn8ZXVeYlHWb0bfaaU8,2483
inference/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
inference/inference.py,sha256=RF0nG51mi_wFIkischa-b6YcWWUXf3BlcF5hRQyEADU,17385
scripts/run_evaluation.sh,sha256=yeryJXpnu9pEdaewm2Bbc0XXSdEvNOeSgwvzxwqiZ7I,2006
scripts/run_inference.py,sha256=rtyNL-H5vDJcTuQD-ljAMxmccP3QliJJQAghC5TD7GM,2805
scripts/run_inference.sh,sha256=ZNyzkQPCHXltIeEXXsyg1RWqjeivcQw_ehsYoYTSxCI,2472
scripts/run_training.sh,sha256=5uwOfBUaho_jEIJajf280jhX1Xp4Sh2D0-NJDwzTHvA,5401
scripts/train.py,sha256=plOydOzpXC1smFo_rgIjj1f1q84JlxI3L-joWneJGZ8,11425
trainers/README.md,sha256=EnUTe7b-kVo7ZyDhNOmc16T8adFzgIoxUo2NtxVMh2o,10779
trainers/__init__.py,sha256=GRzSseIIGpqQVwXLfvunt6ruyydWxiImE6DEw6ytFuY,325
trainers/dpo_trainer.py,sha256=AsHTpTsaGh9A_xhhB0qC2KMy6Cis_Ravg3092PZahRQ,7903
trainers/grpo_trainer.py,sha256=1QhT2vFzTQx8n5J1RnEi-q3SKLGyWtGRSkR2_M5Js7I,7677
trainers/gspo_trainer.py,sha256=0A2kST0P6qpm0tKzpjpT07zmFfSrVWGyDZmx_llBUuQ,8083
trainers/ppo_trainer.py,sha256=kzG4emNqxBePPAwJ5Yxx6EOuLAqBvjGo19JAJ46Into,15897
trainers/sft_trainer.py,sha256=6fjQiHp6TjE30np3qIVHzopPNwhYRS0_DlixB8fxxyI,7254
trainers/rewards/__init__.py,sha256=1n7-T_HVBsCUh6g3VSA9kbkYZtKOxP4xcZtZN7lKS_k,138
trainers/rewards/accuracy_rewards.py,sha256=6_c5MNZXgbN_bJll6II07Jznh89TUAks2Jk47UQ10EQ,2083
trainers/rewards/format_rewards.py,sha256=YOTaHWy0Mj31KlRR8TawhDVEsq7eCQsmsPSyodFW1q8,761
trainers/templates/__init__.py,sha256=LjHvIpd2MlC5KXj-ytZeGlB6RKBdxse-SmNs5KX9Kto,210
trainers/templates/gsm8k_template.py,sha256=9eKKr7UkJgt433Wb8FGptKoetFh3oJwhieQb3rE9L_g,3367
trainers/templates/openmathinstruct_template.py,sha256=fXfdM1RjD4f4Mqb9U3mz9raJqHhqHZDkNekDydVlSNE,3167
utils/__init__.py,sha256=gdozgduqj7ezlsIAf1hAQmqyBAhEDdRypqXLZC2BKg0,218
utils/logging_utils.py,sha256=xSlc1L13L0IK5TavxfOIfnCqr1GJdbZnKPs-a7vALEM,4678
venv_deploy/share/jupyter/kernels/python3/kernel.json,sha256=69y5qspxusKKSbKfpYw86C4_UFV01AU6NtRuUi9t-kI,193
venv_deploy/share/jupyter/labextensions/@jupyter-widgets/jupyterlab-manager/install.json,sha256=e65KcDNtdaA4aZgF1mLHIhwaoIzpH9LmUueG4iJYmI0,197
venv_deploy/share/jupyter/labextensions/@jupyter-widgets/jupyterlab-manager/package.json,sha256=vmebfycAy9ffbvozQULkX7ZwWimcOH7gX3pG2PctTHE,3551
venv_deploy/share/jupyter/labextensions/@jupyter-widgets/jupyterlab-manager/schemas/@jupyter-widgets/jupyterlab-manager/plugin.json,sha256=IWNBmBm-GTATCrzha5m-Kh0Gt6H4KzGsnzcuSigjx2A,375
venv_deploy/share/jupyter/labextensions/@jupyter-widgets/jupyterlab-manager/static/third-party-licenses.json,sha256=rAEtxqfQ91D1yZL60D4LaDq1y5tR-5HE0ih2wdIEZoY,32961
fai_rl-0.1.2.dist-info/METADATA,sha256=uOWKxHGY0BRM5zzUjVI6ATeZliDvkrayQj9LYyGHmpI,6242
fai_rl-0.1.2.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
fai_rl-0.1.2.dist-info/entry_points.txt,sha256=RXIEJu9nGkumQG_SHFpjdspyBMzlzHVVmf04SIhaMN4,134
fai_rl-0.1.2.dist-info/top_level.txt,sha256=imDwC8k77PliHi5xcLMbFvG1ieVBSKzkiueFZcyxEaU,70
fai_rl-0.1.2.dist-info/RECORD,,
