examples/datasets/anthropic_hh.py,sha256=SVc_ZHldn6YmqV2-5G5jgnm_gYdlER3XnnunpJd1ruo,4229
examples/datasets/tldr_preference.py,sha256=pPbQXnNXTl-daKKDp0Prx9NhgXT86y6_c6oFIQg8BgU,4139
examples/datasets/tokenize_ds.py,sha256=THM32kd-6jCVmefHO6oZ_hfyZ1u77NO5NfZAwIqitvw,1559
examples/scripts/ddpo.py,sha256=QS91t3sw1voySX6C-E2e-Kqpy5s6e-M0dT7dECbxSjk,6500
examples/scripts/dpo.py,sha256=2gUU4BOgKblXat9h3iozbpLOV-L8ocIcu98WqZPSbTY,6054
examples/scripts/kto.py,sha256=6hIOeA8pcTA_dwlUsw2EcKzNfYzDlY8qJG7UF9MxXaI,3729
examples/scripts/ppo.py,sha256=D_vm_vc9T1AH5Au-3YUJ5v2mLXLfz-2dDnOAS4hSUBI,7646
examples/scripts/ppo_multi_adapter.py,sha256=wnjUJ_bT63rbVvD28SkcOHF5kFdhP6fmgQzCxXsLwZA,5261
examples/scripts/reward_modeling.py,sha256=1-bFGP-HluJjiEmiMtDou_UlQKQKp-r66FtSewvciXU,4596
examples/scripts/sft.py,sha256=jGp1BG5rnx6UmoszGc-KuLGOl9Yhf03uxz-OrgKWjho,4730
tests/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
tests/test_best_of_n_sampler.py,sha256=cpvov4JPTyR7vTVR6TL2VEieBRy8n3DKd9rvmSNaYgk,3158
tests/test_cli.py,sha256=b1iYYCsg8hiMgWN8V9YORw3gB5uaPBpVweaxXAp7gfU,1723
tests/test_core.py,sha256=VZhUKUEnYJUeAnDNXF_1Nci-fDk9gFFH23xk0QZdpm4,1545
tests/test_cpo_trainer.py,sha256=DJVumDG6dZHEchioDDtkdCMhIH_WWssB2MBy9JkNFxc,6283
tests/test_data_collator_completion_only.py,sha256=wC9ma4bcoQpQJFR3SSDW2mPcfcrOEQJuj2hrUAVVd40,5505
tests/test_dataset_formatting.py,sha256=d79wNIYDpBqbfwDIZGsV91r2rl2aOxsyfGviXw3SziE,6894
tests/test_ddpo_trainer.py,sha256=yKdl7BBT-TgMoCGPY3Bu5xkwaNjfjXsXQuR5cnGv49w,4168
tests/test_dpo_trainer.py,sha256=2LschDcXe-y7twtWNWSztNGSCNnwUJVrykp4u3n_Qx4,22515
tests/test_e2e.py,sha256=eUbrUuWkgM8KnMR1msSk-BNvovUk7JerdvjAsOh_KT0,152
tests/test_environments.py,sha256=myopLePaDu4EU2-PaB6TD_K2C1hvDNohIx5rZWqYc7U,11127
tests/test_iterative_sft_trainer.py,sha256=C-H9v4VeYUtuF2sHsteOUNMBlFOeb2gNjKgWU5QuQHU,4597
tests/test_kto_trainer.py,sha256=wNsOFJe1ndjTFnh1phUKEKZ2DweSWr6HtCMQJDvym8s,14983
tests/test_modeling_value_head.py,sha256=7N0fZxNboDFqX2iv-k6EDGgN3Tc5pJshKUMi-MNvtvw,22746
tests/test_no_peft.py,sha256=e6LgycQ7f4woUPmHBKfs3hvMbU8GCOdRvxYF14vkUB0,5560
tests/test_orpo_trainer.py,sha256=ojfPXVZ2HKY9XdC5FTJYYwkcjzRMLeXB4hvh2tD4pcs,6119
tests/test_peft_models.py,sha256=pcZ3HmT8pur78O7AhM_SCYBHEitz9vsg5nxq8rLUgac,9122
tests/test_ppo_trainer.py,sha256=LgC5N83EsdQQ09jrg0zZ4mC-1z6sXMnUY3cxgIEr5Zs,47392
tests/test_reward_trainer.py,sha256=55nwLp7hS6MMLaTZX970iuqq1MrUGFyxHoFZ3HOFJnM,13419
tests/test_rich_progress_callback.py,sha256=fbBsKmDFMYrHMVyFCE2s5erbCNUEFp1tBl0i3foxud4,1640
tests/test_sft_trainer.py,sha256=8H-1Z-lboLv33LrgW9wYYq-QIn3pXZahRPtceJ-LrB0,43099
tests/testing_constants.py,sha256=NjVJ5Q7LaQcEhbU2OIgK81fgR3H97Nuq3eW6aLPIisg,799
tests/testing_utils.py,sha256=26WvbkTM5cdJyixg837Lx9BposCY7AjEn3du3PqIJ0I,3342
tests/slow/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
tests/slow/test_dpo_slow.py,sha256=AOMlK7hA9hXyoh20b9pHehj7wkwt2jicwWRsLuwet2k,7757
tests/slow/test_sft_slow.py,sha256=x13BIbH37U7v6pMgd1PLp_UX6806n-gsK24AD4MW36E,14741
tests/slow/testing_constants.py,sha256=SvuyWUH3XLLFoBX7J7w57yLWVP0l0TlHTIjb4OKf5q8,1082
trl/__init__.py,sha256=gljfFJp0_lDWdObJPLlWzoZwFKPSZBNDPMgPdXym_do,3921
trl/core.py,sha256=mVYQfYMUlo6rOsNDZ5iXI2FHbvgFyIyL14kevRrZSWY,12148
trl/import_utils.py,sha256=f3TVdLifsO8sDljXEiTUxVUqQTcGwrFsmsktYlVAO_U,6079
trl/commands/__init__.py,sha256=cC-O6JC3_LmUQ1jnHY5Gyz2MmUC2ZAc-RmrKkMI9ku4,1207
trl/commands/cli.py,sha256=BAKnhU2eXDd01cPSTIhbes4ZgaAzpcJRIEkZxcXcABw,2367
trl/commands/cli_utils.py,sha256=HHVjUFoIt-j1L7IlXj6rWacjXj0kUCRdz1mybNL3-H4,12965
trl/commands/scripts/chat.py,sha256=RyYZYbLbBOZ7w51o4-Dscwvfz7oBrZt9wqtPrdES5uk,12612
trl/commands/scripts/cpo.py,sha256=vEYFZlWWEkshxSN3Jv9u4idVMdQWGmA3mzhIqaON6sc,4003
trl/commands/scripts/ddpo.py,sha256=QS91t3sw1voySX6C-E2e-Kqpy5s6e-M0dT7dECbxSjk,6500
trl/commands/scripts/dpo.py,sha256=2gUU4BOgKblXat9h3iozbpLOV-L8ocIcu98WqZPSbTY,6054
trl/commands/scripts/kto.py,sha256=6hIOeA8pcTA_dwlUsw2EcKzNfYzDlY8qJG7UF9MxXaI,3729
trl/commands/scripts/orpo.py,sha256=KTA4uj5C-dIndnQpajXptRIvCr6gQCVAGhPbk94u_Q0,4057
trl/commands/scripts/ppo.py,sha256=D_vm_vc9T1AH5Au-3YUJ5v2mLXLfz-2dDnOAS4hSUBI,7646
trl/commands/scripts/ppo_multi_adapter.py,sha256=wnjUJ_bT63rbVvD28SkcOHF5kFdhP6fmgQzCxXsLwZA,5261
trl/commands/scripts/reward_modeling.py,sha256=1-bFGP-HluJjiEmiMtDou_UlQKQKp-r66FtSewvciXU,4596
trl/commands/scripts/sft.py,sha256=jGp1BG5rnx6UmoszGc-KuLGOl9Yhf03uxz-OrgKWjho,4730
trl/commands/scripts/vsft_llava.py,sha256=4vqDQL1AzgJM3qWkrlHpksH7VOhkvItKT9ggFIBjRY0,7371
trl/commands/scripts/config/default_chat_config.yaml,sha256=EUJ3XAK7_YbN3EzlTqBQRov71u0BoQEmSs6-qW39kCM,487
trl/environment/__init__.py,sha256=uBxjkEmKJItWVB2I8nv1FmMU12PNVVamuN6sfGmXU6c,390
trl/environment/base_environment.py,sha256=H4O2xHvG7wVogdqNan5KpzRGf8O25hbQYSO8xIxd9cY,17569
trl/extras/__init__.py,sha256=ajCQ4__JlCJaTy-EHMowYAnRnFPuCrHaxlekGjSsLRU,971
trl/extras/best_of_n_sampler.py,sha256=Wq6ylNxpB-OYp3s761cfZWAe3IPpuArt9QzKMsPTleI,5182
trl/extras/dataset_formatting.py,sha256=FGJTuEDc8K4y2aEKXPR1rvyv0WdpDCIaL4rGOb8a22M,3646
trl/models/__init__.py,sha256=HOolk_HhpjxEWoUwVGzk4hvaHAVVifLFvECKBMy-FXw,2208
trl/models/modeling_base.py,sha256=LE34u1GXjRLQqMAtZvsKe6NVdhQmKEtdWsKjXU-i2jE,28788
trl/models/modeling_sd_base.py,sha256=YwRGCbqXLeOkPf9RTSy9rXLC14GinxblHyNFecdzFXk,27695
trl/models/modeling_value_head.py,sha256=68ageX_AUEwuol0yvlGpnVwfm6KHk0qmmwyHC_cW8BQ,18933
trl/models/sd_utils.py,sha256=EhTaUSJNwUcopoK6tcg46VJ027FwdetgYyswiJ0NG_g,5874
trl/models/utils.py,sha256=8DB4Mx51NP69ZlUoMN96NMlF-u1726OFxTSUuJ-8ab4,6026
trl/trainer/__init__.py,sha256=4b2AfcFY1WoFBUHhvAifNluxQm0UgKyv_3p52TCrBXY,3343
trl/trainer/base.py,sha256=51YAcpsjJ8ghVbfhBXcP7BT0_yXnmhj0G_zfZhl3guE,1772
trl/trainer/cpo_config.py,sha256=rYa4J1vJzC7fVw8UN9e3FwlUiHlpCpNcmjTvU4xNoPo,3875
trl/trainer/cpo_trainer.py,sha256=EgWql2d73TCD-0zl3FQ6vbyjQbNiZMj1ytJCUVA1GgI,44118
trl/trainer/ddpo_config.py,sha256=_7i0WDkISo6IXaPmizNCbq05DHdFIF8yIcryyVQ-Gcs,4891
trl/trainer/ddpo_trainer.py,sha256=pZM2pRMB61tX7WKuYx_XULwEpc9KFd8iWT8vUM_qiFc,26796
trl/trainer/dpo_trainer.py,sha256=BrETMKSwBW1iV0eJvAxaNcdRy1t52PzfETS2DEeO90I,62510
trl/trainer/iterative_sft_trainer.py,sha256=Q8nY2xBti-sxU08debOR0ywU7s-mqoT0lk_kLZjEiUw,16699
trl/trainer/kto_config.py,sha256=kZMsqu8xynEf8ZkH2D6YTVKlGMUcZmUtfXVypaQCPa0,4970
trl/trainer/kto_trainer.py,sha256=AAwW1JhfzuBL_JRSySgDa6tn66Aus1OXOxYv5n849aU,63623
trl/trainer/model_config.py,sha256=tNvO09LuaYlWkfHrYrZXRPKtD_zPSHIhs7ARq0_66Uk,3297
trl/trainer/orpo_config.py,sha256=Jd0P6XiNjIVkNMXM3fUM0_xdccyi67bUplHO4USY2Yk,3500
trl/trainer/orpo_trainer.py,sha256=oGxN47UsR0dU3BwTGACTi-JA4-s3_RQsr5UetjpIWDA,45703
trl/trainer/ppo_config.py,sha256=MNodpTmSzy7kHL9sWweNJwkGmTSOHZ3VGGJ8yP_F-Yo,8202
trl/trainer/ppo_trainer.py,sha256=wKLZOa1V3PbGOghERCA5LHKKE3o8q7S4xKHhxH8Phw0,63097
trl/trainer/reward_config.py,sha256=9WbpDsmeokMx2TG21ZEjq9AEa9XntiMvk_tRELom8Cs,1623
trl/trainer/reward_trainer.py,sha256=9JYmLvw1s-UPnYmVMaSoywi80aV90Gaev12pRf9Ld4c,14097
trl/trainer/sft_trainer.py,sha256=C7SyFFr6dit0darwWDgPKhZd3jKL6BdYJf3UWNIdxbA,27414
trl/trainer/utils.py,sha256=78C9pWMEA3YoJkLvK7Qrsij-b_uq0AGzBy9wKC8-XKA,35309
trl-0.8.2.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
trl-0.8.2.dist-info/METADATA,sha256=kgbH88pTwSYV6saa-ZZLvcRONEq91sfMon2p_GzOcVM,11914
trl-0.8.2.dist-info/WHEEL,sha256=2wepM1nk4DS4eFpYrW1TTqPcoGNfHhhO_i5m4cOimbo,92
trl-0.8.2.dist-info/entry_points.txt,sha256=yL7_8yycDPJfL0E-DhCJabQAYr4U6-pL2IfXVqomtOs,46
trl-0.8.2.dist-info/top_level.txt,sha256=TUKDSfcN6PgBU9dnJ6_YJ7qhDzZ0CKzHvHehR6GKpWg,10
trl-0.8.2.dist-info/RECORD,,
