tests/slow/__init__.py,sha256=HnL_He_PiCx-HneCtjrS23wrXSWzA8DI1AjVaBb0Q5U,612
tests/slow/test_dpo_slow.py,sha256=YC09gO1ab21BCp_8ZVwtgZPfI455hLPXYfsHkl8PzmQ,7933
tests/slow/test_sft_slow.py,sha256=7osR0peYVWNiWwqLW9klDfiluwL-OSQV3HLT7T6Rbn4,15724
tests/slow/testing_constants.py,sha256=9EEKDsVxlW2WgvK4-kpcdfHci0WA8WmsBDruL4zH4fY,1077
trl/__init__.py,sha256=Dg1fmVkBxXL7Lgar6RveGrSeGUksHup5IuM86ZYnoKs,6211
trl/core.py,sha256=mLs1VB7gzP1w-NllOyYFsLj59b9n1pFtY3kENgG__WM,11388
trl/data_utils.py,sha256=Dh-nEkgCrCuh5vg7BYonllMeqXnfe8r0oL-lk87Zdu0,16667
trl/env_utils.py,sha256=56zu6hKknW6p7sQoNbEu0Xcb8qgJJN2GSu8gOiBsxb4,1394
trl/import_utils.py,sha256=uB7qhgTKvBSgksvYKEFRVbsutQM5a5XTWQrZVypwxTY,4149
trl/utils.py,sha256=8FVSHNZsU8kupkBrWvQrZ5kQmpHJRK1HnCkmHALvIlI,1813
trl/commands/__init__.py,sha256=WVN3lzmCA1_KrCtmeWno7lj0yvZwo6AmE80rznyqLjg,1124
trl/commands/cli.py,sha256=_Z1KZ2gltzc99lx4GSims0Zyko6vj5rCR6fPdLSSfh0,5591
trl/commands/cli_utils.py,sha256=dljcqriYx3YVRYtOJaQGOfmM1srf9yP3y43A_tk7GiQ,11440
trl/commands/scripts/alignprop.py,sha256=NJHwI0ksD1OYTJBNOAWVi0q1hL_xsdFLdwKwdENXtsA,4246
trl/commands/scripts/bco.py,sha256=91jY7AkQCWGBCbhzz7WrR0oTVj4025nGwo5xwrD-w4M,5888
trl/commands/scripts/chat.py,sha256=mOD3zda5_bA_tiTOmffSR4PkRrGZ8_lckZx8FVQbydk,13313
trl/commands/scripts/cpo.py,sha256=FxGME50kZDarLQjNkC9x0poeg_zKZ8Nj1VhR9OnUYkc,3495
trl/commands/scripts/ddpo.py,sha256=N9NjtzxLMurxlOJHuE6LKQM5QFhqtwzXIcF7VC7IGDQ,6712
trl/commands/scripts/dpo.py,sha256=pgO4YuIYylV1U-yVkEnF35QLx3RCrfbdb36gGVEYqHE,4651
trl/commands/scripts/dpo_online.py,sha256=kdzS7avE5z-bnhllxoZkKLS9mDjyyl0Fh6pnMoDYF6M,5363
trl/commands/scripts/dpo_vlm.py,sha256=gIWREYlVMdvIpMDKiV5HqgfJK3DedYnov5ZUVrX0xTA,5089
trl/commands/scripts/gkd.py,sha256=Fznlima0N8I8eUwkkzR3Q97fz2BuSMyxmdVUPlsHWGA,4965
trl/commands/scripts/kto.py,sha256=FXkSIdCQkUaDOlboC6gd-miUxyWPSR4W3Tpo07INEiA,3688
trl/commands/scripts/nash_md.py,sha256=eOH4No7II514FyXroBxv2oJ_8O6qCz3028sLHBszVnc,5242
trl/commands/scripts/orpo.py,sha256=OsDLTumwI3r8fkxNxvyfcsIpW9tVTUpz9-mnyplBVXE,3584
trl/commands/scripts/reward_modeling.py,sha256=yLEXMrZKwvXvWe2pggWrgT62QthjMH_WyfY4Z6QSgWs,4740
trl/commands/scripts/sft.py,sha256=DWY2nxYFEOinQwSNniiO6hanKRDWq7A7yeZErBAhjYg,3557
trl/commands/scripts/sft_vlm.py,sha256=F5lRvkXGezCzrguPxyQ0XeJXS1nt-71ftBLO7pln1_8,4976
trl/commands/scripts/xpo.py,sha256=an2inNYMCM2ONZ7QlQa0fLz4EFO0sOYocKh9ANXOBYg,4671
trl/commands/scripts/config/default_chat_config.yaml,sha256=EUJ3XAK7_YbN3EzlTqBQRov71u0BoQEmSs6-qW39kCM,487
trl/environment/__init__.py,sha256=L8-K4ielg0XYKUuX1cqRD7bP_yk8pnkNBHPLBtj1C78,989
trl/environment/base_environment.py,sha256=zxzLozfVLrtkwzl0VHp43GL9yFM8M9OijuEUWX9Wv44,17569
trl/extras/__init__.py,sha256=X0_tV0qLoXz5yky5kRsAu3oItzgpNwjL1TcuhHHOFk0,956
trl/extras/best_of_n_sampler.py,sha256=_4e5fxo4YmeuyfgHVWuoVL2udfHoN0Ay7FI9b5PIhfo,5794
trl/extras/dataset_formatting.py,sha256=RCv-AEJ0d6AjlxwhhAwUdMkdJ4j_cnTn7U5aQk-qAZY,4258
trl/models/__init__.py,sha256=2AAT1Sijo3-854Mwhz7mMuWOb2XORjLFi_Zf-AiXTN4,2236
trl/models/auxiliary_modules.py,sha256=cjT5yEa6FPg9Sm7Ocz5oDOk_OXQx04n1hLC7cfrkh5U,3337
trl/models/modeling_base.py,sha256=8A2JGpra8Y2vgdd8dlo9mBcQKCA39T2smbAwCIFh9XU,30859
trl/models/modeling_sd_base.py,sha256=Zu0jDIc9HXB0v9YO7ym8WCn6sdLUHzBGTQN-NiA8QS0,42320
trl/models/modeling_value_head.py,sha256=LWa-hhoxkBni99Kr9rL-9E7oi4bWXlXDGttgE6BN8F4,19381
trl/models/sd_utils.py,sha256=g2eTiZwrffwzzFYQYLFvrBDIoUoiTUI9MSpCXwrY4to,5873
trl/models/utils.py,sha256=9QZd1NDaeOnhQhv3cu2ybD1mBbIi8u6oys0q03Ekro8,7477
trl/templates/lm_model_card.md,sha256=W2EnvqdDDbfCQUQLxHTjB3D8u-lvg6yq4mbLQXgOmKM,1958
trl/trainer/__init__.py,sha256=kNet1V1aqjg4U7Jeem98A0VE1ql2Xyq3Y2XpE0UATS8,5454
trl/trainer/alignprop_config.py,sha256=mAxEpRKvWQ6Vmn36B5xLm8tTa6ps64-UbN8Wa1_JEcY,7384
trl/trainer/alignprop_trainer.py,sha256=bTI9lpGPDUCMlGWv4SvDhJztW2kh49igUY1dZieBpDk,18236
trl/trainer/base.py,sha256=51YAcpsjJ8ghVbfhBXcP7BT0_yXnmhj0G_zfZhl3guE,1772
trl/trainer/bco_config.py,sha256=V4rYJiRYd-vQS27uTz-OA9_DZOoBEga0mK6c14DGuwo,5073
trl/trainer/bco_trainer.py,sha256=Mv72muvZ0fr9dw4bw-LQiAD5xDljhgre1CWqArhQZW4,72482
trl/trainer/callbacks.py,sha256=HTJyhPG4Iwhq9lNWNdNCbsbsv6NZsTZOUCYEP4VdOok,19144
trl/trainer/cpo_config.py,sha256=7VIlLdcf0jr2RCkni23T51ryq6ucHjzmv0or6_HdQa8,5556
trl/trainer/cpo_trainer.py,sha256=Wy1cBx629EN79NLBtsW-uWCyAzSIaDMBikdSWMwnK0M,49699
trl/trainer/ddpo_config.py,sha256=fT72Yeq_61LDgPTvSrkG0XgxPjNlQoXtBLy0zPk6U7k,8583
trl/trainer/ddpo_trainer.py,sha256=ElOkIUC5844t_dhqDCggxvjshpCand_rRQlL5VJGiPc,27926
trl/trainer/dpo_config.py,sha256=gOKJkU74GbZuuwXdwCkVuR7_JOWgbjI4LO_w-Whi-ek,11385
trl/trainer/dpo_trainer.py,sha256=Pkw2DL4LvrjqXqHjfM1E6m30ITHT8ufR5-WXTxNhE2g,79207
trl/trainer/gkd_config.py,sha256=0Vfmt8vY8hHmxV3qI8oN4R3FmDg1kjQcb31qLspsJzo,3036
trl/trainer/gkd_trainer.py,sha256=m-01gEKpS_Phw2GKNialIWcCnE1_q4-4VHUCRLHSPlY,17212
trl/trainer/iterative_sft_trainer.py,sha256=4r9MpURFeAEvMVqZZrUUCbzJ8YKI0va6wfKaqjP9VBQ,19152
trl/trainer/judges.py,sha256=rSu6IuTrX3rIXjkGUvVJa5jsoYNewW7lnREHht0y_0Y,16027
trl/trainer/kto_config.py,sha256=WsHHbooqY6rc5xbq38rpyP64l6z9-JbZ138NcLEVogk,5745
trl/trainer/kto_trainer.py,sha256=Gd089TsBw6AXUO8xr8HKfKAArLgU5d8v6lhqQmJfadk,74104
trl/trainer/model_config.py,sha256=FVkm1rMkcD4kQMrXeq_XMQrlhFQjGPF4Mr1tV0-F9ek,4966
trl/trainer/nash_md_config.py,sha256=KW-JQSL1nM5Pi6_HJosqSPl6EfIzx6Oh_PlD0PFfJPk,1552
trl/trainer/nash_md_trainer.py,sha256=JQ4ycIb6d9_yGyw11Q80SNC1U9SxTZLWvK_uFncmXAk,22523
trl/trainer/online_dpo_config.py,sha256=QjpofoGENwLaqFYN5B5PDplcKJPy0uR_C3RGtMqfwfw,3948
trl/trainer/online_dpo_trainer.py,sha256=1L9BMF7P1c1sAXhrbBpe3IHE82HWWlOpClVpbm4ULw4,34266
trl/trainer/orpo_config.py,sha256=CRf1_qvFQmgYVl-Khy27_NnyFvnk1hFJfv1ra2ENjxU,4314
trl/trainer/orpo_trainer.py,sha256=6jhJ7vojgQLPyh4SNz8phaB3zbuTgiCT5BckYx8eN8w,50604
trl/trainer/ppo_config.py,sha256=byfAQUv1mY_Io7M9nqPCpfkJp7cnZ-A9K7eEq9ghAtc,2380
trl/trainer/ppo_trainer.py,sha256=wzYmxfC-p_2wIw2YXBGdIPk4k4zuj3Q3JRcmYOE40OI,35409
trl/trainer/ppov2_config.py,sha256=vgqPj4wON8HYNa3_0lnOroOk2UoG6r1LUgfNS4iiJYU,1037
trl/trainer/ppov2_trainer.py,sha256=0aRirqkIOKkQcKmb802dKArNScKZeFqpqPvGRnwBTME,1045
trl/trainer/reward_config.py,sha256=n4L091qDbptyO-YlWipFwoaRt5PBOXV2_zI_QhckI7Q,2095
trl/trainer/reward_trainer.py,sha256=wisPmFUNmPx2ekVLj7ejuEmMjOwVFwVUGtTtsAvEmDk,19156
trl/trainer/rloo_config.py,sha256=N_lEhLzd8RDuYj5CA-0dOLxa6C428P6SsGW0VQiwLEY,2057
trl/trainer/rloo_trainer.py,sha256=Q48PPao6q-27PBXUDifSbyJ505UPr8VHOC1FUWdX2iU,30475
trl/trainer/sft_config.py,sha256=qf2AuFj7qn2Rc6RZyJWF1MuP_yMUdJkdo-wFOggw7wg,4054
trl/trainer/sft_trainer.py,sha256=4FSce55wdXysOF5jEAAfwxtSxT-nJayajx6eOUxjch4,29640
trl/trainer/utils.py,sha256=uBNiYO8CHFmedq2hZZNAuE8bJ0jxFDQBQkhfPHbZiqs,61866
trl/trainer/xpo_config.py,sha256=tdtkDHmmO57TQtgR1NkTFwR7uBT-CrKzc4k6RA0Aff8,1430
trl/trainer/xpo_trainer.py,sha256=tp9_AAo0MEZNIr1cFB27MAEMSm2mN7TC8pfRJbWsR-c,25574
trl-0.12.0.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
trl-0.12.0.dist-info/METADATA,sha256=nNgaj7ORjYZ33l2pHq5pSyNf36G0grtNbZWQ1UUU-OU,10964
trl-0.12.0.dist-info/WHEEL,sha256=R0nc6qTxuoLk7ShA2_Y-UWkN8ZdfDBG2B6Eqpz2WXbs,91
trl-0.12.0.dist-info/entry_points.txt,sha256=yL7_8yycDPJfL0E-DhCJabQAYr4U6-pL2IfXVqomtOs,46
trl-0.12.0.dist-info/top_level.txt,sha256=TUKDSfcN6PgBU9dnJ6_YJ7qhDzZ0CKzHvHehR6GKpWg,10
trl-0.12.0.dist-info/RECORD,,
