trl/__init__.py,sha256=7mi4w7rWpwRHGlwGjnwgQRtfvU1EL1l7y6W2TFYufwk,6544
trl/_compat.py,sha256=V0fGIaQzlgGkWWYuKVef-KWtW9692TQr1t55c3SPTq4,7689
trl/chat_template_utils.py,sha256=5hGOiQdquwVLv35nMNLWJO5sk7vqQU7r5uQAY8P4mnM,22916
trl/cli.py,sha256=jwgZ20oEZRg8rkJuuw2Roj6ToRotpczJDqGWyBwP_28,6909
trl/data_utils.py,sha256=D9-VIyb3neYy2Z-js6T8KuKzWEmcF-Cr7DDGvmEBtqU,40920
trl/import_utils.py,sha256=-axSkC_bEo3N_dvyFnsdO8YeONuh4CPgua1478T31iw,5798
trl/mergekit_utils.py,sha256=PDl-gYi1t6urIng9S7GdZAoApIK65ZlcWzKZer59l6M,2508
trl/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
trl/accelerate_configs/fsdp1.yaml,sha256=FBw8i6diLwfcUI6Uu7T-UTpd7niY062tLsCFMLoT0c4,725
trl/accelerate_configs/fsdp2.yaml,sha256=zg1L3kVDJb7kvuxIPaqMN6mZQFD2mvG8IxSRmkY7dDk,627
trl/accelerate_configs/multi_gpu.yaml,sha256=yDX-SPo8qY3SW8jsf_53VJX1GwIV20wmRPBbCKf4_8I,321
trl/accelerate_configs/single_gpu.yaml,sha256=4MuOZIjHNir2adOzaoOgBwD9IXXRbPNPzBYVW-zkc7I,316
trl/accelerate_configs/zero1.yaml,sha256=fyUlyzQ_nhP6oamOgOBM7MDZMuHvG4xZfm_-2wnuYTo,441
trl/accelerate_configs/zero2.yaml,sha256=kW58rFIjO1Jz0-TWjg2zUHO5BUBHI4TPFIUHb2M-WiQ,470
trl/accelerate_configs/zero3.yaml,sha256=VN3HDSxEn_WCvYpML4thWO7cpr2N39VwAJjMvPtwfxE,498
trl/experimental/__init__.py,sha256=FMF_-llsmlfdSVPb8RfoW4z6zX0Co7J2jub6IW2bKyE,1310
trl/experimental/merge_model_callback.py,sha256=UG2Yr0VJsYCkrDGmWjwssAvTNwMgJTadpeExsIpdQmg,13850
trl/experimental/utils.py,sha256=IRBaaoQi34AVVWBVOWWJaI7JcMT3rQ_jEOJHMN9g3TM,22797
trl/experimental/winrate_callback.py,sha256=rdcVQ7joSOSafYsQn5zahtDYj59hP0wx8wQkuiavQgY,13164
trl/experimental/bco/__init__.py,sha256=X9vUxV2PcrTORo0CEALpq8EoHXtNTavAh0s-GVBDYio,682
trl/experimental/bco/bco_config.py,sha256=eil-zPBXtD5Q33fPrAMXdtDv6H2_XifyyeP5x8bAH90,11284
trl/experimental/bco/bco_trainer.py,sha256=Od_WSdtm1DtWtDPoztQ_MLWCzGsMK5vxu2cWL_TnHhc,70741
trl/experimental/bema_for_ref_model/__init__.py,sha256=YSMOnS353SIRvV4_NS-Y-t0sbD6snBcbELbG3ku2Nfg,683
trl/experimental/bema_for_ref_model/callback.py,sha256=RYC7doi9utJa98wKMT0NP8pmY0rITQGISfwZjlQm_Vw,9641
trl/experimental/bema_for_ref_model/dpo_trainer.py,sha256=4YrnaxULpR6TSpjWLvOGoLBziWQNGgWhNqOjuZT1mHg,1181
trl/experimental/cpo/__init__.py,sha256=rO0s9KRAaIsLOMJo2sweX51LkAK4QsLOeDDGIonMFLw,722
trl/experimental/cpo/cpo_config.py,sha256=g5Y4hwPZ5tjpJPgxCdh0acdGu-UCu49cX3DVfe-3BU4,11742
trl/experimental/cpo/cpo_trainer.py,sha256=IUYala0-NwCjG2zM7utPfJJcAw8sB3Faoxqszs2H6w4,50410
trl/experimental/gfpo/__init__.py,sha256=uP2ol8mB0vbkaDcIXCAAwN_HzW7ulo0c4HGqqlevafY,686
trl/experimental/gfpo/gfpo_config.py,sha256=Zz4vFZ9vAy9kD47EN3RgoSJZtW7_8JnGn35sgHmZzNw,1325
trl/experimental/gfpo/gfpo_trainer.py,sha256=mIgwf2DzLdBPE-y7KpzRZq4Yr9rFYj8jEW0kSNcJCJg,21475
trl/experimental/gkd/__init__.py,sha256=QO5Yki2ia5hOep3fpQArdI3KMnpQkIV1FE0WiznkZrU,722
trl/experimental/gkd/gkd_config.py,sha256=iAdbdxzY-5qmWvTJAPHg_TthR3E_cG61r6jEfNGxsrM,4900
trl/experimental/gkd/gkd_trainer.py,sha256=pJQJQeyx8lvEuEs6Hu3gBxblt-U2p4wnvU64FBeV5OE,20720
trl/experimental/gold/__init__.py,sha256=FnYqi1_ahqtra-Zj2iECHAfr7AHBXQxYWrDNhK-a3Vc,728
trl/experimental/gold/gold.py,sha256=b0dUWVQmSNiTKCicRlB6-wxe1Xny8SPPrJ5V9wVi_u0,5461
trl/experimental/gold/gold_config.py,sha256=cUQb5iIc0lza5vYJ8a8yxAvP0A4UAgN08X3RxCtyCxY,20007
trl/experimental/gold/gold_trainer.py,sha256=qXZ5toERTzKNiYOBI_D7Ulbv5L8rubqon3bNbk-_-UY,101507
trl/experimental/grpo_with_replay_buffer/__init__.py,sha256=KPrhB5rG42642HmeBRcnefGPLBICYAdd613MaDGFTys,770
trl/experimental/grpo_with_replay_buffer/grpo_with_replay_buffer_config.py,sha256=UW6s4umTNDvsDQ-2lHMOAovD5Ro1gGlBohJNnuEan0U,1372
trl/experimental/grpo_with_replay_buffer/grpo_with_replay_buffer_trainer.py,sha256=9duMAbykhskzxZ5HqoQQK0rLFGIPh26pNtdk2YJZxyo,36517
trl/experimental/gspo_token/__init__.py,sha256=ymJxlrn9cMOyLPGHBq_7VKfvGrhbXYl1ZPi8OyGjSbE,650
trl/experimental/gspo_token/grpo_trainer.py,sha256=kOIfJq-9gj9wp7FQuhJGAqK_ctEU7rbfed0PO9D4c6E,8262
trl/experimental/judges/__init__.py,sha256=-Yk-310tjPCC4xn4AvU_TJ6TdL_XAWfCFFfjiDbvqNc,986
trl/experimental/judges/judges.py,sha256=uPkvb66J80MnC4TzvgULiVx9zDE4aUx_RTUzfW09q5Q,20486
trl/experimental/kto/__init__.py,sha256=K-M_Blc_9na1bQDKla6jKJKb7fPKxSUmiJyRHNFuSu8,722
trl/experimental/kto/kto_config.py,sha256=OXOM6abuc7siKTOkxSyKrv4DGRs8naqQS4nse8pxQqU,11082
trl/experimental/kto/kto_trainer.py,sha256=lrZ1GuKyG5eaaR8PiRL3ktSM7tbeC6GuEUz57IyKOaw,72311
trl/experimental/minillm/__init__.py,sha256=xJRoMqech-1OcFwcP3Ut-wV7DlYm6z6SXb455kHOlpA,746
trl/experimental/minillm/minillm_config.py,sha256=f-FRRd0jtXdPY2tVJmP32VIsrYC7-lPiSNQ2qdURmXU,7766
trl/experimental/minillm/minillm_trainer.py,sha256=rD-TQFCa7j4KcRFLR33rDHlshsY5kw7ihAOgv0zH8DI,19313
trl/experimental/nash_md/__init__.py,sha256=0-fTu0AiobRY3KTKO6l-HMW_Me66vuaF-l7ym62oRXA,742
trl/experimental/nash_md/nash_md_config.py,sha256=6GlI-rW4umHCMU2ykEwLztRGvd8hpHJlznEu7KzAsH4,1872
trl/experimental/nash_md/nash_md_trainer.py,sha256=zsDsm77lGHq2kc_9i43lyD7vgIkcBpMGmRgVYva6H2E,24680
trl/experimental/online_dpo/__init__.py,sha256=d0PLdODeA1bPSoXLlGWEAeA6XwGiHCd1isltzRGAVOQ,760
trl/experimental/online_dpo/online_dpo_config.py,sha256=KoejPnsRncvl1D3aznB1zFik0DD5KqluI-mVBeo1uDw,22129
trl/experimental/online_dpo/online_dpo_trainer.py,sha256=cHG3hrvYaojhTtcdR14AaVKApRRzGBI2BV72tyr-oI0,75656
trl/experimental/openenv/__init__.py,sha256=LlzcnV_wiUFOTBh64phVNDb6dpKr8A93i_K-ZntlysE,705
trl/experimental/openenv/utils.py,sha256=1wwvoGg2LXmsYX03oQYsw2fYjMW5oqQZbPHFFBk1aqM,5196
trl/experimental/orpo/__init__.py,sha256=raFCz1dhCGKRjdQREuxEWY_MwXpIA1GvpZXxsqzv1EU,728
trl/experimental/orpo/orpo_config.py,sha256=0kpcqcXmE-1Gv1Awld8uxClH8JL0bXLT1A-tR01qiMo,9056
trl/experimental/orpo/orpo_trainer.py,sha256=gjTegw0Bh0SS81566cs9iYf1tJ0NfQVIOeLdmI1hjos,49242
trl/experimental/papo/__init__.py,sha256=qP04taTkxweuEvOll1BfSFU5BlaZyv7OIT-i95PE8CU,687
trl/experimental/papo/papo_config.py,sha256=YN5qFmankCNVYDgEEQ0TRQDo29FqumZGRxfjtIkZb1g,3141
trl/experimental/papo/papo_trainer.py,sha256=mDb0UF9wJskM1cpblxUd0UwbwnvNK8Wo_KZibGgnkXU,15685
trl/experimental/ppo/__init__.py,sha256=7jMTBOcEiFGAs6rYdH61xzg1RWTGfBC_r2YFd3DBtR4,990
trl/experimental/ppo/modeling_value_head.py,sha256=TEUbETl0Pjeg0y2jBG1kl4YnurlHVn4Un1dPGTTk6O8,44279
trl/experimental/ppo/ppo_config.py,sha256=vaAZKwxZA_UOhHGKiVsIBXOjomeNXyi7y3DEVg2HbH4,14854
trl/experimental/ppo/ppo_trainer.py,sha256=ZC7xZTgtb9ZdxgfD1iz4d7G3wbg4bvKghPmvDjeh3NQ,48574
trl/experimental/prm/__init__.py,sha256=D5e_7PoXs3nTMVQaN1rAGvIUra6cQDfOyFViUbZrNR4,722
trl/experimental/prm/prm_config.py,sha256=FkQe5CGjKZ2M_0M6eoPyPm_jctxmTPVuEmO6Xaum7GU,5448
trl/experimental/prm/prm_trainer.py,sha256=WEFWpJ5iOKaXjsuQrIz1mwlH0vr1lftc5GF3KVVXrUs,15792
trl/experimental/xpo/__init__.py,sha256=QcEIbvNKqd-1mR_mHH8gmtE5UGhZGBFG_9bMYLBhuvI,722
trl/experimental/xpo/xpo_config.py,sha256=hWuv1yNMEM-KBFJFv9x_8xu-NhsU8oblvqQLLLF68-Q,1691
trl/experimental/xpo/xpo_trainer.py,sha256=JALn0Zf_GWSsR7GPGJhYwc82FuAe3HGvJ4Mdkp6yfvE,25210
trl/extras/__init__.py,sha256=V1wvJ_Ee6Ro58SbMXQqO7FG-_jvCpy6kB31_7Wtl68A,611
trl/extras/dataset_formatting.py,sha256=D_8NqUiZ3aSF6bl3qnopEOY8suwH3YEhJ_W4gljSXA0,1285
trl/extras/profiling.py,sha256=-sw8FDuQqgnxJL5rEkLwsplPG0t2fa7a4dHwGgs2_hc,6479
trl/extras/vllm_client.py,sha256=dxeFn4T6hrqQMMVgtiNl92MvzbQRYANgCSunp8ge-SI,23874
trl/models/__init__.py,sha256=7Ly3IQjuppDXGbAQtOcj23fWs5Peo-dCO9NFdmiLUtc,1533
trl/models/activation_offloading.py,sha256=ZKnl22gUmvG1FcJrXQZJGyHK_bviFyrqx9mk67Rnxis,34695
trl/models/modeling_base.py,sha256=VlhSCbHGRF8pkG9fIbkLIXqAw21ShWA4dF_W4rKBflg,1424
trl/models/modeling_value_head.py,sha256=6n0xv9x8R4nHTpCWgchXMgPDkpkS50RR_SZ5SXpRJvE,2220
trl/models/utils.py,sha256=cqQ0u-fxkwkrZf3C3KUnPhHnxBoyQ0XyovveahLmA-4,18837
trl/rewards/__init__.py,sha256=J7jBI_tLyUV07IpE3q8y5DwUR9nWA8YKAjLXksnP4PY,1216
trl/rewards/accuracy_rewards.py,sha256=-F7ePyttFOuGEZarzFmwMsFi-WhLJMFh7S_iso7AoWM,7610
trl/rewards/format_rewards.py,sha256=XKId9E_3opkCtiELkYSWKxb8QnYJv2EGLuT9QOcmbS0,2211
trl/rewards/other_rewards.py,sha256=fzad9ow5yukVkdfan3hMWY7alEv2E-4Q7BPckNUcgaQ,2633
trl/scripts/__init__.py,sha256=pfV1yIL5Sh7I18KSxa-aHwpUbyLH3KxpWqmV6UT9hWo,1077
trl/scripts/dpo.py,sha256=zzejfBkA1qMEy55twquxntSHK_TicW1RoP19vN7VcKI,6297
trl/scripts/env.py,sha256=1PbnrAf9Xl8O4C3cMyuBCycuBmIaKXJTJaKUi9oL5NI,3522
trl/scripts/grpo.py,sha256=4hTKtuDtw2iZe8N-XO3e8xPQJgyNHte2qQ08MKoaJjc,7544
trl/scripts/kto.py,sha256=JX5Vp8vMEgbch8kuAZ45DdQweuQyxlykoLq5kZvhqWg,5497
trl/scripts/reward.py,sha256=86ZTxcazpUiz5PII7C7mgWxkd9-L1ac7TOdhs2Tp_q4,3772
trl/scripts/rloo.py,sha256=Pxkj5udjCGGvaezAYWdDt2oGC9OWd6kOGbie-ZiluNM,6822
trl/scripts/sft.py,sha256=ZFQMyeG_ABkcPr0GqrQLBjYQGeM5DCGY0HBtRsi-670,6062
trl/scripts/utils.py,sha256=vAdRpl7bBMX-vFjNXPBCXT8cKZwaq2tTibF2DEEFOzU,18575
trl/scripts/vllm_serve.py,sha256=YjVKFrgFLk7vwDSTOc4nKYR9oi48f0skbA01L5t0cbI,40708
trl/templates/lm_model_card.md,sha256=zq0dXorqEOnjHJ8wxwhI3LS2R6qiHmlcgPcVzliwRmc,2158
trl/templates/rm_model_card.md,sha256=O4lxwEsL9ld81LL7rwBwredxAeMDfWfpzwe-k7UYHeg,1951
trl/trainer/__init__.py,sha256=ptVmgx0o6guyMRdzOoZG4LDxlOLsIfOO7gf9zanAHBM,5794
trl/trainer/base_trainer.py,sha256=tIavhuLicKgPp_bWrFZkZbmDVJWBvEjv5_xsmGi5Mhs,2891
trl/trainer/bco_config.py,sha256=snmvvia9tapKzfPL9bW-wlLchi6_MhVVt8iNDRQxZ8Y,1334
trl/trainer/bco_trainer.py,sha256=Vbd3ayiVb2rgxqfOzCkVIY3q6U20UrfGfEzpZSL9cGk,1362
trl/trainer/callbacks.py,sha256=qlk4BoG2oiyVkMs_XGMP_V3QaVQ9boIM33sF3EWH1AI,32084
trl/trainer/cpo_config.py,sha256=bU2o_GtoB6wSdkbPsVCRgNitMtnphgDKoI8WFzRJidA,1334
trl/trainer/cpo_trainer.py,sha256=8g_RPOH6bM20n2niWlQ7v5vyeSvjAmrhEIhK5ntGZ5k,1362
trl/trainer/dpo_config.py,sha256=PBf_zbFgnCMd0zg18V_NIr3ybhjH9YaF72lgT8AIUoU,27600
trl/trainer/dpo_trainer.py,sha256=XeZEanPYDwI8mpicSBzwz38plmOi9Kyi2mqQV4rBqlc,103098
trl/trainer/gkd_config.py,sha256=bfH6dJWISvoYR6Zg_aB1fFj48ogzodcVgBTlxOBJ1lY,1334
trl/trainer/gkd_trainer.py,sha256=RdA6KonRuwxat8mzk8hq471DKurjRhErzwNKZ4NTG9I,1362
trl/trainer/grpo_config.py,sha256=uEBkFb5_Ka3aQJ5KAxfSPpY32iMJCtMdccMeJ8Mjm7M,55766
trl/trainer/grpo_trainer.py,sha256=VOEgGgL8U8Djo_9h4pNoC9crEGQEL7V8ZFwGAzhOTlM,138556
trl/trainer/judges.py,sha256=rkLwzfUwhm5WCz9ijeBN4NmUqQHYAT3jxxWqRW2QR-A,5096
trl/trainer/kto_config.py,sha256=8_KjHZMjZc6QgEOXr-H4rBq1Jp52qeeEWBMQrEcaEn8,1429
trl/trainer/kto_trainer.py,sha256=xlFQtdF_Hx-bL9g2JJ2LTmsT-NSarjpfKt9fVKBvvuY,1458
trl/trainer/model_config.py,sha256=7k27sX-GRpF3tum8nccoa9jHX4LVu_ZLA9hwa6wWh1U,8813
trl/trainer/nash_md_config.py,sha256=jOSjLEtj44ICYsI5-3vlmpGiPqBAXOAJWiNtAXvSttE,1360
trl/trainer/nash_md_trainer.py,sha256=hgVNgknPIEH9jaBCfoPQQSdZsPHbYNQHlh77ir3J4Wg,1388
trl/trainer/online_dpo_config.py,sha256=E4PHn_-B69eQtEwxNzfiD6kkI0URkGPR7SuFzvxAPOo,1399
trl/trainer/online_dpo_trainer.py,sha256=YYUEZMeBgnziz0ByqHXsHh6Qv6CT27_7IEt9hdmLqQc,1427
trl/trainer/orpo_config.py,sha256=Yv0ZJjwUkHNv4PZUUiXca8i2K-MUOu71tihqhHG4kuA,1342
trl/trainer/orpo_trainer.py,sha256=kOb-sV3gpN6_lr2m6JnLe0UGHuy16spijy1bWCn8aHE,1370
trl/trainer/ppo_config.py,sha256=Ah7Yh3xfrAe9GxE8js_MWftvhhIBsw06vm_4yH8hB6Y,1334
trl/trainer/ppo_trainer.py,sha256=S9AB1GOjl4QLcfIqd_rpi1kj471CtvIPJ-trW2M8M1U,1362
trl/trainer/prm_config.py,sha256=kLF_aYwXGgD3jNguig80IFgsjfNgG7sKuiXTYf-FC6s,1289
trl/trainer/prm_trainer.py,sha256=sM6pa-eQku7qQuAXkCip11U0JcW6oaD7oYo9lO9XQno,1317
trl/trainer/reward_config.py,sha256=uaB5_SwfkDuRu6939mxMdY3uLvbu9sbb4zJGeraEpH0,9323
trl/trainer/reward_trainer.py,sha256=zB5SQY7cfC_YSjz7y4nQSgzqt5OEuCZkUyCqdUcTv34,31306
trl/trainer/rloo_config.py,sha256=9OJeVgqDZRIZxotOt2q65YuIUU_s16i7OV9pHwFiE6o,35785
trl/trainer/rloo_trainer.py,sha256=BpW4aqQK0wVRPnQ7SHcJqaae3xl3G9M6jzWxpxyXDlE,93248
trl/trainer/sft_config.py,sha256=ejXfpi0fq-KZKCE-4hiUqNcJTJkkvb4ehXDH3F5Qwf4,15106
trl/trainer/sft_trainer.py,sha256=KQAN7XHpRXrjS6QpkvaKTD6C_GMpYop_G7EBpPl8ktY,71175
trl/trainer/utils.py,sha256=DkHHk2ciogqQmMc0bpCkcU-ldodkG7Fk6dAxkKMbsvw,50443
trl/trainer/xpo_config.py,sha256=Hdqdt2jqi59tgaOu9qGwDF2N6s1ZlVdEjhDneK7_MZA,1289
trl/trainer/xpo_trainer.py,sha256=KLjxSe2PHRiI9jj9xXZvMDmUjxuwYAM6vanToD33BUE,1317
trl-0.27.2.dist-info/licenses/LICENSE,sha256=G_YUsf3ED700SqWNANF9X9DSUuozOgW-AYo4lZyLKZg,11355
trl-0.27.2.dist-info/METADATA,sha256=FANj2gpAD7gze_I2inJjey_YLh_VoxkBs-ajtmjL0Cw,11420
trl-0.27.2.dist-info/WHEEL,sha256=wUyA8OaulRlbfwMtmQsvNngGrxQHAvkKcvRmdizlJi0,92
trl-0.27.2.dist-info/entry_points.txt,sha256=EiubuQrZSGOohRB4xVoiVAyWsPsOHPSVpbzSk8YB0x0,37
trl-0.27.2.dist-info/top_level.txt,sha256=QU12VhjlpAtMnIJqiO2np3RkTB_Eozt1d-g8QDf5P4c,4
trl-0.27.2.dist-info/RECORD,,
