trl/__init__.py,sha256=U8Z_aS6dzgFd8WJ8fXPvcZwI4ecbi_yXyODa5F-DP8M,6628
trl/_compat.py,sha256=ph2c9r6aK4qdt3nB6USZxzsxyfxPpSOtEfcT-WI_bF8,8978
trl/chat_template_utils.py,sha256=wfKBEnnrUc_3nv1ZDpuAPtSpTfHU5E8W0vnnIbcjxac,24875
trl/cli.py,sha256=jwgZ20oEZRg8rkJuuw2Roj6ToRotpczJDqGWyBwP_28,6909
trl/data_utils.py,sha256=vXrvRd1xSFvD38QU4qqnN9paZTjs7PCVon71jKT5yec,40889
trl/import_utils.py,sha256=-axSkC_bEo3N_dvyFnsdO8YeONuh4CPgua1478T31iw,5798
trl/mergekit_utils.py,sha256=PDl-gYi1t6urIng9S7GdZAoApIK65ZlcWzKZer59l6M,2508
trl/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
trl/accelerate_configs/fsdp1.yaml,sha256=FBw8i6diLwfcUI6Uu7T-UTpd7niY062tLsCFMLoT0c4,725
trl/accelerate_configs/fsdp2.yaml,sha256=zg1L3kVDJb7kvuxIPaqMN6mZQFD2mvG8IxSRmkY7dDk,627
trl/accelerate_configs/multi_gpu.yaml,sha256=yDX-SPo8qY3SW8jsf_53VJX1GwIV20wmRPBbCKf4_8I,321
trl/accelerate_configs/single_gpu.yaml,sha256=4MuOZIjHNir2adOzaoOgBwD9IXXRbPNPzBYVW-zkc7I,316
trl/accelerate_configs/zero1.yaml,sha256=fyUlyzQ_nhP6oamOgOBM7MDZMuHvG4xZfm_-2wnuYTo,441
trl/accelerate_configs/zero2.yaml,sha256=kW58rFIjO1Jz0-TWjg2zUHO5BUBHI4TPFIUHb2M-WiQ,470
trl/accelerate_configs/zero3.yaml,sha256=VN3HDSxEn_WCvYpML4thWO7cpr2N39VwAJjMvPtwfxE,498
trl/experimental/__init__.py,sha256=FMF_-llsmlfdSVPb8RfoW4z6zX0Co7J2jub6IW2bKyE,1310
trl/experimental/merge_model_callback.py,sha256=UG2Yr0VJsYCkrDGmWjwssAvTNwMgJTadpeExsIpdQmg,13850
trl/experimental/utils.py,sha256=3VUizepZ1V7jHjl_7F53m4mc1_ls3wOKmG48UkKcVsY,22630
trl/experimental/winrate_callback.py,sha256=rdcVQ7joSOSafYsQn5zahtDYj59hP0wx8wQkuiavQgY,13164
trl/experimental/bco/__init__.py,sha256=X9vUxV2PcrTORo0CEALpq8EoHXtNTavAh0s-GVBDYio,682
trl/experimental/bco/bco_config.py,sha256=A3eU3jno8BWdZeXcQUmQU2KK4F1khJxnjo6ROzZY9Kc,8871
trl/experimental/bco/bco_trainer.py,sha256=_tNmTfQ1O4uCy2jzQXPKL8lVuuJHJ0A-Yh2aAlowEZM,68429
trl/experimental/bema_for_ref_model/__init__.py,sha256=YSMOnS353SIRvV4_NS-Y-t0sbD6snBcbELbG3ku2Nfg,683
trl/experimental/bema_for_ref_model/callback.py,sha256=RYC7doi9utJa98wKMT0NP8pmY0rITQGISfwZjlQm_Vw,9641
trl/experimental/bema_for_ref_model/dpo_trainer.py,sha256=4YrnaxULpR6TSpjWLvOGoLBziWQNGgWhNqOjuZT1mHg,1181
trl/experimental/cpo/__init__.py,sha256=rO0s9KRAaIsLOMJo2sweX51LkAK4QsLOeDDGIonMFLw,722
trl/experimental/cpo/cpo_config.py,sha256=5PvGc_B7RyQgzC1Yx846hvxZ1oRfjF224qVpkuVvbJ0,9876
trl/experimental/cpo/cpo_trainer.py,sha256=HvspzeqKTJYcWKcFSKrbWo2E1eeZCthELe646k6eiMc,49163
trl/experimental/gfpo/__init__.py,sha256=uP2ol8mB0vbkaDcIXCAAwN_HzW7ulo0c4HGqqlevafY,686
trl/experimental/gfpo/gfpo_config.py,sha256=Zz4vFZ9vAy9kD47EN3RgoSJZtW7_8JnGn35sgHmZzNw,1325
trl/experimental/gfpo/gfpo_trainer.py,sha256=mIgwf2DzLdBPE-y7KpzRZq4Yr9rFYj8jEW0kSNcJCJg,21475
trl/experimental/gkd/__init__.py,sha256=QO5Yki2ia5hOep3fpQArdI3KMnpQkIV1FE0WiznkZrU,722
trl/experimental/gkd/gkd_config.py,sha256=iAdbdxzY-5qmWvTJAPHg_TthR3E_cG61r6jEfNGxsrM,4900
trl/experimental/gkd/gkd_trainer.py,sha256=pJQJQeyx8lvEuEs6Hu3gBxblt-U2p4wnvU64FBeV5OE,20720
trl/experimental/gold/__init__.py,sha256=FnYqi1_ahqtra-Zj2iECHAfr7AHBXQxYWrDNhK-a3Vc,728
trl/experimental/gold/gold.py,sha256=RYgHSL6f1c4hsZ1RoXczQz2Y00L1R0noAax-QONl8UE,5399
trl/experimental/gold/gold_config.py,sha256=cUQb5iIc0lza5vYJ8a8yxAvP0A4UAgN08X3RxCtyCxY,20007
trl/experimental/gold/gold_trainer.py,sha256=Sdqj1Xz3IgPIGuBzQk7MbVGQV5Gj2RPki8Jk2_0P-jA,101877
trl/experimental/grpo_with_replay_buffer/__init__.py,sha256=KPrhB5rG42642HmeBRcnefGPLBICYAdd613MaDGFTys,770
trl/experimental/grpo_with_replay_buffer/grpo_with_replay_buffer_config.py,sha256=UW6s4umTNDvsDQ-2lHMOAovD5Ro1gGlBohJNnuEan0U,1372
trl/experimental/grpo_with_replay_buffer/grpo_with_replay_buffer_trainer.py,sha256=9duMAbykhskzxZ5HqoQQK0rLFGIPh26pNtdk2YJZxyo,36517
trl/experimental/gspo_token/__init__.py,sha256=ymJxlrn9cMOyLPGHBq_7VKfvGrhbXYl1ZPi8OyGjSbE,650
trl/experimental/gspo_token/grpo_trainer.py,sha256=kOIfJq-9gj9wp7FQuhJGAqK_ctEU7rbfed0PO9D4c6E,8262
trl/experimental/judges/__init__.py,sha256=-Yk-310tjPCC4xn4AvU_TJ6TdL_XAWfCFFfjiDbvqNc,986
trl/experimental/judges/judges.py,sha256=REnuXaFXT1aqKijRf2GcHhH9JmOhQUwty4V4JrfNng8,20845
trl/experimental/kto/__init__.py,sha256=K-M_Blc_9na1bQDKla6jKJKb7fPKxSUmiJyRHNFuSu8,722
trl/experimental/kto/kto_config.py,sha256=fb-3wOOeEHZMZMLGygUvg9xdIgyP5a7semwkn-91saU,7549
trl/experimental/kto/kto_trainer.py,sha256=SOVqAZRq0OpiVvsrytdYbl21rjRDtu4oVdgb_GJEPfg,71384
trl/experimental/minillm/__init__.py,sha256=xJRoMqech-1OcFwcP3Ut-wV7DlYm6z6SXb455kHOlpA,746
trl/experimental/minillm/minillm_config.py,sha256=ShF3_VvW1JsPZ4FN0doDXXgvPE52L2i6x-rQVJ6KG3Y,6602
trl/experimental/minillm/minillm_trainer.py,sha256=M-4VU4XsES2JJ_AgX4Jx3VfJ4uyTfhzFmdd--hgzSjQ,20098
trl/experimental/nash_md/__init__.py,sha256=0-fTu0AiobRY3KTKO6l-HMW_Me66vuaF-l7ym62oRXA,742
trl/experimental/nash_md/nash_md_config.py,sha256=6GlI-rW4umHCMU2ykEwLztRGvd8hpHJlznEu7KzAsH4,1872
trl/experimental/nash_md/nash_md_trainer.py,sha256=zsDsm77lGHq2kc_9i43lyD7vgIkcBpMGmRgVYva6H2E,24680
trl/experimental/online_dpo/__init__.py,sha256=d0PLdODeA1bPSoXLlGWEAeA6XwGiHCd1isltzRGAVOQ,760
trl/experimental/online_dpo/online_dpo_config.py,sha256=kZOcyHlYS633UgQFKHVEmfPGGlPJ6S7Bg8nUQ6R0gdU,21882
trl/experimental/online_dpo/online_dpo_trainer.py,sha256=HTKRIoaczjFr0TCOesVXUSqupLX2g5jGGSyd9idYtIs,77277
trl/experimental/openenv/__init__.py,sha256=LlzcnV_wiUFOTBh64phVNDb6dpKr8A93i_K-ZntlysE,705
trl/experimental/openenv/utils.py,sha256=uXI73ca6zidt4F7qrDe2jralGh8Z1jmLl6Yep-A3zKY,7889
trl/experimental/orpo/__init__.py,sha256=raFCz1dhCGKRjdQREuxEWY_MwXpIA1GvpZXxsqzv1EU,728
trl/experimental/orpo/orpo_config.py,sha256=2WwxnwvIreSL8ctiIlSHbKNvVZzvRQclrXj4lmkFZbk,7402
trl/experimental/orpo/orpo_trainer.py,sha256=vC9ywiyf5kf8vH4idCvdVqHAIDmIptPxW8X0Mc6c-G8,48107
trl/experimental/papo/__init__.py,sha256=qP04taTkxweuEvOll1BfSFU5BlaZyv7OIT-i95PE8CU,687
trl/experimental/papo/papo_config.py,sha256=YN5qFmankCNVYDgEEQ0TRQDo29FqumZGRxfjtIkZb1g,3141
trl/experimental/papo/papo_trainer.py,sha256=mDb0UF9wJskM1cpblxUd0UwbwnvNK8Wo_KZibGgnkXU,15685
trl/experimental/ppo/__init__.py,sha256=7jMTBOcEiFGAs6rYdH61xzg1RWTGfBC_r2YFd3DBtR4,990
trl/experimental/ppo/modeling_value_head.py,sha256=TEUbETl0Pjeg0y2jBG1kl4YnurlHVn4Un1dPGTTk6O8,44279
trl/experimental/ppo/ppo_config.py,sha256=8XFYzYXys2HU_dApxSnTS9yJaZHuAc3_I5nUPkf8k2M,13602
trl/experimental/ppo/ppo_trainer.py,sha256=XiJFh9pVxRIVcIERtAGmbte4N3xKPNqyeEFsUjZ1xQQ,49101
trl/experimental/prm/__init__.py,sha256=D5e_7PoXs3nTMVQaN1rAGvIUra6cQDfOyFViUbZrNR4,722
trl/experimental/prm/prm_config.py,sha256=5GGtjgEMnj5Pt0ZFQPsin-4SAVcqNdniIXdIo9vufoI,4375
trl/experimental/prm/prm_trainer.py,sha256=UvgcnFDe74qS0o3YsuwyfXs2T8Y53yJPtvoeAEvu8sQ,16240
trl/experimental/xpo/__init__.py,sha256=QcEIbvNKqd-1mR_mHH8gmtE5UGhZGBFG_9bMYLBhuvI,722
trl/experimental/xpo/xpo_config.py,sha256=hWuv1yNMEM-KBFJFv9x_8xu-NhsU8oblvqQLLLF68-Q,1691
trl/experimental/xpo/xpo_trainer.py,sha256=JALn0Zf_GWSsR7GPGJhYwc82FuAe3HGvJ4Mdkp6yfvE,25210
trl/extras/__init__.py,sha256=V1wvJ_Ee6Ro58SbMXQqO7FG-_jvCpy6kB31_7Wtl68A,611
trl/extras/dataset_formatting.py,sha256=D_8NqUiZ3aSF6bl3qnopEOY8suwH3YEhJ_W4gljSXA0,1285
trl/extras/profiling.py,sha256=kdmjghftaN1onlnUr-QIzJPT71a0BTnufQm4R_J3ZtQ,7368
trl/generation/__init__.py,sha256=aAYDsVEN0dDYZMZaeZvBhAohos1fQX_asTGHJrjmFUE,828
trl/generation/vllm_client.py,sha256=cz7JihwIAdOlkgFzv2h_uxu3vHEsCDJtGBUw_nXX-P4,27897
trl/generation/vllm_generation.py,sha256=lEtFl46bWXUiRbjEAFmhDwipxY8NVJaLh4NCxcBMYuI,36747
trl/models/__init__.py,sha256=7Ly3IQjuppDXGbAQtOcj23fWs5Peo-dCO9NFdmiLUtc,1533
trl/models/activation_offloading.py,sha256=ZKnl22gUmvG1FcJrXQZJGyHK_bviFyrqx9mk67Rnxis,34695
trl/models/modeling_base.py,sha256=VlhSCbHGRF8pkG9fIbkLIXqAw21ShWA4dF_W4rKBflg,1424
trl/models/modeling_value_head.py,sha256=6n0xv9x8R4nHTpCWgchXMgPDkpkS50RR_SZ5SXpRJvE,2220
trl/models/utils.py,sha256=cqQ0u-fxkwkrZf3C3KUnPhHnxBoyQ0XyovveahLmA-4,18837
trl/rewards/__init__.py,sha256=J7jBI_tLyUV07IpE3q8y5DwUR9nWA8YKAjLXksnP4PY,1216
trl/rewards/accuracy_rewards.py,sha256=-F7ePyttFOuGEZarzFmwMsFi-WhLJMFh7S_iso7AoWM,7610
trl/rewards/format_rewards.py,sha256=XKId9E_3opkCtiELkYSWKxb8QnYJv2EGLuT9QOcmbS0,2211
trl/rewards/other_rewards.py,sha256=fzad9ow5yukVkdfan3hMWY7alEv2E-4Q7BPckNUcgaQ,2633
trl/scripts/__init__.py,sha256=pfV1yIL5Sh7I18KSxa-aHwpUbyLH3KxpWqmV6UT9hWo,1077
trl/scripts/dpo.py,sha256=Jpg3pZzGn0mn52gHjBxs0jUzBANgFOaeNW1wPTxA-h8,6235
trl/scripts/env.py,sha256=1PbnrAf9Xl8O4C3cMyuBCycuBmIaKXJTJaKUi9oL5NI,3522
trl/scripts/grpo.py,sha256=4hTKtuDtw2iZe8N-XO3e8xPQJgyNHte2qQ08MKoaJjc,7544
trl/scripts/kto.py,sha256=kpoel9YO_0X-ypn3lDa_0o9uTWAD9ezjFN0BA3bBzCk,5497
trl/scripts/reward.py,sha256=86ZTxcazpUiz5PII7C7mgWxkd9-L1ac7TOdhs2Tp_q4,3772
trl/scripts/rloo.py,sha256=Pxkj5udjCGGvaezAYWdDt2oGC9OWd6kOGbie-ZiluNM,6822
trl/scripts/sft.py,sha256=ov0qy63qvp7q3s6HoPdCb57wxlGuP0K8dEQ-8qeJrWs,6000
trl/scripts/utils.py,sha256=vAdRpl7bBMX-vFjNXPBCXT8cKZwaq2tTibF2DEEFOzU,18575
trl/scripts/vllm_serve.py,sha256=lReCeY1OLOWqOC_6m_CQnlajxq8nl-7HZlsNLkoKxUg,58207
trl/templates/completions_dataset_card.md,sha256=dw3t1mm7WyMWTTcRyttemOWcXo86WLc7BTfRV1YIJS0,1241
trl/templates/lm_model_card.md,sha256=0ZtamGcF3blI4r6d6p52dZMYQJaZjaMk8CSO5kzsnFA,2112
trl/templates/rm_model_card.md,sha256=4GnPVao9WxML3eFTAkffMRGvxROVjUS-jJKcHiBocdU,1905
trl/trainer/__init__.py,sha256=28iq5DrSCuvzIk2_6GsJcJ2_eLO_rGIDQzOsXKz1lGw,5942
trl/trainer/base_trainer.py,sha256=tIavhuLicKgPp_bWrFZkZbmDVJWBvEjv5_xsmGi5Mhs,2891
trl/trainer/bco_config.py,sha256=hTSrpYIpg9Mtd6H88ZI1tpGKirTNlI4HilPW0fK8Mto,1334
trl/trainer/bco_trainer.py,sha256=Vbd3ayiVb2rgxqfOzCkVIY3q6U20UrfGfEzpZSL9cGk,1362
trl/trainer/callbacks.py,sha256=qlk4BoG2oiyVkMs_XGMP_V3QaVQ9boIM33sF3EWH1AI,32084
trl/trainer/cpo_config.py,sha256=6QKt8K_IDQ1QeAMbaJH77p32RaJl0KVINm-oamx2gLY,1334
trl/trainer/cpo_trainer.py,sha256=8g_RPOH6bM20n2niWlQ7v5vyeSvjAmrhEIhK5ntGZ5k,1362
trl/trainer/dpo_config.py,sha256=sHyguMernEAAoqn1rDPXGc-lo2SHXfn21yZTQvbWkiM,38561
trl/trainer/dpo_trainer.py,sha256=HecPzMNuP0yNZboaq9TKa2AXUllBDPHUd30VXeE178U,105723
trl/trainer/gkd_config.py,sha256=pCTgOL5ZSZTvyCTDBGDmjf_EcvTk8WnXHFazNlsKnwE,1334
trl/trainer/gkd_trainer.py,sha256=RdA6KonRuwxat8mzk8hq471DKurjRhErzwNKZ4NTG9I,1362
trl/trainer/grpo_config.py,sha256=w-xnROJxBvqyLE9QVl5euCSLHcLOdYHMud_BhndnqMo,54061
trl/trainer/grpo_trainer.py,sha256=lbM0JPwgtpVxW_tAabbMlmyobMeWkTA743BRQr7kIww,122180
trl/trainer/judges.py,sha256=rkLwzfUwhm5WCz9ijeBN4NmUqQHYAT3jxxWqRW2QR-A,5096
trl/trainer/kto_config.py,sha256=g9ZzUlnwRyvSKcfA3pNI-ep3u4b2kTAK3E3Jkv4XurU,1429
trl/trainer/kto_trainer.py,sha256=xlFQtdF_Hx-bL9g2JJ2LTmsT-NSarjpfKt9fVKBvvuY,1458
trl/trainer/model_config.py,sha256=7k27sX-GRpF3tum8nccoa9jHX4LVu_ZLA9hwa6wWh1U,8813
trl/trainer/nash_md_config.py,sha256=SBMRmNtIpinKspjNjcKpEVYCChLv9jbd9dOzft_-aP8,1360
trl/trainer/nash_md_trainer.py,sha256=hgVNgknPIEH9jaBCfoPQQSdZsPHbYNQHlh77ir3J4Wg,1388
trl/trainer/online_dpo_config.py,sha256=g-jSISrvNt51bXVczcqQQKO7VRYoU6th9ZsUo7boHFg,1399
trl/trainer/online_dpo_trainer.py,sha256=YYUEZMeBgnziz0ByqHXsHh6Qv6CT27_7IEt9hdmLqQc,1427
trl/trainer/orpo_config.py,sha256=UdvSQ1vRan994wWkNnSLqzLV5rNankCwcdWrM8Hp07o,1342
trl/trainer/orpo_trainer.py,sha256=kOb-sV3gpN6_lr2m6JnLe0UGHuy16spijy1bWCn8aHE,1370
trl/trainer/ppo_config.py,sha256=jYPg_sUKLoP_OGoPwte85td4fraxUknxneNYfQNpf4U,1334
trl/trainer/ppo_trainer.py,sha256=S9AB1GOjl4QLcfIqd_rpi1kj471CtvIPJ-trW2M8M1U,1362
trl/trainer/prm_config.py,sha256=PdheP3QIylpIMtJWHY0PFgOf2XwJ1ekdoQ2cqnN_LOw,1289
trl/trainer/prm_trainer.py,sha256=sM6pa-eQku7qQuAXkCip11U0JcW6oaD7oYo9lO9XQno,1317
trl/trainer/reward_config.py,sha256=cXC3eibjs3_4cbtxaIAFRT8oagEybc2YG06jIEs9Xcw,8517
trl/trainer/reward_trainer.py,sha256=jvduuz86VzD8405zEjM3qKP9vgnWEA6UZLOhXVw1qFs,32091
trl/trainer/rloo_config.py,sha256=wiqbJV-3P5yNHAFQoebSbT4qWNaQQjCOH-cf3TXYs_s,33774
trl/trainer/rloo_trainer.py,sha256=QqGgBiDbd50V8SDYSKDPYRpAt2O01k5ncJOargEmfyk,77112
trl/trainer/sft_config.py,sha256=cTrDWpEcr7YYv6SVJs18zlTXsLf-9L_NZPZ2Mu_vTTk,14300
trl/trainer/sft_trainer.py,sha256=HvF0TnxT5R_moP8NLxwV7mJIfh1gkHnkPyTd9hE6SvA,72965
trl/trainer/utils.py,sha256=DkHHk2ciogqQmMc0bpCkcU-ldodkG7Fk6dAxkKMbsvw,50443
trl/trainer/xpo_config.py,sha256=dXbXnrMOnb1U4-VVlVa-w_rhxxuX23U49maej0O8IGQ,1289
trl/trainer/xpo_trainer.py,sha256=KLjxSe2PHRiI9jj9xXZvMDmUjxuwYAM6vanToD33BUE,1317
trl-0.28.0.dist-info/licenses/LICENSE,sha256=G_YUsf3ED700SqWNANF9X9DSUuozOgW-AYo4lZyLKZg,11355
trl-0.28.0.dist-info/METADATA,sha256=bs2TMuh3q8yJaCGoZxkDxTp-RtycfV2IWPcPhMfOIlQ,11617
trl-0.28.0.dist-info/WHEEL,sha256=YCfwYGOYMi5Jhw2fU4yNgwErybb2IX5PEwBKV4ZbdBo,91
trl-0.28.0.dist-info/entry_points.txt,sha256=EiubuQrZSGOohRB4xVoiVAyWsPsOHPSVpbzSk8YB0x0,37
trl-0.28.0.dist-info/top_level.txt,sha256=QU12VhjlpAtMnIJqiO2np3RkTB_Eozt1d-g8QDf5P4c,4
trl-0.28.0.dist-info/RECORD,,
