trl/__init__.py,sha256=k9aUlL_MkRdHEiUp0Bi5lKSv4OfkMGRhAL6AyLo9LKw,7931
trl/chat_template_utils.py,sha256=HNGfulXTKWQmieEh8K4watVDX62hlNP8cnXOQultpBM,18062
trl/cli.py,sha256=cU4bHuqx_uAdLvPDShHopQU6BI3qCVQRNAkw28-_Drk,6909
trl/data_utils.py,sha256=iE_cBEz9nt5H3q45K4s26kLKrCfjn06Iq6uWhbEr2g4,38382
trl/import_utils.py,sha256=SZ7FhWbZx96Ao4I6X5kRsp7tdAhThvMJSV6fJ1gZyR8,6407
trl/mergekit_utils.py,sha256=IIGDoiG6dGuYSxS0qRa-jjJD_usR_vaP1h7IHPmZ2QM,2508
trl/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
trl/accelerate_configs/fsdp1.yaml,sha256=FBw8i6diLwfcUI6Uu7T-UTpd7niY062tLsCFMLoT0c4,725
trl/accelerate_configs/fsdp2.yaml,sha256=zg1L3kVDJb7kvuxIPaqMN6mZQFD2mvG8IxSRmkY7dDk,627
trl/accelerate_configs/multi_gpu.yaml,sha256=yDX-SPo8qY3SW8jsf_53VJX1GwIV20wmRPBbCKf4_8I,321
trl/accelerate_configs/single_gpu.yaml,sha256=4MuOZIjHNir2adOzaoOgBwD9IXXRbPNPzBYVW-zkc7I,316
trl/accelerate_configs/zero1.yaml,sha256=fyUlyzQ_nhP6oamOgOBM7MDZMuHvG4xZfm_-2wnuYTo,441
trl/accelerate_configs/zero2.yaml,sha256=kW58rFIjO1Jz0-TWjg2zUHO5BUBHI4TPFIUHb2M-WiQ,470
trl/accelerate_configs/zero3.yaml,sha256=VN3HDSxEn_WCvYpML4thWO7cpr2N39VwAJjMvPtwfxE,498
trl/experimental/__init__.py,sha256=NLnK79EXgCFzLoEpLy7CWwvDOj7YAyasbYwfl9XKnaI,1310
trl/experimental/merge_model_callback.py,sha256=AqhXqVcekwdPOqdIXH-l_XA3qnbPZEUN55R-AZmRxwM,13850
trl/experimental/winrate_callback.py,sha256=pyAKTwvRjJeZvtNE9q6wnkgiIV_jfR2CliQ6qiOx8I4,13096
trl/experimental/bco/__init__.py,sha256=8CJbPYAotJbNutPt6tlmOFuyLdH3zVDwCu0LoUkLpdQ,682
trl/experimental/bco/bco_config.py,sha256=NzIZn6X73GjBgJFb7_XFWIIUm1FgL2q6L96naCaWwdo,10499
trl/experimental/bco/bco_trainer.py,sha256=xBrzsdnYMYuci_vyUYxa7O4DWavUScvr4H6iVjwxAgg,71286
trl/experimental/bema_for_ref_model/__init__.py,sha256=5pu2RcnVVznaCqfS5aSOLJbiFSoSV6YiGagczI_WGUw,683
trl/experimental/bema_for_ref_model/callback.py,sha256=8bgm5Cm0_l9Q-xaT5R4dg5802_VlH5QaozyOtwjtaX8,9641
trl/experimental/bema_for_ref_model/dpo_trainer.py,sha256=z38itb0kQyDwzLHntTsMdIXF2EM3GjjHvTYljn3Zakw,1181
trl/experimental/cpo/__init__.py,sha256=RHTVHIEDUwDDVF1O3nEW34iWhYPSXYf8nCVmtZXPxlw,722
trl/experimental/cpo/cpo_config.py,sha256=XgmqRk5Ds-z4zxNIcHtk0EVDIskkYUxzEgCpdMlv2xk,10957
trl/experimental/cpo/cpo_trainer.py,sha256=cQBIe_w7MxTG1Dk17-G4hsVgxTuxENIAKioSOLSszmw,50968
trl/experimental/gfpo/__init__.py,sha256=kDdEyI01oN5n6lwG3uLRdzqodtsfy0Z8ySROzUCVZAY,686
trl/experimental/gfpo/gfpo_config.py,sha256=xUcayWWu4lfWZdvWfIQstlssIrLbf4hgcJqpIY_NmVk,1325
trl/experimental/gfpo/gfpo_trainer.py,sha256=AUFnbpFyAJTn-AddpISfmcQrOlTSE4VwDbefuMPYVmg,21471
trl/experimental/gkd/__init__.py,sha256=c6XN9vlLSOKsxXvZY9DnVpVzdVj2xyhU2PrQqZfhv5I,722
trl/experimental/gkd/gkd_config.py,sha256=Tdcv9aB2CrWZIFhkwrT11n6aESKguN1fCk0VnIBrc5A,4900
trl/experimental/gkd/gkd_trainer.py,sha256=qorcJk72hdh722Iq2U5IfW92QEMP_M_YFbWEW_RF75U,20025
trl/experimental/gold/__init__.py,sha256=GYzgNgp_OOSwbaFi3mr5O8j21anppy-oGC9zRbvqE9g,728
trl/experimental/gold/gold.py,sha256=vyLd-u7F4YKbAhMgtfOtqOHW23fzseM4isKCuth8LqU,5038
trl/experimental/gold/gold_config.py,sha256=TH1IvLkc-ht4NIxwlI1u-8bpJ5EF8bHe5-BIYQ2Ronw,19895
trl/experimental/gold/gold_trainer.py,sha256=U7Rms5y7ZWu4sY7ECJsdqrhG9xgT0EgOMtLDm3COidw,98192
trl/experimental/grpo_with_replay_buffer/__init__.py,sha256=XHyiiLigOrWnVkJwmss5STwZlrT5B-TM1wXVWLdpuOU,770
trl/experimental/grpo_with_replay_buffer/grpo_with_replay_buffer_config.py,sha256=F657XvqTASsMeAv4oPnsDi4cTfK71ngOm05hvpWu3XU,1372
trl/experimental/grpo_with_replay_buffer/grpo_with_replay_buffer_trainer.py,sha256=DSklD6hARr4FReQMeadEL6wJ-xL5miYuDwwM_AHR4H0,36513
trl/experimental/gspo_token/__init__.py,sha256=KF6fqOTgMYJQzGyGcHn7u6yfEq8zaYXA_uRTu9ME_4k,650
trl/experimental/gspo_token/grpo_trainer.py,sha256=5XTk4ZWuLzH2FH2w8BTxnn4pbFt7awCcJ_uHEktnG60,8011
trl/experimental/judges/__init__.py,sha256=Hj_oAbR4KdfX6bK85rsb1MJU-I1WHO1H7xQ0z467_ZE,986
trl/experimental/judges/judges.py,sha256=btiymjtJTZC6nXkhXrqd191n46IXoKcMFDHKJtE9C-4,19517
trl/experimental/kto/__init__.py,sha256=su1QBWvphtmE8TYQAwqAkxBWsqibOfDQS8JQoYEhEvc,722
trl/experimental/kto/kto_config.py,sha256=hEVrlbccNnlrx0WL60jsLVRwH-ZSgdZyGMu6FiW7WU8,12360
trl/experimental/kto/kto_trainer.py,sha256=QxYIJNVzwdhm5q-2rCAyveaaxwmNNBAkkARsmLII03c,81864
trl/experimental/minillm/__init__.py,sha256=notYrtpHvEPFdsswisLnLDMYQP4A60P4GrWv68gxJa8,746
trl/experimental/minillm/minillm_config.py,sha256=UtRGqLLfbVXmPmEeYsWB0c2Ids54jDtw5uueOXWIsRI,6981
trl/experimental/minillm/minillm_trainer.py,sha256=XDQKACzfvVoO0s3CmI4_iQBQc8svRHL6LRcVbvZJaHM,19329
trl/experimental/nash_md/__init__.py,sha256=XEGevty-bbLz6gE3cMtrxnwuf-LZEQAisJw3K3KDvZs,742
trl/experimental/nash_md/nash_md_config.py,sha256=UM8DDtsE-7r68zkcFV79VhORFIvU-cZiIDD1tXM_asM,1872
trl/experimental/nash_md/nash_md_trainer.py,sha256=VoVzzIItIFl4Xdu21rMcnZOZdJg9QfC4k241ouD36Cc,22253
trl/experimental/online_dpo/__init__.py,sha256=isId2WdLNSzmhNH0ROcASlg6MzFz2vaLArknph9fqRo,760
trl/experimental/online_dpo/online_dpo_config.py,sha256=rEBySvg-3tgk7wdDPaWk-SsP5_C2Tf5AONIiyXWcnk0,20802
trl/experimental/online_dpo/online_dpo_trainer.py,sha256=amiJtW01T0ch97lRWW5SS1zGET422bwsR6XpjqrLYYM,76184
trl/experimental/openenv/__init__.py,sha256=zqFBDVkvMgWNm1YweERd-epK6mEo-OsMhTVG95FYATU,705
trl/experimental/openenv/utils.py,sha256=9IKkACW-eTDmahpZiQh4aJW2fYL11acIENwJ8-IQRP8,5205
trl/experimental/orpo/__init__.py,sha256=1zrVxcEkXU5zewC8pesepKGG6z3hrJ3QUrEPJKEBoSc,728
trl/experimental/orpo/orpo_config.py,sha256=CGkb_2DNKXnovFFBbWKA58Ka_6CMMjOkT0-pZBT8yz0,8271
trl/experimental/orpo/orpo_trainer.py,sha256=nHiElQ26bpr8uPO697pEz2-dAGD6oASApYCXVFk_WgU,49426
trl/experimental/papo/__init__.py,sha256=mwIFsCHIovHIgwASDUyUhV-OdGCDcPt7L2JQnDPHdWY,687
trl/experimental/papo/papo_config.py,sha256=RBSVOlIr7MUJ0zRYeegbgZiojPXwszBTugRHUqrBfiU,3141
trl/experimental/papo/papo_trainer.py,sha256=OZfig_WCTxAqDbJauJ3PZFneby9ddygAof0QAxc0wlU,15685
trl/experimental/ppo/__init__.py,sha256=-_5U7moFV6t02_HVy9RV2ZDU2-zkGGyKY7Dqpx1h4FM,722
trl/experimental/ppo/ppo_config.py,sha256=W1gQIj1qKSjdj8ZpIVqhrmlT0Hs0_AKR2b_FVuTQzJA,6023
trl/experimental/ppo/ppo_trainer.py,sha256=6rj-wAUe58v8bAmH6tAI6YIgCkFu0zz56vk3Mkyr2go,41920
trl/experimental/prm/__init__.py,sha256=kzDPvKvQ6-5R3ar1M2a9Tc7MiwTfqurv6MVFmmdffzU,722
trl/experimental/prm/prm_config.py,sha256=5JrPdT_54w31WNpiA6QrekntZqZIlAvoKpsU-AxAxbQ,4663
trl/experimental/prm/prm_trainer.py,sha256=XJ9WwKeAH2MbDAU_8KD4NZwzNrAAOlfcPG7XTwjVGWI,13760
trl/experimental/xpo/__init__.py,sha256=zdzpaybRs9LcBsm39XB9sY4oenTYJUJDXMTksxasadI,722
trl/experimental/xpo/xpo_config.py,sha256=X6E6n_WthTu2bgdtpmqmxp-SRFyqPKFxaToa4qQJksc,1691
trl/experimental/xpo/xpo_trainer.py,sha256=Etm0hAl59YT6_rqCpLgjMtgqxEXb0Y6DQDEij3KyOGE,24760
trl/extras/__init__.py,sha256=Po_3-y5piG9oINxuL8hm7ATrU536lj4eL4ganNbLePw,611
trl/extras/dataset_formatting.py,sha256=2u2q4JiJJlYi84ugFUqX2a2u_gEVPK68l1WdepY8B1M,6375
trl/extras/profiling.py,sha256=thY1EHuh8CfDieHEVryUi0Ug2oqmmAnlVkDghwBrNDc,3268
trl/extras/vllm_client.py,sha256=j8aqDgVreBUNGBcLPoxvBFlfWuu7nKKOKIuORZkBZXc,23753
trl/models/__init__.py,sha256=K6JqEb6NLEDC_e7EDMaWgLBrV4GnxOFWrvJxcXUUVa4,1919
trl/models/activation_offloading.py,sha256=ss9xtBXF_2o8FuRI8T2-3HMB4kMcKYy2JX0nfLKFYCg,34695
trl/models/modeling_base.py,sha256=FvF6_rNNB0s7TXqHdLz7xYMUKqPk0i8X-P86FqE4xiQ,31398
trl/models/modeling_value_head.py,sha256=CBNB186PHZBF3NUGaotCJx0vGbYXHOqeUDyL84zmm0o,18883
trl/models/utils.py,sha256=CwEkuTu6MWvgS9ReQwlFFi6R03-hecWLkor4qIJnJCU,23167
trl/rewards/__init__.py,sha256=EUm-tCHoSvMVY51rfqLWhO1nrvvuQryWAcKM6P03XPI,1216
trl/rewards/accuracy_rewards.py,sha256=vQUlnMky4ifisuhSo6IfaeLX1qSi0bwdE4NL6qPZVbI,7610
trl/rewards/format_rewards.py,sha256=fCQhtw6lazljB5Kv20ZAaD5XraoxKqVDBvqbscmldYE,2211
trl/rewards/other_rewards.py,sha256=bjJ-tMrLSX8qIHsDy344luP48MErEzBEJVvZ4vmf8Y0,2633
trl/scripts/__init__.py,sha256=tDv5yBlfQh0ovYdrTF-xW7dLwbARJPhHT8JkgKs4KO4,1077
trl/scripts/dpo.py,sha256=FFz9OQN-NQbHTbaHzc4amyRfZP6jdpNmddNwfhHvOYE,6297
trl/scripts/env.py,sha256=Vj06F7nzIrZZwKjNd0enBgv2EhBoaBLGOVtIiqMY3e4,3522
trl/scripts/grpo.py,sha256=-Ufo0Gsw9OBYERYPw-oXJ-uBo_hYVfehRV3pqECvY40,7544
trl/scripts/kto.py,sha256=SC-fLkkUo7UBdZvfEhfiYeNl5Kz4fF5bgzAFHYrN8lM,5497
trl/scripts/reward.py,sha256=vDS0h5hv-vanyji8XQXeXt8H2sjRt6KEXEBjXNpRuMs,3772
trl/scripts/rloo.py,sha256=Xvae9C6SHvavfJeU7NMXNVvDhBkdBwpfcQC1nyWoplE,6822
trl/scripts/sft.py,sha256=uXfLxtR9aVnc0HITl7p7XhI1Do8hrEBzrbmfSWYk-M0,6062
trl/scripts/utils.py,sha256=M5_KHHK5VM5x_Fcc6JjDkymHXJUNyCwdqXQvxjHAMjk,18912
trl/scripts/vllm_serve.py,sha256=XKeRPt7hIrtnISwAR1gMGTTqHwM_gy9P2Yk9Lk7ragY,39352
trl/templates/lm_model_card.md,sha256=zq0dXorqEOnjHJ8wxwhI3LS2R6qiHmlcgPcVzliwRmc,2158
trl/templates/rm_model_card.md,sha256=O4lxwEsL9ld81LL7rwBwredxAeMDfWfpzwe-k7UYHeg,1951
trl/trainer/__init__.py,sha256=hxCrHTrhd6AXbdyVE8lUVHtXLQFs9pSB_1Uxz_WwM3Q,4600
trl/trainer/base_trainer.py,sha256=HfwfZYf1ex1OMrW6aFVSqAXVbZl5pVtwDLHq3tej5W0,2891
trl/trainer/bco_config.py,sha256=2SOfBMeorvRza8JzQ07I2R1uNeRU2_hoG0pyORENJwI,1334
trl/trainer/bco_trainer.py,sha256=PpRpMBOgtDV0wI7yYw1Azr86cqyAbWW2f5z2QwgVeN4,1362
trl/trainer/callbacks.py,sha256=R5PyiFZBegmK8tjSU1AEvoIhS5NZ8PIki3hnGhL1LPI,33177
trl/trainer/cpo_config.py,sha256=eiG0KYZ0fkVL16dkJj5ZxAKB4e5vm3WH_Xak813soN8,1334
trl/trainer/cpo_trainer.py,sha256=Moj7vt21eDrKdnKb4rXeIe1wJoAbDTbLoZwnYg5DUrk,1362
trl/trainer/dpo_config.py,sha256=-8VBzrWqB1MM1CzLXAVa9aqDk65wIJhupV_yoRZz198,26814
trl/trainer/dpo_trainer.py,sha256=rXE0hkV53NlXw8WdCiNQMUSEKQSsDuzqaQEOsimSxEs,102455
trl/trainer/gkd_config.py,sha256=9YxEC3WRmY_pjPdwatMfjYIMNgFgtZP_SP8-2J4xIAo,1334
trl/trainer/gkd_trainer.py,sha256=JK2VkY4m1q21fPQmPErYQHTr7P8Ta0m7YhSrBJBC2KQ,1362
trl/trainer/grpo_config.py,sha256=B3F6OgX0rW7a9VvaOfW3A6HkmLh91cy_YNw0yoNczCk,50518
trl/trainer/grpo_trainer.py,sha256=h31lEDhsNGNy4XNFidPe3TSjIm7XgRSCFDq6TNzzhrI,130311
trl/trainer/judges.py,sha256=Y4coFZVTJJ3WBLjQ3Lmvd_teOACGc2bQAqN2wkrPvVw,5096
trl/trainer/kto_config.py,sha256=Ag9MP_arUjS9YTFcgAN5eVqWb_qzN4AMerRjP7qxGUc,1429
trl/trainer/kto_trainer.py,sha256=Zz7SGTTjfPVD_R0TsW0I2VKRw16Vplh8DznbonarHwE,1458
trl/trainer/model_config.py,sha256=dY2bfTJhplEmck_0OOpmF7x0u_qoNF_NFnx9CM66y1Y,9359
trl/trainer/nash_md_config.py,sha256=fe5hkXQSDYOp_UV45zGlBVLy3AAfyaYYdyXBfL490rY,1360
trl/trainer/nash_md_trainer.py,sha256=SQKvPT4UHhHPleGfUpR2o0E3Vh-dP0ip_LZuv68h8h8,1388
trl/trainer/online_dpo_config.py,sha256=9ED8rSZzz5Y6njb1-V1eUmBtk4XsYEOtgAVxHNKvStQ,1399
trl/trainer/online_dpo_trainer.py,sha256=wWkp40ajwZS-oVrwuKZOH32zNqLbMg4r7RAOHtf0GuA,1427
trl/trainer/orpo_config.py,sha256=GtI6KA0BnYsdLcaCIvB6L79UaczabzBG0JUqf_vjo8w,1342
trl/trainer/orpo_trainer.py,sha256=Sj1yRMO0i0W37LVrZpbbFj4f7xYl2VSVDljIUF9MpZo,1370
trl/trainer/ppo_config.py,sha256=wQx-KnwmDDx__hLDerbvM5eT7VoNuyDjNrRRl9Xj8mg,1334
trl/trainer/ppo_trainer.py,sha256=u-97eddiMn5kx0_2nd1aakcIq48I8Nzxj-9kraA8NIc,1362
trl/trainer/prm_config.py,sha256=GbIl8hrXSqQRcyhlP7Kh-DDPkTWkQwIOs5P1oI82yx0,1289
trl/trainer/prm_trainer.py,sha256=6lGpMc73fnT0CPnQhnWvYsdxUcPuhppjBxf-fcjs3yA,1317
trl/trainer/reward_config.py,sha256=Re-ySjEjUDngnc6K9oJaM6mEv8JL4zx_tNeSbdNAu4I,8323
trl/trainer/reward_trainer.py,sha256=vNdY3g5YTAWQl8EvAB7Xxg2eVLffhTa5-c8h6IAsVrE,30428
trl/trainer/rloo_config.py,sha256=pF-YCUqY1USn92djGJzEL2Xxif4jwRDLpL4-GEsOa2c,32971
trl/trainer/rloo_trainer.py,sha256=t1-SwH-QcYGFoAP58krCva2i2JvyZ5bE_UgiCH9-LHo,88594
trl/trainer/sft_config.py,sha256=wm3jWA92CED2Q2vN9f9_38EdNyJzy53HuRGqndCydLw,14322
trl/trainer/sft_trainer.py,sha256=cQH-YAqRqnvYnJyAFrvLMAb1MTFwkYWKb7YoP1kakek,69731
trl/trainer/utils.py,sha256=ER83hs-RyYJNKocLEiEYMNTQo5V33wPhPOSWH5P56T8,81749
trl/trainer/xpo_config.py,sha256=Xl0cS9mIjtg8B1PKYjqTgn3rlPRVc_kVJ3mTbiOeWiw,1289
trl/trainer/xpo_trainer.py,sha256=GSrOwbQOYwIxgd3Rz--5IgTv7JDQJOUJ4QqHmZ5Wu-Y,1317
trl-0.26.1.dist-info/licenses/LICENSE,sha256=HZDsv3u4D_J-9nt3hfYhSAtlK4LkbHLYpXMLDbZb81U,11355
trl-0.26.1.dist-info/METADATA,sha256=0djZEMjREL6e0d1JuM8-zaBivA5WdpA-rf4SiiNzoAM,11388
trl-0.26.1.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
trl-0.26.1.dist-info/entry_points.txt,sha256=EiubuQrZSGOohRB4xVoiVAyWsPsOHPSVpbzSk8YB0x0,37
trl-0.26.1.dist-info/top_level.txt,sha256=QU12VhjlpAtMnIJqiO2np3RkTB_Eozt1d-g8QDf5P4c,4
trl-0.26.1.dist-info/RECORD,,
