textpolicy/__init__.py,sha256=6DZdg5ZwbqyPYaGrvITONlHeAj7XwCcsxHAwfnmNnhs,1710
textpolicy/__main__.py,sha256=IlGmjJaW-DJUC7yhxUhbwNOZA3GxkeQGkVbFdS3_wBI,136
textpolicy/cli.py,sha256=3CcJzrRlin1pgd6Mh312Xp3-EihHtTSvhakyYpdfacs,2107
textpolicy/validate.py,sha256=lxmegz83B_c-PS3cFHaaL3c9fgWrEaLsDLkpPFtSj8Y,3780
textpolicy/algorithms/__init__.py,sha256=x8eWBfSGOsLLWpmdKM-hiU6G3oiOaJyGDPKre5ylpPA,2683
textpolicy/algorithms/grpo.py,sha256=muX-VU4e6dESdaW_yHXDCxG2lC6RoaqNQWzmYcshQCI,51539
textpolicy/algorithms/gspo.py,sha256=70AxK1GHeCkOtzpBnE4ThA9_5PFf3dhSfVRBAK_MG74,24966
textpolicy/algorithms/hicra.py,sha256=f1uh3GDEpcg0MxgZZxi_q3q4uKvnu-FjNcXpavM91Ws,14918
textpolicy/algorithms/length_shaping.py,sha256=SFdkiXxUEgcVc19PBUyx34wrTN26D2Vjrvr6Ptbppu0,4813
textpolicy/analysis/__init__.py,sha256=cP1MUrU9xpNTffcx_JzZQuAv42bwnCwtPc6r-olCZx4,1316
textpolicy/analysis/emergence_logger.py,sha256=bK1p0fmNxl6w_K4NOxqmyUXOz4qFcLqJVvDpG1M_ROI,8725
textpolicy/analysis/planning_patterns.py,sha256=SrqdWcnOm6rZdWP6UrpXZFhejqvtcw-QeU0qmM1wXRA,3380
textpolicy/analysis/serialization.py,sha256=JE8OuqfrJeuTVYEJKWqHfFvNR2CH0IhSbPMbd_2WSAk,1928
textpolicy/analysis/strategic_grams.py,sha256=8QQgkVufm1B95jXSblfI9EyIohxnIIV5ozJCHcnwOK4,12609
textpolicy/buffer/__init__.py,sha256=bnSkX9Oe1ajau-yqC2PYNF4a4ELVP05zjlkDmIerXlw,569
textpolicy/buffer/buffer.py,sha256=mDie8ZiWgsjNJ4LiKyfpQNLzN1K0UICxI8XaqQacUMM,7917
textpolicy/buffer/episode.py,sha256=iNyVqeMLzOMauz1Z3fs9JUyL7g7IEC9t8GN1eypThy4,15875
textpolicy/buffer/sampling.py,sha256=aE92R69TQe8c5V0WL_EaKHLXSSxbI2wDlgvtR80fJDc,17598
textpolicy/buffer/storage.py,sha256=dYdROkL4KHx0w3XAqJFvRs6gRbYs3dAsiHqdMnwBMAI,9248
textpolicy/environment/__init__.py,sha256=TzhkXiAq10iC9PGGJ-gn2Bm2ttmJHpQ8d3Lxf_wUnNg,1685
textpolicy/environment/base.py,sha256=7Bh5tlFz20RC-iPQhnpv-zigHf8a6cEwBC3ISV-HS1Y,2829
textpolicy/environment/environment.py,sha256=o8-RY6wj5xrzDBp77HoY2At3XlBwvreF3DKpDFpC7js,1240
textpolicy/environment/factory.py,sha256=pebQo1_M3sMF8Pdc9yvpdXzRXfIDllKJoAQAjQbif0E,3124
textpolicy/environment/gym.py,sha256=P8Bi8PlDtcWWa9uLuCjkhZnYRVs-mg6iSJVSBkG99f8,3186
textpolicy/environment/task_suites.py,sha256=ssPnw2Y3eGYaskWf8dUab4rNu_Bx5L284b3VdhgvSPM,1544
textpolicy/environment/text_generation.py,sha256=4BQNkGs7jqRSvb23A-MjAxj1EV-XatPtEUOUYGosb90,32714
textpolicy/environment/vectorized.py,sha256=ZROtpmdbh1Oi8c0b0D_vmVzqI16Cp2WZTmkjkRbMoDg,9932
textpolicy/generation/__init__.py,sha256=qrzfOBupLhqAv3HaxcHXSN8Z7qmbmx4onaocUX6Dxcg,1612
textpolicy/generation/lora.py,sha256=RZKrgrmrREIObPDd40ZkrjQzBqs9W1ChJ9XilPve7wM,17942
textpolicy/generation/mlx_generation.py,sha256=-0j33JEKr9cT2FeioJ6lZnEQVwM8v2mic2JfAU7_Eus,58195
textpolicy/generation/reload.py,sha256=RYTdt9xH2d2Iccc_t4aoSVlpe8Suq_FC8DYuRh3TxMM,8420
textpolicy/rewards/__init__.py,sha256=mg_wL7oedL_5KLsnaJuPVc_ZHZqZKXRHg9ws2gSifMk,4769
textpolicy/rewards/adapters.py,sha256=Ffwi9eF_mx6DdCoRRmzl7TdhqNJycpz1TovJXa0XxXk,12843
textpolicy/rewards/basic.py,sha256=xlMMfCmLm3TrDJsxpJ-h9vlc-m27tTrvnZ-JGUOD89A,6921
textpolicy/rewards/integrated_system.py,sha256=eGK69J2cAfJD4GoL_ANivA8ZWpXHLtu6A0YoMwGTAzI,11243
textpolicy/rewards/mlx_batch_processor.py,sha256=97jFIHwqq75q7-LADVIBCbNqZJTU8jpbs8xcyUrJNfQ,16850
textpolicy/rewards/registry.py,sha256=azuz4HpbacBUss2-FS0Wji_FOUs7NLtwgpsEynqq7ds,11437
textpolicy/rewards/rollout_rewards.py,sha256=7bSkbBJwsb9MLOQ-YMutocpIgGI_AZdgFjRCh2xv0iY,13805
textpolicy/rewards/verifiers.py,sha256=dxOs9_krT42SQGCsBknOCqLqupnz0ripDxsQ6LRQ6uQ,11439
textpolicy/rollout/__init__.py,sha256=PKjY1NmsARTPmUwzNLSp2tFU4NvgJ4NUP1VPy2g3nxI,1229
textpolicy/rollout/aggregator.py,sha256=HNrZgHn1G4DVh8XSodPjKqNF9tH_XfFJKUENk89yrLM,4509
textpolicy/rollout/base.py,sha256=CuyzsHM_yn3eRKldLCcEDfmnqFnHoq-rJ7k0f-nYHw8,2919
textpolicy/rollout/rollout.py,sha256=HWKEFtMhkE4YBRECRBYA4o8I7pKFBWDoJW0WVf0VLkc,8881
textpolicy/rollout/runner.py,sha256=rDQ22Panm7pI86tmL1YCEbMQF0Mq0CNecz8Wgq66rXo,17714
textpolicy/rollout/strategy.py,sha256=Q97wxgq-FCienL15P1l-pXYEWiUZrh861UmtStj4x3E,7577
textpolicy/rollout/worker.py,sha256=aXOKRtkivKwDks8g8VtaWUv-wQMPR72idZxPuNtwmSE,6939
textpolicy/tasks/__init__.py,sha256=RoZkueebtIrEIXjaHy20nzogxe0B8Pf5ZT3XIRNU4wI,195
textpolicy/tasks/countdown/__init__.py,sha256=wtbntjIbK_4TERtAtsc7XvzNYwRwfm8l9D6XlicCxE8,626
textpolicy/tasks/countdown/dataset.py,sha256=3Gxzf1HMp_STr20Lxh7yz_2fGtZaKCQiZUcq4iehAoI,5348
textpolicy/tasks/countdown/evaluator.py,sha256=fZ30lukzmcWfz1F4T2XaTYJK00QhDpwLFdQC-GqF78s,5957
textpolicy/tasks/countdown/prompt.py,sha256=7JKvzek3jQ5AkkzbaNuH7GwIOEgRd7f2gW9VVf0T53s,2639
textpolicy/tasks/countdown/reward.py,sha256=ME_ogLrogftBPqYnPVcEqcLoRs6vtSWEuUMA8qfIeC0,1555
textpolicy/training/__init__.py,sha256=8ZHic53Y5CNMjL8hclM_bpjVrbYraZPvjRBfp6ov4ug,650
textpolicy/training/metrics.py,sha256=fmY1ZBdyEgYrfH18H3fOZ-dieMtjVNzjxjdxd7yo7OU,7582
textpolicy/training/reasoning_stack.py,sha256=9dbJ3z2b3nx35i9Ais3T2z6bOFiS8P_3kO0qRX7q8Bc,7235
textpolicy/training/rollout_manager.py,sha256=ETD7WTbbaQ8uUzrHPBCDX-PawmEJfSK6Kd5N-dvIZRY,2328
textpolicy/training/trainer.py,sha256=Kx87pAVgrbdF_o-1mnIZSKPRvtrN-H51oVQY2JK2-vs,47494
textpolicy/utils/__init__.py,sha256=v0ji-jnegGRydzmAOccKY4XC0nkBbBZqdHXzk-i6ers,1220
textpolicy/utils/benchmarking.py,sha256=YDN24vU8SL_EsrANQWF1qbmXtfhF4Woj8yjez-h-Io0,18682
textpolicy/utils/data.py,sha256=KJoPzYWYVAJawvDX1BHzwBZEpCXLSBC168rjud7MSB0,1413
textpolicy/utils/debug.py,sha256=ir_5DF88_yZbU43w-o_o05EivgPv9AgNVRovL-adNIE,6139
textpolicy/utils/environment.py,sha256=LyYQgpZVfEDyPlD7774_AHR9crOC6NNGjd6J37ltLGM,13319
textpolicy/utils/memory.py,sha256=H8mfUY52iU5VRPhOLPdanWvBgEGLtLCoUE0xpJIMcfM,3391
textpolicy/utils/performance.py,sha256=YzLMT_bAPs9TnVwmrPvWOEwi4UAy5Bmbr5zTpJacmGA,17823
textpolicy/utils/timing.py,sha256=GTlbPElgtDhD03F4vfH7JAf8DSg9vjh1yGAH3gKhWo8,6238
textpolicy/utils/logging/__init__.py,sha256=YeJ18H7suPzYPgXlfSsE90GaAVF_5lOcbGCDCy8tvuA,512
textpolicy/utils/logging/base.py,sha256=3BBg318dEPNIHYtoJnFiJcktvS5KMcIUNXBKKfn8x_g,1304
textpolicy/utils/logging/console.py,sha256=WIcOO-tT2FhrqKhWO89qSSNmLA06up_KenrN6TGoyo8,1680
textpolicy/utils/logging/factory.py,sha256=vAkMShn7bnVRDuZNOKaVXNmF6XPUNeqaFFPF4dZw70E,3920
textpolicy/utils/logging/multi.py,sha256=kIxuoXiZ4nf_p8JlnzYxtqA0r82LJaqHnO5mEHlJdgM,2501
textpolicy/utils/logging/tensorboard.py,sha256=aY9YMReSJkWEhy6SdAAUlHSB4lzDecivBC8K7CZPcO4,1949
textpolicy/utils/logging/wandb.py,sha256=U4pxuZNOz2l8XiymK8OFbCpiRTBOLNtnZakC_udttfQ,2206
textpolicy/validation/__init__.py,sha256=KcyppNi91w0bF51gZ0ykUIKEiF7z6TT37uuavMFScnA,328
textpolicy/validation/logprob_validation.py,sha256=G_CCy5NRDUTmo7WZIChhNVM3NtP1VmWAjdd5z6TIvos,11749
textpolicy-0.1.10.dist-info/licenses/LICENSE,sha256=AYDHSNRbiqZt4HHH1gaOoQ2hjYjK4bqw4Vd9UyKzx18,1065
textpolicy-0.1.10.dist-info/METADATA,sha256=QxaJOxatmVbjKU-60-chDT0GluZs9Vmdpb4KJQPfVy0,4120
textpolicy-0.1.10.dist-info/WHEEL,sha256=YLJXdYXQ2FQ0Uqn2J-6iEIC-3iOey8lH3xCtvFLkd8Q,91
textpolicy-0.1.10.dist-info/entry_points.txt,sha256=d0Cj5boT6k_l_beVPWPt9LZMllsN4kbIUmsNsn1BANE,51
textpolicy-0.1.10.dist-info/top_level.txt,sha256=Ww6_QEF71dI-AYCaugiGeGcgMoFAixSOszSoRsyX-E0,11
textpolicy-0.1.10.dist-info/RECORD,,
