trl/__init__.py,sha256=YszQMxU4uXNvK9hLbKa-hQx7JUcDD634ATWn-hdq8qk,3666
trl/_compat.py,sha256=AFjmSaDjS6zczDdYOgF3ps9W_BV4-NTf12Dk7mH8hX0,8749
trl/_lazy_module.py,sha256=0KzILrqySOIHVJ2fRP0bVRaBEasS1YRqKOwkeEIg61Q,3264
trl/chat_template_utils.py,sha256=hw77VBnjYRhlNm4OnmMyVtn7c6GH1wFn1yHN5R1N_SQ,24925
trl/data_utils.py,sha256=yT-kUlxrkTwehDt3UxUORqnsa5G3IU0uc62kj7pONVQ,42423
trl/import_utils.py,sha256=M4VFbBRGgcrkdCAKwRQDWPEooSJSIWvk4r2c6kbVmBc,5082
trl/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
trl/accelerate_configs/fsdp1.yaml,sha256=FBw8i6diLwfcUI6Uu7T-UTpd7niY062tLsCFMLoT0c4,725
trl/accelerate_configs/fsdp2.yaml,sha256=zg1L3kVDJb7kvuxIPaqMN6mZQFD2mvG8IxSRmkY7dDk,627
trl/accelerate_configs/multi_gpu.yaml,sha256=yDX-SPo8qY3SW8jsf_53VJX1GwIV20wmRPBbCKf4_8I,321
trl/accelerate_configs/single_gpu.yaml,sha256=4MuOZIjHNir2adOzaoOgBwD9IXXRbPNPzBYVW-zkc7I,316
trl/accelerate_configs/zero1.yaml,sha256=fyUlyzQ_nhP6oamOgOBM7MDZMuHvG4xZfm_-2wnuYTo,441
trl/accelerate_configs/zero2.yaml,sha256=kW58rFIjO1Jz0-TWjg2zUHO5BUBHI4TPFIUHb2M-WiQ,470
trl/accelerate_configs/zero3.yaml,sha256=VN3HDSxEn_WCvYpML4thWO7cpr2N39VwAJjMvPtwfxE,498
trl/cli/__init__.py,sha256=B8PH6sNvyPB70xWMkMH8tFDDPN0gtvFf58IRpER_3mc,656
trl/cli/accelerate_config.py,sha256=UP1H5tldCUyK5gMmXg_hBhAF3XaWsyZqt8hVHmozneU,2008
trl/cli/accelerate_launcher.py,sha256=U0YogVSKf7zcYMQ_gEyA2DRkSbRxmPhx7G1CYsVXmLc,1897
trl/cli/main.py,sha256=Kw5kJozs97cTTUNjz03MXZs-2SpuR8W45QVXcNy5vhQ,1778
trl/cli/commands/__init__.py,sha256=gQlZ1wkQosdWAgJELMPCcam5S1wpyElar1zhJ4FK-X0,1739
trl/cli/commands/base.py,sha256=D8UYEyaCljCKWiUSboowzA8TWFqTzJIRkRZ0S0pyxLM,1885
trl/cli/commands/env.py,sha256=juELnDlMfUJG_RSEM4iPdcHNcees3Sm2G9056zTO83U,1137
trl/cli/commands/skills.py,sha256=amCdxknbhyeYXKhBYahW0_ws_dkFq6gOQJr4-rciPjc,1621
trl/cli/commands/training.py,sha256=5aDCEwQW4rTj2aIny13QUKMByTtsjCFeNkmZTajAwBw,1908
trl/cli/commands/vllm_serve.py,sha256=yCxXiILEBt02cWQNVyNXuYFTZqs7cTnOFhL8GjETlTY,1356
trl/experimental/__init__.py,sha256=FMF_-llsmlfdSVPb8RfoW4z6zX0Co7J2jub6IW2bKyE,1310
trl/experimental/merge_model_callback.py,sha256=UG2Yr0VJsYCkrDGmWjwssAvTNwMgJTadpeExsIpdQmg,13850
trl/experimental/utils.py,sha256=qySmCmwfk9oTTEYJko9vZUIDPqgah9xCnKl3uWOD9sQ,27293
trl/experimental/winrate_callback.py,sha256=rdcVQ7joSOSafYsQn5zahtDYj59hP0wx8wQkuiavQgY,13164
trl/experimental/bco/__init__.py,sha256=X9vUxV2PcrTORo0CEALpq8EoHXtNTavAh0s-GVBDYio,682
trl/experimental/bco/bco_config.py,sha256=WKnGVhvMHI76ibCEWQeuY_JmZsA4EKb2GEJhF_IQ6yw,7905
trl/experimental/bco/bco_trainer.py,sha256=o6B631OuUsrbNLYN0LF9Zc7U2LA4jDuqo5aBnYZEfVk,71685
trl/experimental/bema_for_ref_model/__init__.py,sha256=YSMOnS353SIRvV4_NS-Y-t0sbD6snBcbELbG3ku2Nfg,683
trl/experimental/bema_for_ref_model/callback.py,sha256=RYC7doi9utJa98wKMT0NP8pmY0rITQGISfwZjlQm_Vw,9641
trl/experimental/bema_for_ref_model/dpo_trainer.py,sha256=4YrnaxULpR6TSpjWLvOGoLBziWQNGgWhNqOjuZT1mHg,1181
trl/experimental/cpo/__init__.py,sha256=rO0s9KRAaIsLOMJo2sweX51LkAK4QsLOeDDGIonMFLw,722
trl/experimental/cpo/cpo_config.py,sha256=Iv8LR_ZmwaLTBUZvdOCZJe__UgOuuQEfT4xjWMEy5nQ,8826
trl/experimental/cpo/cpo_trainer.py,sha256=vu62kxy0ZVrEgqLtokrnIO5tKQ7fbk2vVrITZ2q2RKs,49140
trl/experimental/gfpo/__init__.py,sha256=uP2ol8mB0vbkaDcIXCAAwN_HzW7ulo0c4HGqqlevafY,686
trl/experimental/gfpo/gfpo_config.py,sha256=Zz4vFZ9vAy9kD47EN3RgoSJZtW7_8JnGn35sgHmZzNw,1325
trl/experimental/gfpo/gfpo_trainer.py,sha256=sU-Eypf0eoVsr2MXiI-XZcT23FSMX-rKMpZIIBfZWNc,21970
trl/experimental/gkd/__init__.py,sha256=QO5Yki2ia5hOep3fpQArdI3KMnpQkIV1FE0WiznkZrU,722
trl/experimental/gkd/gkd_config.py,sha256=iAdbdxzY-5qmWvTJAPHg_TthR3E_cG61r6jEfNGxsrM,4900
trl/experimental/gkd/gkd_trainer.py,sha256=iIQ3pMHxZvrvbCcZVC666kglG92s2JE5OTbL0q83lvk,20752
trl/experimental/gold/__init__.py,sha256=FnYqi1_ahqtra-Zj2iECHAfr7AHBXQxYWrDNhK-a3Vc,728
trl/experimental/gold/gold.py,sha256=RYgHSL6f1c4hsZ1RoXczQz2Y00L1R0noAax-QONl8UE,5399
trl/experimental/gold/gold_config.py,sha256=cUQb5iIc0lza5vYJ8a8yxAvP0A4UAgN08X3RxCtyCxY,20007
trl/experimental/gold/gold_trainer.py,sha256=_7dS28dM9AmsczI4RSwMoJIdYV_rO8XTLTrHDcvqgz0,101864
trl/experimental/grpo_with_replay_buffer/__init__.py,sha256=KPrhB5rG42642HmeBRcnefGPLBICYAdd613MaDGFTys,770
trl/experimental/grpo_with_replay_buffer/grpo_with_replay_buffer_config.py,sha256=UW6s4umTNDvsDQ-2lHMOAovD5Ro1gGlBohJNnuEan0U,1372
trl/experimental/grpo_with_replay_buffer/grpo_with_replay_buffer_trainer.py,sha256=I4uv385uKMzcm_Y-xvrzyfCznGm_m8bEQxU_aK3Lftg,37031
trl/experimental/gspo_token/__init__.py,sha256=ymJxlrn9cMOyLPGHBq_7VKfvGrhbXYl1ZPi8OyGjSbE,650
trl/experimental/gspo_token/grpo_trainer.py,sha256=kOIfJq-9gj9wp7FQuhJGAqK_ctEU7rbfed0PO9D4c6E,8262
trl/experimental/judges/__init__.py,sha256=-Yk-310tjPCC4xn4AvU_TJ6TdL_XAWfCFFfjiDbvqNc,986
trl/experimental/judges/judges.py,sha256=ReI6FNlWdH0cQhH6QYq-bfZIoQfKwYzAXiyMDYuMWzM,20871
trl/experimental/kto/__init__.py,sha256=K-M_Blc_9na1bQDKla6jKJKb7fPKxSUmiJyRHNFuSu8,722
trl/experimental/kto/kto_config.py,sha256=DMJbMw0p4LFmSRSLR4SUHo6ERjhxnkj0pmxcmejuXJg,6572
trl/experimental/kto/kto_trainer.py,sha256=fuvXaJiBKoagKizl149rR9Tk2cZQDOWX1LSaYOPzkL8,71380
trl/experimental/minillm/__init__.py,sha256=xJRoMqech-1OcFwcP3Ut-wV7DlYm6z6SXb455kHOlpA,746
trl/experimental/minillm/minillm_config.py,sha256=ShF3_VvW1JsPZ4FN0doDXXgvPE52L2i6x-rQVJ6KG3Y,6602
trl/experimental/minillm/minillm_trainer.py,sha256=RWREg5ev_vrEJ6jkbdtHeNR0oEbVRIEIFtVeWOoW5-U,20117
trl/experimental/nash_md/__init__.py,sha256=0-fTu0AiobRY3KTKO6l-HMW_Me66vuaF-l7ym62oRXA,742
trl/experimental/nash_md/nash_md_config.py,sha256=6GlI-rW4umHCMU2ykEwLztRGvd8hpHJlznEu7KzAsH4,1872
trl/experimental/nash_md/nash_md_trainer.py,sha256=J4oJjVGtsl5iTSxfNT7HfQVYEDoa7d3MHHg56uwpG50,24691
trl/experimental/online_dpo/__init__.py,sha256=d0PLdODeA1bPSoXLlGWEAeA6XwGiHCd1isltzRGAVOQ,760
trl/experimental/online_dpo/online_dpo_config.py,sha256=1WrNPgkOE4HA4gR_vdvVMjm8W9YQfen7Bu2lMIKsR3U,20788
trl/experimental/online_dpo/online_dpo_trainer.py,sha256=hfGkzaA5OPOWTTdxi8mhb79DDDJmobYXyIDrLyr9aAc,77912
trl/experimental/openenv/__init__.py,sha256=LlzcnV_wiUFOTBh64phVNDb6dpKr8A93i_K-ZntlysE,705
trl/experimental/openenv/utils.py,sha256=uXI73ca6zidt4F7qrDe2jralGh8Z1jmLl6Yep-A3zKY,7889
trl/experimental/orpo/__init__.py,sha256=raFCz1dhCGKRjdQREuxEWY_MwXpIA1GvpZXxsqzv1EU,728
trl/experimental/orpo/orpo_config.py,sha256=PE7RUY5yRVTM_cVr8iP3Xkujb05zi-BLpw-DQGR9dY0,6290
trl/experimental/orpo/orpo_trainer.py,sha256=tATnxH5gOrfjlR2Py6tSLdBegYzH9EjDi4mYvRBVEK8,48084
trl/experimental/papo/__init__.py,sha256=qP04taTkxweuEvOll1BfSFU5BlaZyv7OIT-i95PE8CU,687
trl/experimental/papo/papo_config.py,sha256=YN5qFmankCNVYDgEEQ0TRQDo29FqumZGRxfjtIkZb1g,3141
trl/experimental/papo/papo_trainer.py,sha256=mDb0UF9wJskM1cpblxUd0UwbwnvNK8Wo_KZibGgnkXU,15685
trl/experimental/ppo/__init__.py,sha256=7jMTBOcEiFGAs6rYdH61xzg1RWTGfBC_r2YFd3DBtR4,990
trl/experimental/ppo/modeling_value_head.py,sha256=TEUbETl0Pjeg0y2jBG1kl4YnurlHVn4Un1dPGTTk6O8,44279
trl/experimental/ppo/ppo_config.py,sha256=ts-WmB1kdQmtIfFUTCPYbujzqvgGe1raPjo12OmSrX4,12575
trl/experimental/ppo/ppo_trainer.py,sha256=ZWSJLrRCJYbs46AA2DF39a45MJ6VDWJYpwOGF08mlzg,49336
trl/experimental/prm/__init__.py,sha256=D5e_7PoXs3nTMVQaN1rAGvIUra6cQDfOyFViUbZrNR4,722
trl/experimental/prm/prm_config.py,sha256=ynh9rVWhqeUin9dTZPnWiXXRPshpQQs0fG3NtPkM22Q,3800
trl/experimental/prm/prm_trainer.py,sha256=UvgcnFDe74qS0o3YsuwyfXs2T8Y53yJPtvoeAEvu8sQ,16240
trl/experimental/xpo/__init__.py,sha256=QcEIbvNKqd-1mR_mHH8gmtE5UGhZGBFG_9bMYLBhuvI,722
trl/experimental/xpo/xpo_config.py,sha256=hWuv1yNMEM-KBFJFv9x_8xu-NhsU8oblvqQLLLF68-Q,1691
trl/experimental/xpo/xpo_trainer.py,sha256=UZMgVOfE83d_VNsDi9SZkDs-Yhx9XxU8YtBU0qxd8po,25201
trl/extras/__init__.py,sha256=V1wvJ_Ee6Ro58SbMXQqO7FG-_jvCpy6kB31_7Wtl68A,611
trl/extras/dataset_formatting.py,sha256=D_8NqUiZ3aSF6bl3qnopEOY8suwH3YEhJ_W4gljSXA0,1285
trl/extras/profiling.py,sha256=kdmjghftaN1onlnUr-QIzJPT71a0BTnufQm4R_J3ZtQ,7368
trl/generation/__init__.py,sha256=aAYDsVEN0dDYZMZaeZvBhAohos1fQX_asTGHJrjmFUE,828
trl/generation/vllm_client.py,sha256=qvnk_iUdqtwY9DRkbekp65hhaahl1_kSUrBv_yLd-pY,26492
trl/generation/vllm_generation.py,sha256=NOG7mc42CqK6K64RbERF4QLqDR8NssAJqL34ll3nZQ0,42240
trl/models/__init__.py,sha256=AdtqJlv3mNNGldTZRmm1-0Ymm0yMrpwnXN0ilv0gdY0,1219
trl/models/activation_offloading.py,sha256=ZKnl22gUmvG1FcJrXQZJGyHK_bviFyrqx9mk67Rnxis,34695
trl/models/utils.py,sha256=cNmmlLozdGnr48Q0YU8XmXEsU9XPmTNXd9k5H-QSt0I,17495
trl/rewards/__init__.py,sha256=IrGRuDNDLkWTJxsemd_WQtWcl8pD3XuB5WkrxL2FOHY,1216
trl/rewards/accuracy_rewards.py,sha256=-F7ePyttFOuGEZarzFmwMsFi-WhLJMFh7S_iso7AoWM,7610
trl/rewards/format_rewards.py,sha256=XKId9E_3opkCtiELkYSWKxb8QnYJv2EGLuT9QOcmbS0,2211
trl/rewards/other_rewards.py,sha256=fzad9ow5yukVkdfan3hMWY7alEv2E-4Q7BPckNUcgaQ,2633
trl/scripts/__init__.py,sha256=uBELpz2YbIG2YxXa5ioNhrWE0nqoior8hkFGP3ZzYe0,1077
trl/scripts/dpo.py,sha256=DQ0ey1blQRaz-vYgCuiyXLcnNte5Z0WAYQz-y0oLu68,5979
trl/scripts/env.py,sha256=1PbnrAf9Xl8O4C3cMyuBCycuBmIaKXJTJaKUi9oL5NI,3522
trl/scripts/grpo.py,sha256=4hTKtuDtw2iZe8N-XO3e8xPQJgyNHte2qQ08MKoaJjc,7544
trl/scripts/kto.py,sha256=kpoel9YO_0X-ypn3lDa_0o9uTWAD9ezjFN0BA3bBzCk,5497
trl/scripts/reward.py,sha256=86ZTxcazpUiz5PII7C7mgWxkd9-L1ac7TOdhs2Tp_q4,3772
trl/scripts/rloo.py,sha256=Pxkj5udjCGGvaezAYWdDt2oGC9OWd6kOGbie-ZiluNM,6822
trl/scripts/sft.py,sha256=ov0qy63qvp7q3s6HoPdCb57wxlGuP0K8dEQ-8qeJrWs,6000
trl/scripts/utils.py,sha256=vAdRpl7bBMX-vFjNXPBCXT8cKZwaq2tTibF2DEEFOzU,18575
trl/scripts/vllm_serve.py,sha256=lNe0bTFjxZ0WtqnX7NIAeAqNTDVH44THtlgIv_WqPF4,43654
trl/skills/__init__.py,sha256=ztKZxcsQqk9gvPe4pV87ZUIPgPW3LwBNXW2-Z9vGwNQ,740
trl/skills/cli.py,sha256=EOZ52Ykz-p6CO8Rb6dL39up52yLEehhf81n98VWH2gQ,6871
trl/skills/skills.py,sha256=3x0WadVnYSNnkJuTAlMU4QwSK_rkayeBHIhI4m6A23M,11834
trl/skills/trl-training/SKILL.md,sha256=z97EE_zwMPKSBQQsuMVqDFQE9jeRmDlwTX2l0EyxlY8,8871
trl/templates/completions_dataset_card.md,sha256=dw3t1mm7WyMWTTcRyttemOWcXo86WLc7BTfRV1YIJS0,1241
trl/templates/lm_model_card.md,sha256=GUAzW9rFpN6Fn47_8wrFHtEarz3ZZTlQtT1gvkIJg74,2351
trl/templates/rm_model_card.md,sha256=pevYy0_B9OThscj5WcDXk_0Fopulfa3IGeHSAr8NwLM,2143
trl/trainer/__init__.py,sha256=TyL6JviatotqQIP4JEEA2XulARdn9guwch7Qmf5bFgs,2577
trl/trainer/base_config.py,sha256=fnR5DCVNT3wWNWmbZcmGxUyNQaWkT--GoV_xHpn2V4s,5758
trl/trainer/base_trainer.py,sha256=ITaSXoSLht97Btzkfhww-R8vjWQrd4X0i2Rq7JUqy6I,3286
trl/trainer/callbacks.py,sha256=V3r1PHsSknFdK0jgb94nAwIPSz98T_3aorIvtSr2Zbs,31337
trl/trainer/dpo_config.py,sha256=qSALqGPDEbynC2piHaXpi7PmB9p_RizzTk4Sssq6G6g,16944
trl/trainer/dpo_trainer.py,sha256=5xNyqcIa8CpOzBzg3pEoOlCiVhY_veVupTVN6G1jkkY,82043
trl/trainer/grpo_config.py,sha256=9vbcXZdF__L60Lzl2hghPks-UKtAd8BGRfadlE8H0g4,52596
trl/trainer/grpo_trainer.py,sha256=ehEmBM1RGGxzgXtNAKyeLXUtZ0uOATWBOVsncy2TIcc,127490
trl/trainer/kto_config.py,sha256=g9ZzUlnwRyvSKcfA3pNI-ep3u4b2kTAK3E3Jkv4XurU,1429
trl/trainer/kto_trainer.py,sha256=xlFQtdF_Hx-bL9g2JJ2LTmsT-NSarjpfKt9fVKBvvuY,1458
trl/trainer/model_config.py,sha256=7k27sX-GRpF3tum8nccoa9jHX4LVu_ZLA9hwa6wWh1U,8813
trl/trainer/reward_config.py,sha256=ksbjk5GgqNhn96v8ynoH3Mq32sN7dWGUz-hV3_E6ZF0,6990
trl/trainer/reward_trainer.py,sha256=JtEtc-rd2Ew815kUPi-Dm91VSs8jpGFzqd7sqDg3xKM,34874
trl/trainer/rloo_config.py,sha256=DD4_xyFXpY5tPKhblrYqY6PsYLnOpes3KNlgnxZinU0,31264
trl/trainer/rloo_trainer.py,sha256=4JhUeOHIaY5uH9C5TI6-I1ltBcLV_QfJAkS8BiHjdws,77940
trl/trainer/sft_config.py,sha256=pVWTPHIxUS0sSD2Ko9nfY0Pl2t--1t03n43-ALVTHWE,13063
trl/trainer/sft_trainer.py,sha256=2_vvyJNFtfhMigIlsRCyfU3QQ_rbP_ObNm4La0I3xsM,74628
trl/trainer/utils.py,sha256=4aas1CwWn3MQVrsCsU8AlgCMbe-XeCLzJcGnvx9kXR8,46583
trl-0.29.0.dist-info/licenses/LICENSE,sha256=G_YUsf3ED700SqWNANF9X9DSUuozOgW-AYo4lZyLKZg,11355
trl-0.29.0.dist-info/METADATA,sha256=xTmZN1o_pmIGOm5tV30OwQs_ycbKYbUz_bwo10aDkts,11299
trl-0.29.0.dist-info/WHEEL,sha256=YCfwYGOYMi5Jhw2fU4yNgwErybb2IX5PEwBKV4ZbdBo,91
trl-0.29.0.dist-info/entry_points.txt,sha256=EiubuQrZSGOohRB4xVoiVAyWsPsOHPSVpbzSk8YB0x0,37
trl-0.29.0.dist-info/top_level.txt,sha256=QU12VhjlpAtMnIJqiO2np3RkTB_Eozt1d-g8QDf5P4c,4
trl-0.29.0.dist-info/RECORD,,
