trl/__init__.py,sha256=IxOUfQnfHEVa0aN_c6X63uoeGZ9op4evfwZbu748fRc,3740
trl/_compat.py,sha256=iaDD6BjnJv5hdC0JLI8kMQ9yYnk_uGslxyNi0ynv0TM,6698
trl/_lazy_module.py,sha256=0KzILrqySOIHVJ2fRP0bVRaBEasS1YRqKOwkeEIg61Q,3264
trl/chat_template_utils.py,sha256=oMv9BKVXh8cWcmL64aBl1iBwdoQHJcgyvYFaQVVWVvs,44102
trl/data_utils.py,sha256=zp6_JqPqRpEQFgn0WgUAm7o49Sa8o4xj0vOqw1a9viw,40789
trl/distributed.py,sha256=taWLPat2ztmNxH02apimEls2Aj1TE-JJPa6xrGCTuPI,3157
trl/import_utils.py,sha256=BK_nNk_8ZwZGaIRIMK-iP5J_XZjOO1PFPhbruxttSb8,5184
trl/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
trl/accelerate_configs/fsdp1.yaml,sha256=FBw8i6diLwfcUI6Uu7T-UTpd7niY062tLsCFMLoT0c4,725
trl/accelerate_configs/fsdp2.yaml,sha256=zg1L3kVDJb7kvuxIPaqMN6mZQFD2mvG8IxSRmkY7dDk,627
trl/accelerate_configs/multi_gpu.yaml,sha256=yDX-SPo8qY3SW8jsf_53VJX1GwIV20wmRPBbCKf4_8I,321
trl/accelerate_configs/single_gpu.yaml,sha256=4MuOZIjHNir2adOzaoOgBwD9IXXRbPNPzBYVW-zkc7I,316
trl/accelerate_configs/zero1.yaml,sha256=fyUlyzQ_nhP6oamOgOBM7MDZMuHvG4xZfm_-2wnuYTo,441
trl/accelerate_configs/zero2.yaml,sha256=kW58rFIjO1Jz0-TWjg2zUHO5BUBHI4TPFIUHb2M-WiQ,470
trl/accelerate_configs/zero3.yaml,sha256=VN3HDSxEn_WCvYpML4thWO7cpr2N39VwAJjMvPtwfxE,498
trl/chat_templates/README.md,sha256=v8PEH0mx1RoyJqFnTDL5pKnUkqzooFNl3Njbn1QWav8,13023
trl/chat_templates/cohere.jinja,sha256=kMM67hSqKiJhJ1FtSO6RhMm5B0XUoExIRiHsLoL7cSw,1318
trl/chat_templates/cohere2.jinja,sha256=IUfEdPQbUitylvdGkrnzHkX0mjFGWWBXap0yEznFkVo,3239
trl/chat_templates/cohere2_training.jinja,sha256=flg2p0wB0iUEMGJz-Ke0n5RPa5YO_uZ2CcB-7wqbopU,3588
trl/chat_templates/cohere_training.jinja,sha256=X5cYv-OhlFNm6nkrlxTkKqWEnx1BoQk8LOTaSnc4OZY,1626
trl/chat_templates/deepseekv3.jinja,sha256=Vjsc59YdUKm0x0OakSoRFvCVtxLfW15NPhEWBJh062Q,2765
trl/chat_templates/deepseekv3_training.jinja,sha256=qttJQgBMGG-bqX0o9lPX8uDcIOQnU1KkhvfK--Tde1E,3379
trl/chat_templates/gemma.jinja,sha256=7NauUT_hA_DrYuirW_qND-RcEHT6OYsInJOn5wwVz9Y,591
trl/chat_templates/gemma3.jinja,sha256=feHFjiCO2kbpx_hjl9837EmIOu7OOfuWHgprJAiN08Q,1532
trl/chat_templates/gemma3_training.jinja,sha256=lZslfn_BYD-MrpyYkOYvQ9be1sD3K5tzxBBqTOqglvw,2722
trl/chat_templates/gemma_training.jinja,sha256=-CXemugOrIqJ-l-eboCt97eauGAlZJB-fEHcFTFdBKs,1363
trl/chat_templates/glm4moe.jinja,sha256=RPgVhovwL6RY3S90GjOARvS_RfOY620Gd2Zya52WzOM,3242
trl/chat_templates/glm4moe_training.jinja,sha256=jJpWJxtRvMQC5hjieaOBcwKWeu8u91oOmCalC2Y2IHU,4720
trl/chat_templates/gptoss.jinja,sha256=pMmRnLvUrN1RzP_iLaBJJksbc-WQVfpYgRqZ7718gUY,16738
trl/chat_templates/gptoss_training.jinja,sha256=at2nzqD2PvFJGL5_JhALMkUlthhajwaTKRQ4j_qlLjI,17057
trl/chat_templates/llama3.jinja,sha256=ugOhIdCXhZx7W5zQOvmar-lSdSENKHb2Qq2ZKaFQ8SI,389
trl/chat_templates/llama3_1.jinja,sha256=4QyjgbHMxc-dtS43HztmUVdsruCmMLRS4oFrLUBNS2U,4614
trl/chat_templates/llama3_2.jinja,sha256=WBb84QRE4DwunuHvikoephrn5p5DhhPzsXtp0EJiI6Q,3827
trl/chat_templates/llama3_training.jinja,sha256=nc6YHilUz3fU0K0tus-ABqX9o0oL30kjB1qTPQi2lHA,863
trl/chat_templates/llava_next.jinja,sha256=LBckOpd_0GQ_tUmlCajiaE9FUX3w-fYI1Yk7cZ8WVp8,663
trl/chat_templates/llava_next_training.jinja,sha256=rgunlIj3wiWuadwz19O6PCOxlzwE2CzdXz9M0WUQl0I,980
trl/chat_templates/nemotron_3_nano.jinja,sha256=q3gTw6vdnLZVkFpBByiybHiE7KRd36uNn5MVU0haeGI,10504
trl/chat_templates/nemotron_3_nano_training.jinja,sha256=9SpKcCkrmNtNG59ppZVGpD_F6GA6Z5R4GXOj5YIb1HU,11158
trl/chat_templates/nemotron_3_super.jinja,sha256=V1-3T1TtJk35BH0OzOPJiTiq6VP7T1A1ZnVwYmTLtoo,10771
trl/chat_templates/nemotron_3_super_training.jinja,sha256=04WVhURFdAkCWdQDymX3Gklrd7C1DzEQaqmaJfXKppI,11585
trl/chat_templates/nemotron_3_ultra.jinja,sha256=gnU771ztxJMsHtUJtcmhK-aA_YbRrbZbw_c5jRHI7rw,10152
trl/chat_templates/nemotron_3_ultra_training.jinja,sha256=1hzKIwrE-BN-dOiNc9imSeTDpxu3m4KSWhnPbcUqbH4,10969
trl/chat_templates/phi3.jinja,sha256=3K7mbfd7-7eJ7FQf5xMhjaMCJaUm8duXE4_DnubcVqo,407
trl/chat_templates/phi3_5.jinja,sha256=eNl2pEK83i8L4Vqvu44wUOEQT4ZzImb2hAMlG4mYKpA,430
trl/chat_templates/phi3_5_training.jinja,sha256=p2qWUal4Wv4mnGuRWY1V8Dq4rfPYSJpKnI70MhKLfAg,971
trl/chat_templates/phi3_training.jinja,sha256=8At3TFkzEp7gpyvtNV2ZR8sJ-AY9bPI7fbcbM7XqIWI,947
trl/chat_templates/qwen2_5.jinja,sha256=zY6UOfBXCFb9cEcL-IievYtdEQcgf2el77RuNCMwUn8,2507
trl/chat_templates/qwen2_5_training.jinja,sha256=DNhvuA9SCIXjUECo3zIVQOcp0zWNpB8nz3TTMQPZT2I,2965
trl/chat_templates/qwen2_5_vl.jinja,sha256=oLxvb8eimoABekM-jwOhzBI26DipRKLQNClaYMTy_ds,1017
trl/chat_templates/qwen2_5_vl_training.jinja,sha256=MchZMqbYgm8P6NUrgXZ-umuGkSiwp8dQPR57qq1OgEM,3239
trl/chat_templates/qwen3.jinja,sha256=pV7hsWYBKLcJhyPgq82SyqB4gGEFHGLVHL6H2c8ZdNg,4168
trl/chat_templates/qwen3_5_nothink.jinja,sha256=Jz2ODmg7iFBx-xfgjXHl8qXd-1MJdWGBaB3k9aGCLYA,7755
trl/chat_templates/qwen3_5_nothink_training.jinja,sha256=I5TcjFgzSZuareC1E9-NFkxp7G4YX6hNG1fUAFNCrYw,8388
trl/chat_templates/qwen3_5_think.jinja,sha256=pK7or88uBxGULPhIiZvmYBb40UqIn_nt4HvKCZwo9xU,7756
trl/chat_templates/qwen3_5_think_training.jinja,sha256=Ivr0Ia-gfatdQkd4ZKV0SffN-05GL_Just7AKRHrCaA,8385
trl/chat_templates/qwen3_6.jinja,sha256=6E8yoj_donaJ-GiqShpWIfQRM-UaSNfz78vqKDlXQlk,7764
trl/chat_templates/qwen3_6_training.jinja,sha256=DTUq7QnpspLvG0LrvTeyOAi4ZCSuNwrbgVNHgHl9b_k,8307
trl/chat_templates/qwen3_instruct_2507.jinja,sha256=ZPhbGYBl0PuiqB834Q7WgWHOLBmnVMcQDmfgyi7pwyY,2630
trl/chat_templates/qwen3_instruct_2507_training.jinja,sha256=SOF6o8r1vyAHW25zZoZO6UPgC28HUqrf6LZwwqsCkaU,3165
trl/chat_templates/qwen3_training.jinja,sha256=TG4c3MsZHOE6evZNrNv4bCLfnVRW9_FOrJy4My5BvjI,4577
trl/chat_templates/qwen3_vl.jinja,sha256=NjbQ8L1r7wJlTN_9xEe3nLLO-KsCzHUmc0WUYpGkieQ,5292
trl/chat_templates/qwen3_vl_training.jinja,sha256=Zr2BmGv3-Kvm1_tKUDQcjYrhSxZjfo-4dryn5-8LnG8,5741
trl/cli/__init__.py,sha256=B8PH6sNvyPB70xWMkMH8tFDDPN0gtvFf58IRpER_3mc,656
trl/cli/accelerate_config.py,sha256=UP1H5tldCUyK5gMmXg_hBhAF3XaWsyZqt8hVHmozneU,2008
trl/cli/accelerate_launcher.py,sha256=U0YogVSKf7zcYMQ_gEyA2DRkSbRxmPhx7G1CYsVXmLc,1897
trl/cli/main.py,sha256=AtvE_bH_ByC7lLZlzZu44-gCnF1bfIm8je7Ad3hiCrM,1660
trl/cli/commands/__init__.py,sha256=g01-bLAZyTna7_GM1qfhOSDKq58XJSlaaBnbiHEV76Q,1209
trl/cli/commands/base.py,sha256=DDKAl_-ezJRx9vwHr5WTDRNNQeDW8i23Suea8HDOTBo,1855
trl/cli/commands/env.py,sha256=LuM17gUHBFiSGzGzsx0pyCDFSszzhJFoDXeh3FJmaJc,1146
trl/cli/commands/skills.py,sha256=amCdxknbhyeYXKhBYahW0_ws_dkFq6gOQJr4-rciPjc,1621
trl/cli/commands/training.py,sha256=Q8QmzYvIvzwdN0NB5raUguJ-WZhUNw5z6CJyWrLHr9M,2753
trl/cli/commands/vllm_serve.py,sha256=ao6er6CntRdLd6m9bn9WByDz6Pq44xRi26Ndc4X-rhA,1429
trl/experimental/__init__.py,sha256=FMF_-llsmlfdSVPb8RfoW4z6zX0Co7J2jub6IW2bKyE,1310
trl/experimental/merge_model_callback.py,sha256=UG2Yr0VJsYCkrDGmWjwssAvTNwMgJTadpeExsIpdQmg,13850
trl/experimental/utils.py,sha256=9AAxjVniBf1dbyZRUTnGCLFc9mKH0sbknPrFl1JrYF4,36499
trl/experimental/a2po/__init__.py,sha256=iRKDdeda5JbO2iUF0UHXaqXwujtrc9B54C3qh_tAI1Q,686
trl/experimental/a2po/a2po_config.py,sha256=_BsgQyGDyp5JgHGu2Vs7UURMBUTiwPYb7mcwdUDHpcg,6402
trl/experimental/a2po/a2po_trainer.py,sha256=lBuTCeM9Iu4NnELI3biNhq9EnzEa08qf0vHDlHRYapQ,18568
trl/experimental/async_grpo/__init__.py,sha256=djISk67rE2GC5S6-3Qm4NJ7f4JfGlmmvYwmcNYE_EFw,708
trl/experimental/async_grpo/async_grpo_config.py,sha256=HqpgngDo4NzuybJkZlG3Q9XeeHluBBGeVApHYP-hJTM,10377
trl/experimental/async_grpo/async_grpo_trainer.py,sha256=kf1wN1QXMZFGUPELCSkNwP5ZdxMPAKSJq7ZOMIScZG0,35584
trl/experimental/async_grpo/async_rollout_worker.py,sha256=TOXNg5zls6eNjnjgzgxiQYywdxtL9xv1NeEe0N1kgaw,35843
trl/experimental/async_grpo/weight_transfer.py,sha256=bIGtA62jlpAYmlPeH98YHG1qbfqzYT4mUL2QBFFOHLk,5808
trl/experimental/bco/__init__.py,sha256=X9vUxV2PcrTORo0CEALpq8EoHXtNTavAh0s-GVBDYio,682
trl/experimental/bco/bco_config.py,sha256=vEdarjRViRa_v4z2IQoms8NSwZLoIOEoyICGUqXvr_U,7270
trl/experimental/bco/bco_trainer.py,sha256=X4MQDNSGCNCHLE56J4mzMMcwdmLxUAkmut3t0GLrmjA,71747
trl/experimental/bema_for_ref_model/__init__.py,sha256=YSMOnS353SIRvV4_NS-Y-t0sbD6snBcbELbG3ku2Nfg,683
trl/experimental/bema_for_ref_model/callback.py,sha256=RYC7doi9utJa98wKMT0NP8pmY0rITQGISfwZjlQm_Vw,9641
trl/experimental/bema_for_ref_model/dpo_trainer.py,sha256=4YrnaxULpR6TSpjWLvOGoLBziWQNGgWhNqOjuZT1mHg,1181
trl/experimental/cpo/__init__.py,sha256=rO0s9KRAaIsLOMJo2sweX51LkAK4QsLOeDDGIonMFLw,722
trl/experimental/cpo/cpo_config.py,sha256=xcd4qAYEviqx_kQE99b_pXR3icNz1RfsWiNNAYsZCxo,8289
trl/experimental/cpo/cpo_trainer.py,sha256=JljuPv9qwMIyzYQoWUtqt1auUsccXeUT8UC7waVD-uw,49536
trl/experimental/distillation/__init__.py,sha256=Grw7RW6Hnb-Fgk660HuK_69ED5HC6y4nlB2M_SU9dF4,776
trl/experimental/distillation/distillation.py,sha256=7jx1DYUBqVIV8V7INbIgBuRqlXYLgzuDDdVJy1fL4ho,6066
trl/experimental/distillation/distillation_config.py,sha256=OxuiDW0lZaxyu8zxqvd6WedUUY-wAym7bVw0QzWlybs,22984
trl/experimental/distillation/distillation_trainer.py,sha256=IJWoHgnG1SzrajGoi0eF4yE1tTDsXyTMymwtuQiAfzg,82219
trl/experimental/dppo/__init__.py,sha256=4vJFyjElYyJyxwOM8_ZWp_h43F5haFGUtAWQYNQhqww,687
trl/experimental/dppo/dppo_config.py,sha256=yujJCnXBk7r-qP4pKdg3uaFtA8hVOlZSgYyrL_tUDT4,5093
trl/experimental/dppo/dppo_trainer.py,sha256=pv2lwmUU_P77K7Scr-Qz4_Xdw9EUyWTgHCLN6EpjjMo,74778
trl/experimental/gfpo/__init__.py,sha256=uP2ol8mB0vbkaDcIXCAAwN_HzW7ulo0c4HGqqlevafY,686
trl/experimental/gfpo/gfpo_config.py,sha256=Zz4vFZ9vAy9kD47EN3RgoSJZtW7_8JnGn35sgHmZzNw,1325
trl/experimental/gfpo/gfpo_trainer.py,sha256=2xgOHFbVyMB9sko0Z56fShD7-oMl8VZlaaXs625w9x4,24509
trl/experimental/gkd/__init__.py,sha256=QO5Yki2ia5hOep3fpQArdI3KMnpQkIV1FE0WiznkZrU,722
trl/experimental/gkd/gkd_config.py,sha256=gFiQXj4H7kAt89IoueUs9ZAOP9kXx3AX6aAJyyKeEtE,4853
trl/experimental/gkd/gkd_trainer.py,sha256=JAGIHWqLnkVBxGByT9uo0Eyxpg_2KCjfHz6f4LDPVDE,21870
trl/experimental/gold/__init__.py,sha256=FnYqi1_ahqtra-Zj2iECHAfr7AHBXQxYWrDNhK-a3Vc,728
trl/experimental/gold/gold.py,sha256=S0WPSyW4oP9TWAUzwJs57_M3MGrR4P17PDF105Awsb4,5408
trl/experimental/gold/gold_config.py,sha256=-PscJGiOuuVq3zk56Vu2jSfZHQJBE8XiviGylqXXYd4,27318
trl/experimental/gold/gold_trainer.py,sha256=7lZA6nQZmi1ia-1P0QLTwjgSj57aPVQwkiLhIdLr9u0,95912
trl/experimental/grpo_with_replay_buffer/__init__.py,sha256=KPrhB5rG42642HmeBRcnefGPLBICYAdd613MaDGFTys,770
trl/experimental/grpo_with_replay_buffer/grpo_with_replay_buffer_config.py,sha256=UW6s4umTNDvsDQ-2lHMOAovD5Ro1gGlBohJNnuEan0U,1372
trl/experimental/grpo_with_replay_buffer/grpo_with_replay_buffer_trainer.py,sha256=37xphuzu4Piwu74fVq1VC_-f36G2jwhSxaRha_ZyKVc,39638
trl/experimental/gspo_token/__init__.py,sha256=ymJxlrn9cMOyLPGHBq_7VKfvGrhbXYl1ZPi8OyGjSbE,650
trl/experimental/gspo_token/grpo_trainer.py,sha256=kOIfJq-9gj9wp7FQuhJGAqK_ctEU7rbfed0PO9D4c6E,8262
trl/experimental/kto/__init__.py,sha256=K-M_Blc_9na1bQDKla6jKJKb7fPKxSUmiJyRHNFuSu8,722
trl/experimental/kto/kto_config.py,sha256=zko2xcXhwhGpcphLTfpJMDXhiy02BcuKlz9LgCMPO3E,8531
trl/experimental/kto/kto_trainer.py,sha256=SCCi2_-g3MbM-yQ4xSd1oEgGO6Xawr9Xu1D_UqVpRtg,72510
trl/experimental/minillm/__init__.py,sha256=xJRoMqech-1OcFwcP3Ut-wV7DlYm6z6SXb455kHOlpA,746
trl/experimental/minillm/minillm_config.py,sha256=c6JAoVSBZaIV3zsRz5nqInyIs_ZIC8MP4v_KIzEW0xU,6619
trl/experimental/minillm/minillm_trainer.py,sha256=RWREg5ev_vrEJ6jkbdtHeNR0oEbVRIEIFtVeWOoW5-U,20117
trl/experimental/nash_md/__init__.py,sha256=0-fTu0AiobRY3KTKO6l-HMW_Me66vuaF-l7ym62oRXA,742
trl/experimental/nash_md/nash_md_config.py,sha256=6GlI-rW4umHCMU2ykEwLztRGvd8hpHJlznEu7KzAsH4,1872
trl/experimental/nash_md/nash_md_trainer.py,sha256=BBOsZ8wnzD7Qzx36-S7VX3X9Fzr0kavIzfXys-mJR9E,22350
trl/experimental/online_dpo/__init__.py,sha256=d0PLdODeA1bPSoXLlGWEAeA6XwGiHCd1isltzRGAVOQ,760
trl/experimental/online_dpo/online_dpo_config.py,sha256=-67eDtJMO5idz7hPutYLzQO5rEfQOoTYTX0FB1YhT5A,19985
trl/experimental/online_dpo/online_dpo_trainer.py,sha256=2UzEQfsQoZI-sx1XIr-AZZ4zzNfiZe0CGKB6ctIX6IY,69485
trl/experimental/openenv/__init__.py,sha256=LlzcnV_wiUFOTBh64phVNDb6dpKr8A93i_K-ZntlysE,705
trl/experimental/openenv/utils.py,sha256=vF39Bk0y6ArPZioTDgtgGGrHqx4nypcl3Ti1KWQaWfs,8056
trl/experimental/openreward/__init__.py,sha256=Cn8PmmYmWF6RqhXioKxH9mG_PszFdvYD7AdGmyMDnSg,677
trl/experimental/openreward/_spec.py,sha256=QUeG7zy8R3b9gl5UKKXmQwTJJeWJka6lKWkx0Uo_rXU,15544
trl/experimental/openreward/environment.py,sha256=AW25hEl1qvRGQUgipBXHHIiFPv1DyRADadB733WOtLM,16330
trl/experimental/orpo/__init__.py,sha256=raFCz1dhCGKRjdQREuxEWY_MwXpIA1GvpZXxsqzv1EU,728
trl/experimental/orpo/orpo_config.py,sha256=JZ2emthcMah8pisNENCWvqpztF95ltEh3SQUN5iGsoE,5753
trl/experimental/orpo/orpo_trainer.py,sha256=dG2w2_yMfyxWfESgcZpmoLnq5erEqs45WflcxVMmrlk,48480
trl/experimental/papo/__init__.py,sha256=qP04taTkxweuEvOll1BfSFU5BlaZyv7OIT-i95PE8CU,687
trl/experimental/papo/papo_config.py,sha256=YN5qFmankCNVYDgEEQ0TRQDo29FqumZGRxfjtIkZb1g,3141
trl/experimental/papo/papo_trainer.py,sha256=mDb0UF9wJskM1cpblxUd0UwbwnvNK8Wo_KZibGgnkXU,15685
trl/experimental/ppo/__init__.py,sha256=7jMTBOcEiFGAs6rYdH61xzg1RWTGfBC_r2YFd3DBtR4,990
trl/experimental/ppo/modeling_value_head.py,sha256=k0r4CXCzUec2hzxv0Eljcor_ePk_73A8hFXl9NsPpOg,45071
trl/experimental/ppo/ppo_config.py,sha256=Bp0aD4DnnP5igczFuUuSs4YPo5ZQ4vATEG_oD0dB32s,12577
trl/experimental/ppo/ppo_trainer.py,sha256=9WP35KciLaDwLxCUMPi25e3FYItQbDs7MTJP2w1wrDU,49814
trl/experimental/prm/__init__.py,sha256=D5e_7PoXs3nTMVQaN1rAGvIUra6cQDfOyFViUbZrNR4,722
trl/experimental/prm/prm_config.py,sha256=HrNL3emLcboZjEgcHhQX9pvQV3_o4P-QTopTeNG9r0c,3802
trl/experimental/prm/prm_trainer.py,sha256=Hj5TsgMFM-vPACP2Tjrvwi3-CV5g-MY2ID-6zXsGrd0,16922
trl/experimental/sdft/__init__.py,sha256=pI92-nBzVF4g_g_CWNPrUmNPLwhscz-zw8CIji54YI0,728
trl/experimental/sdft/loss_utils.py,sha256=UwtXHAABu_hbsMeHJdMmRaTXFVZg4i5BWA-rXJ9wQeQ,6049
trl/experimental/sdft/sdft.py,sha256=jP5TwxCu2erKsPZJFe88PPwKJuJzgvKDfx8OH2e9Oxk,15744
trl/experimental/sdft/sdft_config.py,sha256=UXimRtNuiICJXKpRfZNyARZY0L8M8uz-7-6J0t34gmM,26125
trl/experimental/sdft/sdft_trainer.py,sha256=LEqD5l_3Zd30DClJfAfoi3gkdcLbSvr-o86BzCCE43k,63813
trl/experimental/sdft/teacher_sync.py,sha256=6yIsiPzJLNZBX9Siry9L5gBGOxTM6Sh9_IVitasxtlQ,6647
trl/experimental/sdpo/__init__.py,sha256=66WDtge8cD3Jpp-yTaPgzvDZfF8h-Svju4cc9FSbb_Q,728
trl/experimental/sdpo/loss_utils.py,sha256=UwtXHAABu_hbsMeHJdMmRaTXFVZg4i5BWA-rXJ9wQeQ,6049
trl/experimental/sdpo/sdpo.py,sha256=3G6N2-H2lCI8e0ZD_CXUJaDQKeABGDodsxePzdQ2tq8,14939
trl/experimental/sdpo/sdpo_config.py,sha256=oezEQO6doMbcQZFnEMxruG5A7dAriBBCFueS0Y--hFg,38534
trl/experimental/sdpo/sdpo_trainer.py,sha256=bE-QalLhBQdfbG5d9btnCCYWmSIXfoIn_7wAslqiwYo,87469
trl/experimental/sdpo/teacher_sync.py,sha256=6yIsiPzJLNZBX9Siry9L5gBGOxTM6Sh9_IVitasxtlQ,6647
trl/experimental/ssd/__init__.py,sha256=kZ8pR1q1JG6pwbQmHMbsthOm5bD6Tqtvh4AOWaviS24,722
trl/experimental/ssd/ssd.py,sha256=jHO2m6PWVti5UIybf3tw6751EONXMAZZlxRuwfK2lLE,5658
trl/experimental/ssd/ssd_config.py,sha256=1ymLXjVdBtLg30rOA9NCNAa-f0g6Y2feef6rvVEsM38,11701
trl/experimental/ssd/ssd_eval.py,sha256=uZoN-Pwad17SukjnEDipUOiY78-9MH2rPlk5E49US00,10299
trl/experimental/ssd/ssd_trainer.py,sha256=Ag-kTygJx73Gk0XED9kikcy_HhAOV8R13iI5qQreA5M,23894
trl/experimental/tpo/__init__.py,sha256=fDIWPC3c1BL3VngtbKbnaB-UNRNY4tewOYrr_7yXWG4,722
trl/experimental/tpo/tpo.py,sha256=i_HeccB9rDPoLMCrC36euuDOiikPvLQervsbm6q7nzw,8510
trl/experimental/tpo/tpo_config.py,sha256=DW2ErV2F0TELILwS4XPHdOlqNs15ldEXlLCoU0OfKSY,7395
trl/experimental/tpo/tpo_trainer.py,sha256=Xm1xCBPOu0u6fcSE_15ljqncl5BH1J5vkqgIzWiQriQ,41765
trl/experimental/xpo/__init__.py,sha256=QcEIbvNKqd-1mR_mHH8gmtE5UGhZGBFG_9bMYLBhuvI,722
trl/experimental/xpo/xpo_config.py,sha256=hWuv1yNMEM-KBFJFv9x_8xu-NhsU8oblvqQLLLF68-Q,1691
trl/experimental/xpo/xpo_trainer.py,sha256=lLE6DuopGKjzfctt8s6x4RloryleXeGiuu03F-itvPU,22722
trl/extras/__init__.py,sha256=V1wvJ_Ee6Ro58SbMXQqO7FG-_jvCpy6kB31_7Wtl68A,611
trl/extras/dataset_formatting.py,sha256=D_8NqUiZ3aSF6bl3qnopEOY8suwH3YEhJ_W4gljSXA0,1285
trl/extras/profiling.py,sha256=kdmjghftaN1onlnUr-QIzJPT71a0BTnufQm4R_J3ZtQ,7368
trl/generation/__init__.py,sha256=aAYDsVEN0dDYZMZaeZvBhAohos1fQX_asTGHJrjmFUE,828
trl/generation/vllm_client.py,sha256=_SqrSgfWaVfUiHJ7s7ezGntpM11REhIhsC-kzfEBaCk,35299
trl/generation/vllm_generation.py,sha256=0NImYIV6QSCliDDNNooyke8lNjiT33DyToFWKxjeTJA,36015
trl/models/__init__.py,sha256=AdtqJlv3mNNGldTZRmm1-0Ymm0yMrpwnXN0ilv0gdY0,1219
trl/models/activation_offloading.py,sha256=EDVanxKUClYZT0KOiDDa6xvaoCTtvUQR9Wxh624LBW0,37697
trl/models/utils.py,sha256=O8tGPi_sU2vIZR_TJd9DEjv5DcAihYb70Ui-zOraqyE,17939
trl/rewards/__init__.py,sha256=IrGRuDNDLkWTJxsemd_WQtWcl8pD3XuB5WkrxL2FOHY,1216
trl/rewards/accuracy_rewards.py,sha256=xiwFFssbOKUnku_yEh44ljrQ9XsPBMi92LMDlqvxVIo,10939
trl/rewards/format_rewards.py,sha256=XKId9E_3opkCtiELkYSWKxb8QnYJv2EGLuT9QOcmbS0,2211
trl/rewards/other_rewards.py,sha256=PoXW_0NrApx8VWHZagHeGHXcnx8X-JUCaMkqP3BINTY,3199
trl/scripts/__init__.py,sha256=uBELpz2YbIG2YxXa5ioNhrWE0nqoior8hkFGP3ZzYe0,1077
trl/scripts/_hf_argparser.py,sha256=RygJLSzKIm9-R_2LUo2rpsWHxarnO29o1Syg-kU11Z0,21107
trl/scripts/dpo.py,sha256=rdzB0uXOcw-3ytn6wRbXByEeGR74_oHoUweJtKMoaYg,5192
trl/scripts/env.py,sha256=NwKqs_IQK3tpW0xbBZU6qEx_68-T_SqAv_-BElbkroY,3285
trl/scripts/grpo.py,sha256=ztnT1n9DUqfVK8p8vWD1YDAc780K3aDDljwQNTgIGqs,7194
trl/scripts/kto.py,sha256=O5rFvS4Xpu7ozDy62oPf07x_FfAqsgN13Jey9sn-bWA,5160
trl/scripts/reward.py,sha256=C2N3Ni306KTuDMNyBvHBqr27MO1EMaoBz2Mk3ONALXw,4051
trl/scripts/rloo.py,sha256=BDgVC9nELZBdlJjbYNXwB21ibUrpOUPMMI7eGSr3fdM,7194
trl/scripts/sft.py,sha256=TQN8mo5IsiaHk9luwJpNdrUp4cHcrIUWOnoYP83sCAs,4896
trl/scripts/utils.py,sha256=LMFn84Y8ZYx3G7kc3Y9l60JO0dd7jYz8p8nC08YSrcg,18260
trl/scripts/vllm_serve.py,sha256=5gYACkVgXF5KzsVysK4KaYXHpHKIAU0cyqeDDtWSAh4,59744
trl/skills/__init__.py,sha256=ztKZxcsQqk9gvPe4pV87ZUIPgPW3LwBNXW2-Z9vGwNQ,740
trl/skills/cli.py,sha256=qVMHN-wOJEfumxEUMH7aBhTR1ejOV3E3XW4r-7Bqg9U,6875
trl/skills/skills.py,sha256=sSue1fufWyApyTHipKacmi1VR81X9VX57aR5kCTDcC8,11708
trl/skills/trl-training/SKILL.md,sha256=z97EE_zwMPKSBQQsuMVqDFQE9jeRmDlwTX2l0EyxlY8,8871
trl/templates/completions_dataset_card.md,sha256=48c5hNBP1BtG01GYcHWHtyFsMxL9O63OXKHpTyk2xOw,1233
trl/templates/lm_model_card.md,sha256=GUAzW9rFpN6Fn47_8wrFHtEarz3ZZTlQtT1gvkIJg74,2351
trl/templates/rm_model_card.md,sha256=pevYy0_B9OThscj5WcDXk_0Fopulfa3IGeHSAr8NwLM,2143
trl/trainer/__init__.py,sha256=r6ucMHWPi6MFNO5HnsRAktwuiuDNKi4e7wHLM7RBpjg,2641
trl/trainer/base_config.py,sha256=wD4Fur8JA0h6OwmstTTVDJKdAbI6gCekZOoU9KVznS4,5759
trl/trainer/base_trainer.py,sha256=KNS3GojNuafsyeFguRFu1h_2tWKPU5bcZp52oGxgp5E,6757
trl/trainer/callbacks.py,sha256=V3r1PHsSknFdK0jgb94nAwIPSz98T_3aorIvtSr2Zbs,31337
trl/trainer/dpo_config.py,sha256=QYnS0ed3go3D1VqaKDMmf_dNfT54txRb-eRzfK0cX0Q,18192
trl/trainer/dpo_trainer.py,sha256=dQ6pPRpFhb-3wVEnUwl3qOxLFG0bL4rvm8vANYyuua8,86705
trl/trainer/grpo_config.py,sha256=WuQO1uUWp9MjHbdzGLtsKyZ8J-ptVKmmYCyfV3KGGWU,60367
trl/trainer/grpo_trainer.py,sha256=VlUwv3pUPaQqTuT3fDKAKniEKXl9Vkila1AII59rtyE,154954
trl/trainer/kto_config.py,sha256=g9ZzUlnwRyvSKcfA3pNI-ep3u4b2kTAK3E3Jkv4XurU,1429
trl/trainer/kto_trainer.py,sha256=xlFQtdF_Hx-bL9g2JJ2LTmsT-NSarjpfKt9fVKBvvuY,1458
trl/trainer/model_config.py,sha256=522k6Fnr4p1salbtguFX9Y37GBfjM0RcXZO5Fj6-2n8,8905
trl/trainer/reward_config.py,sha256=TmiX7vD1dPW0Deosi9-H1uHAO-_XamJUAGV4_NiAPJI,7823
trl/trainer/reward_trainer.py,sha256=EboaLAykQFBXA2iYY6YPUlsj-05YYDjgMCLhWlKRILE,36035
trl/trainer/rloo_config.py,sha256=Ok34RSevZyHFM_B0d8NGP3Sz35bD0oBdmzAI9hRhimE,32809
trl/trainer/rloo_trainer.py,sha256=JnuS1xNnNbYCvWj_MeRBtCIsQp-nSNOiR-TvkZXGFZY,86179
trl/trainer/sft_config.py,sha256=nwSZpp901jyzL_tGnHH-T3L-62e44yjXuhuEZop9Dck,17475
trl/trainer/sft_trainer.py,sha256=4eZpuI_XzZL2o9i0JLH1YH_8i1Vr9hVViuZ_MACdPno,97097
trl/trainer/utils.py,sha256=jIeRjj4o0o6DQxP1uUlh6O9vDpuetW6KCuoeen6i_XI,56962
trl-1.6.0.dist-info/licenses/LICENSE,sha256=G_YUsf3ED700SqWNANF9X9DSUuozOgW-AYo4lZyLKZg,11355
trl-1.6.0.dist-info/METADATA,sha256=0diyOvVmQ96iRBd_3hlvA8UqBa6e00cfXv8KKiqxS24,11481
trl-1.6.0.dist-info/WHEEL,sha256=aeYiig01lYGDzBgS8HxWXOg3uV61G9ijOsup-k9o1sk,91
trl-1.6.0.dist-info/entry_points.txt,sha256=EiubuQrZSGOohRB4xVoiVAyWsPsOHPSVpbzSk8YB0x0,37
trl-1.6.0.dist-info/top_level.txt,sha256=QU12VhjlpAtMnIJqiO2np3RkTB_Eozt1d-g8QDf5P4c,4
trl-1.6.0.dist-info/RECORD,,
