|
../../../bin/trl,sha256=A6jHbvcoJh1GIN9JszH1OgYJXr5xUCLNvwjVz2mnhHA,228
|
|
trl-0.17.0.dist-info/INSTALLER,sha256=zuuue4knoyJ-UwPPXg8fezS7VCrXJQrAP7zeNuwvFQg,4
|
|
trl-0.17.0.dist-info/METADATA,sha256=caaBuDcjJQGnHPWU8C8unNSldzgwQtdmd-RdP3E83XY,12215
|
|
trl-0.17.0.dist-info/RECORD,,
|
|
trl-0.17.0.dist-info/REQUESTED,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
trl-0.17.0.dist-info/WHEEL,sha256=SmOxYU7pzNKBqASvQJ7DjX3XGUF92lrGhMb3R6_iiqI,91
|
|
trl-0.17.0.dist-info/entry_points.txt,sha256=EiubuQrZSGOohRB4xVoiVAyWsPsOHPSVpbzSk8YB0x0,37
|
|
trl-0.17.0.dist-info/licenses/LICENSE,sha256=HZDsv3u4D_J-9nt3hfYhSAtlK4LkbHLYpXMLDbZb81U,11355
|
|
trl-0.17.0.dist-info/top_level.txt,sha256=QU12VhjlpAtMnIJqiO2np3RkTB_Eozt1d-g8QDf5P4c,4
|
|
trl/__init__.py,sha256=E8gfZkCbE34CMIljkyshgWe-RbUF_9SVB2kqn8C_Rkk,6135
|
|
trl/__pycache__/__init__.cpython-311.pyc,,
|
|
trl/__pycache__/cli.cpython-311.pyc,,
|
|
trl/__pycache__/core.cpython-311.pyc,,
|
|
trl/__pycache__/data_utils.cpython-311.pyc,,
|
|
trl/__pycache__/import_utils.cpython-311.pyc,,
|
|
trl/__pycache__/mergekit_utils.cpython-311.pyc,,
|
|
trl/cli.py,sha256=9EnWsBdoHL_8ZBEUc3iY3NaD3AaXK4ei-67SU9eHYT4,4692
|
|
trl/core.py,sha256=vHZbFc_VxuLicw8fYiLRrvJbKlqy60YuJ1_ffMeOf1I,5978
|
|
trl/data_utils.py,sha256=8PXZmtyRDEAjfstLdwEcNh3O1_OwTPnZD1MylObe2mI,26165
|
|
trl/environment/__init__.py,sha256=JANVP5oKaZE9xPXVm-ikSEr4-11zIjiLY7M6K_VjjR4,989
|
|
trl/environment/__pycache__/__init__.cpython-311.pyc,,
|
|
trl/environment/__pycache__/base_environment.cpython-311.pyc,,
|
|
trl/environment/base_environment.py,sha256=nQ7lwncNKUrIRIfKqMwqME7nPVQAVrm9EuYsCtd8v3Q,17860
|
|
trl/extras/__init__.py,sha256=5CIPkzvP9D6vpnWLNZz23RNU98MfjeBsxBFMHXKM09U,961
|
|
trl/extras/__pycache__/__init__.cpython-311.pyc,,
|
|
trl/extras/__pycache__/best_of_n_sampler.cpython-311.pyc,,
|
|
trl/extras/__pycache__/dataset_formatting.cpython-311.pyc,,
|
|
trl/extras/__pycache__/profiling.cpython-311.pyc,,
|
|
trl/extras/__pycache__/vllm_client.cpython-311.pyc,,
|
|
trl/extras/best_of_n_sampler.py,sha256=YFuEKXT1NuHardyjAXn1CHnqpazT-Y3d7hBMCM5tYk4,5770
|
|
trl/extras/dataset_formatting.py,sha256=J4FKqOCjEKjX5a4ExbzX9r3hLEUjdtXQv0PxgAcM15A,4468
|
|
trl/extras/profiling.py,sha256=uPgksx-5YhNXPYX7kex5_p0t9PcHTHNarioyPrwTzmw,2878
|
|
trl/extras/vllm_client.py,sha256=0iAFIo4e0nlBn3mJuIxAWTpSb1PgWAmJCpO50rK_cGU,12468
|
|
trl/import_utils.py,sha256=T_vVgE2dHeX26jLcy9nQonM6VFK_yghR4gKFYd2AqtQ,5515
|
|
trl/mergekit_utils.py,sha256=RkaYt1cZYEIu50Y13K9_N4ozKbJIH4JRYSOsdxEDEZY,11109
|
|
trl/models/__init__.py,sha256=teQNcPJwQr6AueSI5E8luecLNcoq13aF6R3gbzvLjQ8,2407
|
|
trl/models/__pycache__/__init__.cpython-311.pyc,,
|
|
trl/models/__pycache__/auxiliary_modules.cpython-311.pyc,,
|
|
trl/models/__pycache__/modeling_base.cpython-311.pyc,,
|
|
trl/models/__pycache__/modeling_sd_base.cpython-311.pyc,,
|
|
trl/models/__pycache__/modeling_value_head.cpython-311.pyc,,
|
|
trl/models/__pycache__/sd_utils.cpython-311.pyc,,
|
|
trl/models/__pycache__/utils.cpython-311.pyc,,
|
|
trl/models/auxiliary_modules.py,sha256=akE5FsiGCR63aIYRTGRyjgocNnUPzYNfcSD3u3vktiE,3344
|
|
trl/models/modeling_base.py,sha256=ParLEmLYi4uVmR-n26XGD3bFqwlDWqgreTHI3UaSYA8,30835
|
|
trl/models/modeling_sd_base.py,sha256=aqKyfNGtr72kn5MU0_JIibAyzsL8kWtQvZu7gCYedQ0,42252
|
|
trl/models/modeling_value_head.py,sha256=wkrq82sK2pOayIef7EMYxD9xyQM3ZR5_q-qD3AZBsTU,18859
|
|
trl/models/sd_utils.py,sha256=scJfKtQWKSXCCuMBHMPe8XaRrGgJgVSTI-2zEB4Tq5k,5879
|
|
trl/models/utils.py,sha256=Y0nlO8AUUXPdkG-7mzCb2_UkPytpRaEDd5gT_iFAXt4,11898
|
|
trl/scripts/__init__.py,sha256=V7eYI1BLoXW4VVJP7Qe0avdLaRK-kVaiXEG4QVlP9xc,1003
|
|
trl/scripts/__pycache__/__init__.cpython-311.pyc,,
|
|
trl/scripts/__pycache__/chat.cpython-311.pyc,,
|
|
trl/scripts/__pycache__/dpo.cpython-311.pyc,,
|
|
trl/scripts/__pycache__/env.cpython-311.pyc,,
|
|
trl/scripts/__pycache__/grpo.cpython-311.pyc,,
|
|
trl/scripts/__pycache__/kto.cpython-311.pyc,,
|
|
trl/scripts/__pycache__/sft.cpython-311.pyc,,
|
|
trl/scripts/__pycache__/utils.cpython-311.pyc,,
|
|
trl/scripts/__pycache__/vllm_serve.cpython-311.pyc,,
|
|
trl/scripts/chat.py,sha256=ypVG23dr252Qnh1xC5-r8zbnrLmonZEKZ8G0cHlYBbI,20780
|
|
trl/scripts/dpo.py,sha256=AA-TLLjwQFFtGXWe2M_U8paGhwkCvNq2x11w25g4rqo,5057
|
|
trl/scripts/env.py,sha256=VJoiibpMNWX-VCje8DdOoobmU8muNYFRc7LZxgUY6as,3382
|
|
trl/scripts/grpo.py,sha256=PHhI6zVE9Eu2yvFLiz2TxU3aCde3txbF7DecFgJqCAI,3521
|
|
trl/scripts/kto.py,sha256=rplxV9wf9iENgNbhaN6CchG7G1ff4XyKQ7EMED7fAVI,4121
|
|
trl/scripts/sft.py,sha256=kKSCGsQqP6v95okJEPowOXOSbdpJB1CYfnEYOk9U84s,4917
|
|
trl/scripts/utils.py,sha256=q5WyfmuWiCf9wEJdFMAc_iM7U7K2YofhPwlcVNQCakw,9820
|
|
trl/scripts/vllm_serve.py,sha256=5rTvZVnanKo3VN9HiNJ7_OaKdmuhLyunHmBQtefpuoI,24070
|
|
trl/templates/lm_model_card.md,sha256=zq0dXorqEOnjHJ8wxwhI3LS2R6qiHmlcgPcVzliwRmc,2158
|
|
trl/trainer/__init__.py,sha256=4z0-b1cMzU5-RJC-UI6pejv05AHfKRSs-xFwnkmNrWk,5505
|
|
trl/trainer/__pycache__/__init__.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/alignprop_config.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/alignprop_trainer.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/bco_config.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/bco_trainer.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/callbacks.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/cpo_config.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/cpo_trainer.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/ddpo_config.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/ddpo_trainer.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/dpo_config.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/dpo_trainer.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/gkd_config.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/gkd_trainer.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/grpo_config.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/grpo_trainer.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/iterative_sft_trainer.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/judges.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/kto_config.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/kto_trainer.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/model_config.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/nash_md_config.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/nash_md_trainer.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/online_dpo_config.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/online_dpo_trainer.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/orpo_config.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/orpo_trainer.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/ppo_config.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/ppo_trainer.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/prm_config.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/prm_trainer.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/reward_config.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/reward_trainer.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/rloo_config.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/rloo_trainer.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/sft_config.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/sft_trainer.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/utils.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/xpo_config.cpython-311.pyc,,
|
|
trl/trainer/__pycache__/xpo_trainer.cpython-311.pyc,,
|
|
trl/trainer/alignprop_config.py,sha256=jLsZIkPRpyKZspVsk7gcn0JS7Mg2mCrccl-slpwOpIU,10196
|
|
trl/trainer/alignprop_trainer.py,sha256=VvPOjrGr78qALUN4TWhomZ6A5-8a-9UDfRe7diiPhAs,18317
|
|
trl/trainer/bco_config.py,sha256=hesvT6e5C7gFSYJ7mvDS7N8mWV3qM4V3iKV-CSeOSHM,8646
|
|
trl/trainer/bco_trainer.py,sha256=Ro8IUu1mzpKrIP7HIOj5eLJgkJiOBjKuaV0-8Pv6sDY,72842
|
|
trl/trainer/callbacks.py,sha256=WRLjXm86Z4k3NRbfBwk-ojpEPO1mBFwnx-lB-xTFIKo,24426
|
|
trl/trainer/cpo_config.py,sha256=xYFxcg-Za6dpd6ezCV8Lp96GHQM8y7illZWxoKFW6GQ,8126
|
|
trl/trainer/cpo_trainer.py,sha256=bhexhJYmnR3lhy7ifgPsx_NGYU2CJVOXIGCb3e46D34,50973
|
|
trl/trainer/ddpo_config.py,sha256=1qL0nWhpEYFel7PUpaKXVWfc0PHvrYWiTcSiEc1rwdo,12241
|
|
trl/trainer/ddpo_trainer.py,sha256=Apl_M77TkPhrTIEeDL13W6Dn41CkzOcDmVjjpaGKK6U,28012
|
|
trl/trainer/dpo_config.py,sha256=59QDYQh3V7w5mkfuZNZMyQ_aWVVptf17f7OswNx2lQg,20096
|
|
trl/trainer/dpo_trainer.py,sha256=U8twOmESJfS_vn10TbF7Gz36QCLHlG_AWFLiq_KSxzc,80661
|
|
trl/trainer/gkd_config.py,sha256=eonWUOAR6bJOUvuN2UWKp2WozrcH0Dhq0bQXsAe3oZA,4598
|
|
trl/trainer/gkd_trainer.py,sha256=ewwfjORvhy71nVjcZGcpI89PnEUlUl-AS2cotKiZnIU,17551
|
|
trl/trainer/grpo_config.py,sha256=g9U2QDFpWNp1xLtzRR-VYvI1-IbAzDGjyCXeFywOF8w,25832
|
|
trl/trainer/grpo_trainer.py,sha256=QlFhpuT4LufMbU1q0_5-SV25cCidKEJ_RemTaKxemFo,71289
|
|
trl/trainer/iterative_sft_trainer.py,sha256=cwwsUJ-7kiDwBtPwl3W0x01-sIDbyZUg34I7hp6aZRQ,18849
|
|
trl/trainer/judges.py,sha256=bllv6GS7JKAbwiVe9YEuyj5varEA2mF9w5EZ4Y0cddU,19556
|
|
trl/trainer/kto_config.py,sha256=XLvcGK4vuwJ5I5h7h5YEtSZM8RJRvZmtGrZ4OCQfrAk,10255
|
|
trl/trainer/kto_trainer.py,sha256=tYM3S8ybsMbE4LGftUTRJiCXI8CDP1EZM9CBvKHrAMw,83534
|
|
trl/trainer/model_config.py,sha256=XMJkyXhifzXqd1k7-GXGorQqQPbRkrPTEAx2LAhnJBU,8660
|
|
trl/trainer/nash_md_config.py,sha256=T3004FbQP7A9mir_I-XvW9GkzoykRL4U_bMg52NLVFE,1844
|
|
trl/trainer/nash_md_trainer.py,sha256=4pDgRJ4X20cUrO8kIM_yIOlGJxW3g2u0KOXW4DKY0bo,22592
|
|
trl/trainer/online_dpo_config.py,sha256=4-s_UsdvwKm0t1RdckZbqcsSDm16dtc5eofZsd_AV-M,8164
|
|
trl/trainer/online_dpo_trainer.py,sha256=m36YngdUi1VR4FOqPsLPxIzeSG8D22EgfT9ymuBXJLI,40128
|
|
trl/trainer/orpo_config.py,sha256=XuHY2EEeoqha2sddDgN_fpXLoRHQNBKi8uQLNguVGrE,6699
|
|
trl/trainer/orpo_trainer.py,sha256=YJ1oHpLFRgnEsxZK7_ODj0XvXreE3ruRZyjVJaCgoaA,52346
|
|
trl/trainer/ppo_config.py,sha256=5j6-qFy-TE4oZcLLeLioXv1tMtZIE18Tn6UqcKAiT_s,5759
|
|
trl/trainer/ppo_trainer.py,sha256=bLgtDmwwQKPJ7j0eAyc4SDnEvVoAifqBhMl2g8BEXXg,39586
|
|
trl/trainer/prm_config.py,sha256=JNILLJpgaUi0SWWzOx4bjRBUgsY8BZpfvfg2Jp8zJRM,3693
|
|
trl/trainer/prm_trainer.py,sha256=QLAFS9kcjh8pN0XgrAhwGyyBSc5jOLFYfSIW8jH053c,16181
|
|
trl/trainer/reward_config.py,sha256=Y8lRaXGVoo6Nbz9-sXEgw2f-nQseA8iK4W4nnwlobFg,3295
|
|
trl/trainer/reward_trainer.py,sha256=6xwuRm2xwSLfKHUCPA1noPetz95kzasl_adO8VWDctk,18750
|
|
trl/trainer/rloo_config.py,sha256=JWu_ydCFIK9DWzWxXhCdEjLbkT3TIQcjBYHJl08WZ9I,4511
|
|
trl/trainer/rloo_trainer.py,sha256=4PpHlCIw7WVVfVF8MlCe7s9nWr7OXIip4wtcDTwy-f0,34006
|
|
trl/trainer/sft_config.py,sha256=3oJrU0R_Us7mzjO9Y3tT5Q5OCkep94jf4YBj3IhmROQ,11248
|
|
trl/trainer/sft_trainer.py,sha256=8C6txI9gWUc7HKPbvIMtzaslGaQycIOQxxqUA9C2WEw,38258
|
|
trl/trainer/utils.py,sha256=4mTdnfX1UO0p45pBKwe7vBWAFCcIPejd4p4uwfWDAaM,75088
|
|
trl/trainer/xpo_config.py,sha256=nPzvCvvJpEWVBNnq-vv5CPpyTVZkQ47ZucVh_87fOPE,1667
|
|
trl/trainer/xpo_trainer.py,sha256=W0oY0nXVO2d9VBdn6LxZvqnYUb-Ii1My5_AexXvKMSs,25641
|
|
|