openrlhf
View on PyPI — Reverse Dependencies (0)
Wheel Details
Project: | openrlhf |
Version: | 0.5.0 |
Filename: | openrlhf-0.5.0-cp311-cp311-manylinux1_x86_64.whl |
Download: | [link] |
Size: | 126807 |
MD5: | 75fe6fe8ae9c5138e3051100bcdbbd45 |
SHA256: | bf311d564a53a51ac4bd17d782ddbbf00eb5f3371d15cd610bcaa748756b5274 |
Uploaded: | 2024-11-07 10:28:09 +0000 |
dist-info
METADATA · WHEEL · RECORD · top_level.txt
METADATA
WHEEL
Wheel-Version: | 1.0 |
Generator: | bdist_wheel (0.44.0) |
Root-Is-Purelib: | false |
Tag: | cp311-cp311-manylinux1_x86_64 |
RECORD
Path | Digest | Size |
---|---|---|
openrlhf-0.5.0.data/purelib/openrlhf/__init__.py | sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU | 0 |
openrlhf-0.5.0.data/purelib/openrlhf/cli/__init__.py | sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU | 0 |
openrlhf-0.5.0.data/purelib/openrlhf/cli/batch_inference.py | sha256=ZtwvAYaqjsVN8biqLUwKRAo_28cIHICX60W9Is3di08 | 13926 |
openrlhf-0.5.0.data/purelib/openrlhf/cli/interactive_chat.py | sha256=HsQeVhOfk-FphDYyZ5WDyEUinLdo_PHxztBR0dOXCyA | 4302 |
openrlhf-0.5.0.data/purelib/openrlhf/cli/serve_rm.py | sha256=Ms8-QY6jer6RalDA14TNvvW5cNxs0fkzhLYPv7DGbv0 | 4208 |
openrlhf-0.5.0.data/purelib/openrlhf/cli/train_dpo.py | sha256=pQEiuMkscKWbwSeqTE-dQmf7HOLyvWORScI0TpPnFxY | 11287 |
openrlhf-0.5.0.data/purelib/openrlhf/cli/train_kd.py | sha256=xEf9yA_GxyY_tSG65FBJs4w4mGMIekRRs6uNtg6xq9Q | 9359 |
openrlhf-0.5.0.data/purelib/openrlhf/cli/train_kto.py | sha256=3fkBlDAbJS5to6NjsAbY5AfldfOepQAbOZhpXUYhrkE | 9399 |
openrlhf-0.5.0.data/purelib/openrlhf/cli/train_ppo.py | sha256=OAvqLnECkjesIUO-prTplJgXaTmTAyhJqDTzsXJ5V1Q | 16920 |
openrlhf-0.5.0.data/purelib/openrlhf/cli/train_ppo_ray.py | sha256=54P1_9B9dzRIQ-MhFjvjIfv08maPAFhBEAj0nBcp9LU | 17184 |
openrlhf-0.5.0.data/purelib/openrlhf/cli/train_prm.py | sha256=b_j0r6jRtzz4Q_1WNIFfGcKjonA4ajn6vnavBh7KXwg | 8933 |
openrlhf-0.5.0.data/purelib/openrlhf/cli/train_rm.py | sha256=INKyjJ9EONgp5eG9-7i4h0PhQ7Z-vHdsQNdAnNMq0eE | 10424 |
openrlhf-0.5.0.data/purelib/openrlhf/cli/train_sft.py | sha256=JZ0yxwA6IlVAegrl9pl_-PRNZjOTnqVxZQ7CoVVuwPM | 9540 |
openrlhf-0.5.0.data/purelib/openrlhf/datasets/__init__.py | sha256=l3wBBZXsbrnhKtOB0eR-oGI_SeO3MsYEPFAvh3VGZB8 | 245 |
openrlhf-0.5.0.data/purelib/openrlhf/datasets/process_reward_dataset.py | sha256=0dgYmQYwrNvmDMPkWNwT7lPXqdRypwB4OwnXHXZuOMQ | 4773 |
openrlhf-0.5.0.data/purelib/openrlhf/datasets/prompts_dataset.py | sha256=0FkahFZn3j4dIx_0LmGpakMIVEDvTcW1P4kyqGSWVS8 | 1739 |
openrlhf-0.5.0.data/purelib/openrlhf/datasets/reward_dataset.py | sha256=a0ielgZkfYdQV3HSQe6sKj450HsfeeNWc_pfzmRQq08 | 8611 |
openrlhf-0.5.0.data/purelib/openrlhf/datasets/sft_dataset.py | sha256=oq4rJmqt9v5Aubm_pSeaBsa-3swMedgXEyRFYwFx51A | 6448 |
openrlhf-0.5.0.data/purelib/openrlhf/datasets/unpaired_preference_dataset.py | sha256=x29425FkYRfrF5a9TXXBCZI0Uu7fgGDYdXJii3JBImg | 5726 |
openrlhf-0.5.0.data/purelib/openrlhf/datasets/utils.py | sha256=CrcY5A7N7eHz7vLtFo7-GD-ydTaXBgVh8r8PPSUoMfU | 585 |
openrlhf-0.5.0.data/purelib/openrlhf/models/__init__.py | sha256=SVRzZmnsOwe5QlLR2i5IVcmLKbMeMkmzEH4StWBDqpw | 249 |
openrlhf-0.5.0.data/purelib/openrlhf/models/actor.py | sha256=btSr7PXfrpXbLBp-W2T3KOBu3rdJzx1aXs0MAQfBIyM | 9413 |
openrlhf-0.5.0.data/purelib/openrlhf/models/loss.py | sha256=cEx-E9UmlHEP8e1Iwd2StTPrM9z6pxkduDl1MqnOITQ | 11255 |
openrlhf-0.5.0.data/purelib/openrlhf/models/model.py | sha256=P4RevTFrG_lWGn9AoGbcWRNVFpto7qSybKKVsSPjUzc | 11655 |
openrlhf-0.5.0.data/purelib/openrlhf/models/ring_attn_utils.py | sha256=7yd-_1K9EP5VE4uTcsEsLkXhDOI0Ne800bFx7TvqozU | 2590 |
openrlhf-0.5.0.data/purelib/openrlhf/models/utils.py | sha256=EAMTmvFk_p2yWvL9ACA4oC7YKadlA0XU5LsvMVfBR00 | 4277 |
openrlhf-0.5.0.data/purelib/openrlhf/trainer/__init__.py | sha256=fMnpIziivdlJSftRDIXiqUkf31HJ2MWak7cJ-fMwBX4 | 272 |
openrlhf-0.5.0.data/purelib/openrlhf/trainer/dpo_trainer.py | sha256=UjGvmzGe12k9Of05BOWEWvvbxGNrrRGKQNcUIJq0HBw | 21055 |
openrlhf-0.5.0.data/purelib/openrlhf/trainer/kd_trainer.py | sha256=Xo9gIk9PN4XRWMSz4GnFv48puaE0XwgHkZiCetSm5G4 | 10244 |
openrlhf-0.5.0.data/purelib/openrlhf/trainer/kto_trainer.py | sha256=1p9CJte1k-vWswhbF-Z4k2QfmO6mqI5_5Vh8H7N-Qfk | 14260 |
openrlhf-0.5.0.data/purelib/openrlhf/trainer/ppo_trainer.py | sha256=cWgA8o9xFCH98O4YgJWk_YZn8VhxS5L4S7ve1pnTQ6k | 20623 |
openrlhf-0.5.0.data/purelib/openrlhf/trainer/prm_trainer.py | sha256=OXJzaa3lZBliI47Wiwz0xJ0HYB-i90TDAYiMW0VdN1M | 9893 |
openrlhf-0.5.0.data/purelib/openrlhf/trainer/rm_trainer.py | sha256=AvdVEevUOVaYpUDmFY4FrIoeGiDrFLdgEt-A0d8oK9M | 16092 |
openrlhf-0.5.0.data/purelib/openrlhf/trainer/sft_trainer.py | sha256=gUzoZGsn5Uuj3ihggW-cZZdsnNfAYu0FXXwNxEMn5UU | 11407 |
openrlhf-0.5.0.data/purelib/openrlhf/trainer/ppo_utils/__init__.py | sha256=8cK-pZd7WwO14h6at9EA_Oj-QLUK_x1doM51ayFvWBw | 198 |
openrlhf-0.5.0.data/purelib/openrlhf/trainer/ppo_utils/experience_maker.py | sha256=946doo3vFi0JDn_d4FuEH9bHRzHuK-LuyQ5FspSjMYs | 26155 |
openrlhf-0.5.0.data/purelib/openrlhf/trainer/ppo_utils/kl_controller.py | sha256=nzcvDrFUDuysAnwJR5SWek8Hwv-K2l49cL7std-FaGA | 738 |
openrlhf-0.5.0.data/purelib/openrlhf/trainer/ppo_utils/replay_buffer.py | sha256=QnjNCU6UOs5U4Nq93hPfMsfkQgbLTQ0eUqrPxRnE2L0 | 7574 |
openrlhf-0.5.0.data/purelib/openrlhf/trainer/ray/__init__.py | sha256=jzfMQ4LLoEOvsps9H7pT_TjAn5KyuIT5xnwp5_wRfCs | 241 |
openrlhf-0.5.0.data/purelib/openrlhf/trainer/ray/launcher.py | sha256=toGWkWSAUEqr6IFEMyOqltUULmbgwe08CT6-EtYV1RE | 12435 |
openrlhf-0.5.0.data/purelib/openrlhf/trainer/ray/ppo_actor.py | sha256=WszrWRxve4RB35AqGNUV57yWMKyOi1JzgYaFHLMe-PY | 15135 |
openrlhf-0.5.0.data/purelib/openrlhf/trainer/ray/ppo_critic.py | sha256=TyP__9kChU_NLHP7o6UfaXKQRd6dbbK4FoACdKGT49Q | 7132 |
openrlhf-0.5.0.data/purelib/openrlhf/trainer/ray/vllm_engine.py | sha256=HJiig-0Ck642xiIHc0610jWDiblljyCl5577QFxvbUM | 4694 |
openrlhf-0.5.0.data/purelib/openrlhf/trainer/ray/vllm_worker_wrap.py | sha256=f9PU09TF_J9o58UaU3aLSiILpIZHLj0w-7HHU537jFc | 1873 |
openrlhf-0.5.0.data/purelib/openrlhf/utils/__init__.py | sha256=2L_K3fD6o1REMQ8LUNc9Xnqh3ad1AyeuvR97QpTdUxc | 166 |
openrlhf-0.5.0.data/purelib/openrlhf/utils/deepspeed.py | sha256=ODmkbgnjXJxPM9ajHAHw17i1BCs3_jXAA7O6P91_xlc | 16991 |
openrlhf-0.5.0.data/purelib/openrlhf/utils/deepspeed_utils.py | sha256=4VhNS6FmBl4Ii6SoGXAOwASYxYwLDSDUWlSVld4Vfwk | 3115 |
openrlhf-0.5.0.data/purelib/openrlhf/utils/distributed_sampler.py | sha256=WgmRlcY-R19C_RfkO0xA7REzrDI39iNBC-__zJAFzac | 6482 |
openrlhf-0.5.0.data/purelib/openrlhf/utils/distributed_util.py | sha256=QLTxvaV6mNZvnucyuZLKegqr7ae3bR2BlDGq_iiPQXo | 2347 |
openrlhf-0.5.0.data/purelib/openrlhf/utils/logging_utils.py | sha256=Ph1HPTiuqllCugM5jXCxB_3Ts-LnGEED2AYCo8eGBto | 1796 |
openrlhf-0.5.0.data/purelib/openrlhf/utils/processor.py | sha256=3n9ya135UGqr2ey5uzxlfFPV7vhODekxyVmJAgm1e-k | 3093 |
openrlhf-0.5.0.data/purelib/openrlhf/utils/remote_rm_utils.py | sha256=1-0y0MKlMGLuzlcYiHfboSKQHA0xVfk1oH7gDiNlgog | 1725 |
openrlhf-0.5.0.data/purelib/openrlhf/utils/utils.py | sha256=4SgEvbF8t2kGXMJ69NdW1rEDJHtz_CdBBmIcHFwV_S4 | 4578 |
openrlhf-0.5.0.dist-info/LICENSE | sha256=QwcOLU5TJoTeUhuIXzhdCEEDDvorGiC6-3YTOl4TecE | 11356 |
openrlhf-0.5.0.dist-info/METADATA | sha256=kPo9N6a5Ap68ODUn5vtQRJ17_4lDDvswrw0pYPlEXqE | 19968 |
openrlhf-0.5.0.dist-info/WHEEL | sha256=Vd5A18-d2wZAY8WDmgxtOE2bK9Ob_vQGjJ7aeTWaXz4 | 110 |
openrlhf-0.5.0.dist-info/top_level.txt | sha256=PKhp5t7FXoRFbYrUoMcbRiF_qVRlj4NRLGQYc4M3axY | 9 |
openrlhf-0.5.0.dist-info/RECORD | — | — |
top_level.txt
openrlhf