openrlhf

View on PyPI | Reverse Dependencies (0)

0.5.1 openrlhf-0.5.1-cp311-cp311-manylinux1_x86_64.whl
openrlhf-0.5.1-cp310-cp310-manylinux1_x86_64.whl
0.5.0 openrlhf-0.5.0-cp311-cp311-manylinux1_x86_64.whl
openrlhf-0.5.0-cp310-cp310-manylinux1_x86_64.whl

Wheel Details

Project: openrlhf
Version: 0.5.1
Filename: openrlhf-0.5.1-cp310-cp310-manylinux1_x86_64.whl
Download: [link]
Size: 129357
MD5: e0dafb6e298d8ae44e394629691b4cb3
SHA256: 567ab1da402c4fbfd93137c68892a6c5efc596e7f6cf8e301984656d5937aa2e
Uploaded: 2024-11-14 13:08:51 +0000

dist-info

METADATA

Metadata-Version: 2.1
Name: openrlhf
Version: 0.5.1
Summary: A Ray-based High-performance RLHF framework.
Classifier: Programming Language :: Python :: 3.10
Classifier: Programming Language :: Python :: 3.11
Classifier: Environment :: GPU :: NVIDIA CUDA
Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
Classifier: Topic :: System :: Distributed Computing
Requires-Python: >=3.10
Requires-Dist: accelerate
Requires-Dist: bitsandbytes
Requires-Dist: datasets
Requires-Dist: deepspeed (==0.15.0)
Requires-Dist: einops
Requires-Dist: flash-attn (==2.6.1)
Requires-Dist: isort
Requires-Dist: jsonlines
Requires-Dist: loralib
Requires-Dist: optimum
Requires-Dist: packaging
Requires-Dist: peft
Requires-Dist: ray[default] (==2.12.0)
Requires-Dist: tensorboard
Requires-Dist: torch
Requires-Dist: torchmetrics
Requires-Dist: tqdm
Requires-Dist: transformers (==4.46.1)
Requires-Dist: transformers-stream-generator
Requires-Dist: wandb
Requires-Dist: wheel
Requires-Dist: vllm (==0.4.2); extra == "vllm"
Requires-Dist: vllm (>0.4.2); extra == "vllm-latest"
Provides-Extra: vllm
Provides-Extra: vllm_latest
Description-Content-Type: text/markdown
License-File: LICENSE
[Description omitted; length: 18642 characters]

WHEEL

Wheel-Version: 1.0
Generator: bdist_wheel (0.45.0)
Root-Is-Purelib: false
Tag: cp310-cp310-manylinux1_x86_64

RECORD

Path Digest Size
openrlhf-0.5.1.data/purelib/openrlhf/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
openrlhf-0.5.1.data/purelib/openrlhf/cli/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
openrlhf-0.5.1.data/purelib/openrlhf/cli/batch_inference.py sha256=ZtwvAYaqjsVN8biqLUwKRAo_28cIHICX60W9Is3di08 13926
openrlhf-0.5.1.data/purelib/openrlhf/cli/interactive_chat.py sha256=yT-zO3fQ1GOgS6VAZR5mt2CMZV9brOTbFpYcJyfBamE 4788
openrlhf-0.5.1.data/purelib/openrlhf/cli/serve_rm.py sha256=Ms8-QY6jer6RalDA14TNvvW5cNxs0fkzhLYPv7DGbv0 4208
openrlhf-0.5.1.data/purelib/openrlhf/cli/train_dpo.py sha256=5TOqdIonMQcrBUO-IGFGQzFzuIWEp1jLr0k1ArUE8mk 11515
openrlhf-0.5.1.data/purelib/openrlhf/cli/train_kd.py sha256=qAL8s-uJ6d095DGXZGl4WrWgNDn7vyBR-EZbt6kkvVg 9758
openrlhf-0.5.1.data/purelib/openrlhf/cli/train_kto.py sha256=n5Pf1CPrYSkhwdU8TGzR9yMgG5yrUkoBqb7DvJPviBU 9628
openrlhf-0.5.1.data/purelib/openrlhf/cli/train_ppo.py sha256=tyP-YLaPL2B0E0UrG3atdgJ7pmcP8xDR0qwkvMCOLec 17605
openrlhf-0.5.1.data/purelib/openrlhf/cli/train_ppo_ray.py sha256=oijFLvdcXZ6N-VAgdRBcPlUFwUGpwxD294OvF5Ag9XY 17751
openrlhf-0.5.1.data/purelib/openrlhf/cli/train_prm.py sha256=b_j0r6jRtzz4Q_1WNIFfGcKjonA4ajn6vnavBh7KXwg 8933
openrlhf-0.5.1.data/purelib/openrlhf/cli/train_rm.py sha256=xjkuZpgPOCj7cjcdD1Gcf__YE6mHZs72sSTd3LfBbzc 10652
openrlhf-0.5.1.data/purelib/openrlhf/cli/train_sft.py sha256=ZSI-qkmmfCYVsuKjZyNIzxEwCtCIjCNMcYMcgBxUIS8 9768
openrlhf-0.5.1.data/purelib/openrlhf/datasets/__init__.py sha256=l3wBBZXsbrnhKtOB0eR-oGI_SeO3MsYEPFAvh3VGZB8 245
openrlhf-0.5.1.data/purelib/openrlhf/datasets/process_reward_dataset.py sha256=0dgYmQYwrNvmDMPkWNwT7lPXqdRypwB4OwnXHXZuOMQ 4773
openrlhf-0.5.1.data/purelib/openrlhf/datasets/prompts_dataset.py sha256=0FkahFZn3j4dIx_0LmGpakMIVEDvTcW1P4kyqGSWVS8 1739
openrlhf-0.5.1.data/purelib/openrlhf/datasets/reward_dataset.py sha256=a0ielgZkfYdQV3HSQe6sKj450HsfeeNWc_pfzmRQq08 8611
openrlhf-0.5.1.data/purelib/openrlhf/datasets/sft_dataset.py sha256=oq4rJmqt9v5Aubm_pSeaBsa-3swMedgXEyRFYwFx51A 6448
openrlhf-0.5.1.data/purelib/openrlhf/datasets/unpaired_preference_dataset.py sha256=x29425FkYRfrF5a9TXXBCZI0Uu7fgGDYdXJii3JBImg 5726
openrlhf-0.5.1.data/purelib/openrlhf/datasets/utils.py sha256=CrcY5A7N7eHz7vLtFo7-GD-ydTaXBgVh8r8PPSUoMfU 585
openrlhf-0.5.1.data/purelib/openrlhf/models/__init__.py sha256=SVRzZmnsOwe5QlLR2i5IVcmLKbMeMkmzEH4StWBDqpw 249
openrlhf-0.5.1.data/purelib/openrlhf/models/actor.py sha256=btSr7PXfrpXbLBp-W2T3KOBu3rdJzx1aXs0MAQfBIyM 9413
openrlhf-0.5.1.data/purelib/openrlhf/models/loss.py sha256=cEx-E9UmlHEP8e1Iwd2StTPrM9z6pxkduDl1MqnOITQ 11255
openrlhf-0.5.1.data/purelib/openrlhf/models/model.py sha256=P4RevTFrG_lWGn9AoGbcWRNVFpto7qSybKKVsSPjUzc 11655
openrlhf-0.5.1.data/purelib/openrlhf/models/ring_attn_utils.py sha256=7yd-_1K9EP5VE4uTcsEsLkXhDOI0Ne800bFx7TvqozU 2590
openrlhf-0.5.1.data/purelib/openrlhf/models/utils.py sha256=EAMTmvFk_p2yWvL9ACA4oC7YKadlA0XU5LsvMVfBR00 4277
openrlhf-0.5.1.data/purelib/openrlhf/trainer/__init__.py sha256=fMnpIziivdlJSftRDIXiqUkf31HJ2MWak7cJ-fMwBX4 272
openrlhf-0.5.1.data/purelib/openrlhf/trainer/dpo_trainer.py sha256=LrXz3wvbOpjlqLFKnHOkTsjzwCi44seKgGmCA98ollY 21383
openrlhf-0.5.1.data/purelib/openrlhf/trainer/kd_trainer.py sha256=ElAz0Sc8ezleHFyC8QApWQg8FPFOB71gg9OaI4_Am8k 10545
openrlhf-0.5.1.data/purelib/openrlhf/trainer/kto_trainer.py sha256=J_AAIX2ol2zqwibi4usjoY1pu5BKpUeM8vsOmtDGbKw 14487
openrlhf-0.5.1.data/purelib/openrlhf/trainer/ppo_trainer.py sha256=_Gi89nF-IrUkrxR_cnFx_DrB_0ffa1bWEvb14l_qamw 21424
openrlhf-0.5.1.data/purelib/openrlhf/trainer/prm_trainer.py sha256=bdYv68ijxacEYLWI-5uJ8ZjpbYPoIaDf8g-tIFFJ15A 10016
openrlhf-0.5.1.data/purelib/openrlhf/trainer/rm_trainer.py sha256=TfJ8jGsN0AmYAz7VjzC-AVOPl1-ePPf828Cj7zWbgxE 16309
openrlhf-0.5.1.data/purelib/openrlhf/trainer/sft_trainer.py sha256=y5Kc75bgnaYpw-WAgxT3mEn01wJZyelPI1CXZa5ArBM 11668
openrlhf-0.5.1.data/purelib/openrlhf/trainer/ppo_utils/__init__.py sha256=8cK-pZd7WwO14h6at9EA_Oj-QLUK_x1doM51ayFvWBw 198
openrlhf-0.5.1.data/purelib/openrlhf/trainer/ppo_utils/experience_maker.py sha256=yNvVTYKrTcrCfbXXuEq7zfTRteh7xEP4HzEptp03ssY 29725
openrlhf-0.5.1.data/purelib/openrlhf/trainer/ppo_utils/kl_controller.py sha256=nzcvDrFUDuysAnwJR5SWek8Hwv-K2l49cL7std-FaGA 738
openrlhf-0.5.1.data/purelib/openrlhf/trainer/ppo_utils/replay_buffer.py sha256=EyS5tjpD4JJ10S58r1_j1PTZ8GEeb8xvb6ZlIMWTOZo 7644
openrlhf-0.5.1.data/purelib/openrlhf/trainer/ray/__init__.py sha256=jzfMQ4LLoEOvsps9H7pT_TjAn5KyuIT5xnwp5_wRfCs 241
openrlhf-0.5.1.data/purelib/openrlhf/trainer/ray/launcher.py sha256=pj4ZMrUMMo5x-nOYufH2gRJgbEhaFidhk1LqvC1OHxA 12520
openrlhf-0.5.1.data/purelib/openrlhf/trainer/ray/ppo_actor.py sha256=WszrWRxve4RB35AqGNUV57yWMKyOi1JzgYaFHLMe-PY 15135
openrlhf-0.5.1.data/purelib/openrlhf/trainer/ray/ppo_critic.py sha256=TyP__9kChU_NLHP7o6UfaXKQRd6dbbK4FoACdKGT49Q 7132
openrlhf-0.5.1.data/purelib/openrlhf/trainer/ray/vllm_engine.py sha256=HJiig-0Ck642xiIHc0610jWDiblljyCl5577QFxvbUM 4694
openrlhf-0.5.1.data/purelib/openrlhf/trainer/ray/vllm_worker_wrap.py sha256=f9PU09TF_J9o58UaU3aLSiILpIZHLj0w-7HHU537jFc 1873
openrlhf-0.5.1.data/purelib/openrlhf/utils/__init__.py sha256=2L_K3fD6o1REMQ8LUNc9Xnqh3ad1AyeuvR97QpTdUxc 166
openrlhf-0.5.1.data/purelib/openrlhf/utils/deepspeed.py sha256=45zrr8xuOO6YCr0LSldvOn6GSofQOzwqEV7A-tueKDg 17107
openrlhf-0.5.1.data/purelib/openrlhf/utils/deepspeed_utils.py sha256=4VhNS6FmBl4Ii6SoGXAOwASYxYwLDSDUWlSVld4Vfwk 3115
openrlhf-0.5.1.data/purelib/openrlhf/utils/distributed_sampler.py sha256=WgmRlcY-R19C_RfkO0xA7REzrDI39iNBC-__zJAFzac 6482
openrlhf-0.5.1.data/purelib/openrlhf/utils/distributed_util.py sha256=QLTxvaV6mNZvnucyuZLKegqr7ae3bR2BlDGq_iiPQXo 2347
openrlhf-0.5.1.data/purelib/openrlhf/utils/logging_utils.py sha256=Ph1HPTiuqllCugM5jXCxB_3Ts-LnGEED2AYCo8eGBto 1796
openrlhf-0.5.1.data/purelib/openrlhf/utils/processor.py sha256=3n9ya135UGqr2ey5uzxlfFPV7vhODekxyVmJAgm1e-k 3093
openrlhf-0.5.1.data/purelib/openrlhf/utils/remote_rm_utils.py sha256=NX-M-JMlgOJlyCvNrQUJDzd8xNVhO7msQmVJVH82kvs 1737
openrlhf-0.5.1.data/purelib/openrlhf/utils/utils.py sha256=4SgEvbF8t2kGXMJ69NdW1rEDJHtz_CdBBmIcHFwV_S4 4578
openrlhf-0.5.1.dist-info/LICENSE sha256=QwcOLU5TJoTeUhuIXzhdCEEDDvorGiC6-3YTOl4TecE 11356
openrlhf-0.5.1.dist-info/METADATA sha256=b7y8bjU1uNw1xlz0b_OlmsjlNPluUHL4ySTOo-aGCLE 19928
openrlhf-0.5.1.dist-info/WHEEL sha256=LhMuTQRgPmHRbvWpgkjl7i0JI_W0ZDIPY5R6r3j2-8o 110
openrlhf-0.5.1.dist-info/top_level.txt sha256=PKhp5t7FXoRFbYrUoMcbRiF_qVRlj4NRLGQYc4M3axY 9
openrlhf-0.5.1.dist-info/RECORD

top_level.txt

openrlhf