openrlhf

View on PyPI | Reverse Dependencies (0)

0.5.6 openrlhf-0.5.6-cp311-cp311-manylinux1_x86_64.whl
openrlhf-0.5.6-cp310-cp310-manylinux1_x86_64.whl

Wheel Details

Project: openrlhf
Version: 0.5.6
Filename: openrlhf-0.5.6-cp310-cp310-manylinux1_x86_64.whl
Download: [link]
Size: 135086
MD5: 70556e3a51679cbc2722fb121101e599
SHA256: a824f4582465336e0c808482e452277dd6a8924ad4f1018734ef4af7f95c5aa2
Uploaded: 2025-01-08 01:12:09 +0000

dist-info

METADATA

Metadata-Version: 2.1
Name: openrlhf
Version: 0.5.6
Summary: A Ray-based High-performance RLHF framework.
Author: OpenRLHF Team
Classifier: Programming Language :: Python :: 3.10
Classifier: Programming Language :: Python :: 3.11
Classifier: Environment :: GPU :: NVIDIA CUDA
Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
Classifier: Topic :: System :: Distributed Computing
Requires-Python: >=3.10
Requires-Dist: accelerate
Requires-Dist: bitsandbytes
Requires-Dist: datasets
Requires-Dist: deepspeed (==0.15.0)
Requires-Dist: einops
Requires-Dist: flash-attn (==2.7.0.post2)
Requires-Dist: isort
Requires-Dist: jsonlines
Requires-Dist: loralib
Requires-Dist: optimum
Requires-Dist: packaging
Requires-Dist: peft
Requires-Dist: ray[default] (==2.12.0)
Requires-Dist: tensorboard
Requires-Dist: torch
Requires-Dist: torchmetrics
Requires-Dist: tqdm
Requires-Dist: transformers (==4.46.3)
Requires-Dist: transformers-stream-generator
Requires-Dist: wandb
Requires-Dist: wheel
Requires-Dist: vllm (==0.6.5); extra == "vllm"
Requires-Dist: vllm (>0.6.5); extra == "vllm-latest"
Provides-Extra: vllm
Provides-Extra: vllm_latest
Description-Content-Type: text/markdown
License-File: LICENSE
[Description omitted; length: 21237 characters]

WHEEL

Wheel-Version: 1.0
Generator: bdist_wheel (0.45.1)
Root-Is-Purelib: false
Tag: cp310-cp310-manylinux1_x86_64

RECORD

Path Digest Size
openrlhf-0.5.6.data/purelib/openrlhf/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
openrlhf-0.5.6.data/purelib/openrlhf/cli/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
openrlhf-0.5.6.data/purelib/openrlhf/cli/batch_inference.py sha256=nmaLlawab_nS4GgSQc0ESE47f5xVlLDXtL0C7T_uV_s 13895
openrlhf-0.5.6.data/purelib/openrlhf/cli/interactive_chat.py sha256=PeYOrr_c-6gf4fI9sUIXtPBEIA4VUnyEgTglMHvmHJA 4813
openrlhf-0.5.6.data/purelib/openrlhf/cli/lora_combiner.py sha256=zjocHW0sSBemjMk8exojAjmC9KlrHxjciC-G7CfjW0M 1927
openrlhf-0.5.6.data/purelib/openrlhf/cli/serve_rm.py sha256=p3kh_P7MlR408i5t6n9IipDTfHMDou8J7QfXd3U0t0Y 4203
openrlhf-0.5.6.data/purelib/openrlhf/cli/train_dpo.py sha256=yak8Xxe5nvbQMVNGTgN_glWNDurPekerj7vtzOEkZuU 11553
openrlhf-0.5.6.data/purelib/openrlhf/cli/train_kd.py sha256=kkjgPSvr1BmCmDpNqUtxJ4gLh_HFmaDn3FSSqu4ofDY 9858
openrlhf-0.5.6.data/purelib/openrlhf/cli/train_kto.py sha256=U3t-Pq5JwqZlptZfv4O_7-1B-WKLY55vMetFJ8NqWQE 9913
openrlhf-0.5.6.data/purelib/openrlhf/cli/train_ppo.py sha256=3j4-iNbFpyoZc9iQKjyv6XQBzk_V8rSrGlFeLGfm4WI 17835
openrlhf-0.5.6.data/purelib/openrlhf/cli/train_ppo_ray.py sha256=CEE-Z-wTjkPEFlvFnD3v-ipwWHB434IxUdhR1Jg_YWw 18069
openrlhf-0.5.6.data/purelib/openrlhf/cli/train_prm.py sha256=zUejY1-0aR5iZ7BiPYURu8C3rmLuJn-VuEWYLiha3xU 9013
openrlhf-0.5.6.data/purelib/openrlhf/cli/train_rm.py sha256=aIn2QJllGcSqhwWYmudFJy0CjgiTZ0S_Rr3F8WFnwbc 10912
openrlhf-0.5.6.data/purelib/openrlhf/cli/train_sft.py sha256=O9rCOBL5o4fESuygV277WE3HSDMrG1ucK1N00DPCRbc 10542
openrlhf-0.5.6.data/purelib/openrlhf/datasets/__init__.py sha256=PiPW5UikYPtgjiPL5BXTvd9Ft8Q5dGXGQdUJeJAr6Ok 358
openrlhf-0.5.6.data/purelib/openrlhf/datasets/process_reward_dataset.py sha256=zBymQVI04IABMoaMYHinqb3RllRbX8xuXTr7GuYZJDE 5391
openrlhf-0.5.6.data/purelib/openrlhf/datasets/prompts_dataset.py sha256=YBz-KIU0YyfO_t-nhrRb2pzzcYm1Hse6ruNGY_3Phf4 1701
openrlhf-0.5.6.data/purelib/openrlhf/datasets/reward_dataset.py sha256=S3QXP2JJPmZj-LaaiLPFXRppSBs-XOJUS6qDOGzHeX0 8589
openrlhf-0.5.6.data/purelib/openrlhf/datasets/sft_dataset.py sha256=KM5ApEBA7gCo7YzSurbpJOevX6oc4X5qZa86G5nV5WQ 7329
openrlhf-0.5.6.data/purelib/openrlhf/datasets/unpaired_preference_dataset.py sha256=HiN2Ny6_aFyhFmLsqLlc7F6NkergISjB6yWlFVZvuLA 5665
openrlhf-0.5.6.data/purelib/openrlhf/datasets/utils.py sha256=YvviQtboetqvL7FFuyBVlA3HnVT8eGA5vepNrIYcW2U 552
openrlhf-0.5.6.data/purelib/openrlhf/models/__init__.py sha256=nF-wgPkpasxjj0C2f-lG-k-RKo0yYq8fU5J37zUqNJ0 487
openrlhf-0.5.6.data/purelib/openrlhf/models/actor.py sha256=wKx1hcWO5H4l7h5L3ZTaeh4JRDt4LpmySB39qpjIJ_0 10758
openrlhf-0.5.6.data/purelib/openrlhf/models/loss.py sha256=_GyBW3qH48H9mn3_rP71_J99cd9AC8uh66pn2zeGnxo 12556
openrlhf-0.5.6.data/purelib/openrlhf/models/model.py sha256=gXnYNm3jwOZqbDWygOX-MMWWZiBAxQwxlHz_77yKZT8 12955
openrlhf-0.5.6.data/purelib/openrlhf/models/ring_attn_utils.py sha256=7yd-_1K9EP5VE4uTcsEsLkXhDOI0Ne800bFx7TvqozU 2590
openrlhf-0.5.6.data/purelib/openrlhf/models/utils.py sha256=SO4_0NAtdrX6OniGs_eLjGI9VLYy2Tz2bfvIp1NtyKI 4254
openrlhf-0.5.6.data/purelib/openrlhf/trainer/__init__.py sha256=aVyKN-flp20cQ20A_enD3G7Xn0BKzRufo0M_VJ0UqAg 435
openrlhf-0.5.6.data/purelib/openrlhf/trainer/dpo_trainer.py sha256=IwiVN5fYi_LVncSACDszw-wic3Swp9EZ8PDbfBx3DCw 21492
openrlhf-0.5.6.data/purelib/openrlhf/trainer/kd_trainer.py sha256=PkPchTiDtssd2MiQLKHgMQbW_KJm0Z27RQrxaIEH8dA 10602
openrlhf-0.5.6.data/purelib/openrlhf/trainer/kto_trainer.py sha256=LJqzJN_7YxqmU1-CxNuewhxI6Owiy8CblePhuwiqYVw 14760
openrlhf-0.5.6.data/purelib/openrlhf/trainer/ppo_trainer.py sha256=YBMz4JMWXgu8sWAGz1ecF6iwfa4pbjwQLuJiDnxR4uo 21369
openrlhf-0.5.6.data/purelib/openrlhf/trainer/prm_trainer.py sha256=HM8O-HF-VKfzLfpVPF8wYHNtc1sUVyxiku1vLwoycvk 10498
openrlhf-0.5.6.data/purelib/openrlhf/trainer/rm_trainer.py sha256=LLRgYjH5C2GLnXoHZDBHCzhWoMkNLZrKmwyMwD8r_8A 16413
openrlhf-0.5.6.data/purelib/openrlhf/trainer/sft_trainer.py sha256=_pLuCez6Zpq_0i8HtFFwpR6UolsAG_4c8UICoRb3LoQ 12588
openrlhf-0.5.6.data/purelib/openrlhf/trainer/ppo_utils/__init__.py sha256=1uRwHMw3NNaSOqZVgZYEX6nVA2vkaNi_DaTg7_zKwD0 366
openrlhf-0.5.6.data/purelib/openrlhf/trainer/ppo_utils/experience_maker.py sha256=kg4tkf0vwO788zTTrNPbFBQzmy_Aq4J1ZoDFAixuEp0 30639
openrlhf-0.5.6.data/purelib/openrlhf/trainer/ppo_utils/kl_controller.py sha256=w2F0RkftKEUHxGQ6aMBqxgVsDW8cV1oDb40eAFCr4ww 712
openrlhf-0.5.6.data/purelib/openrlhf/trainer/ppo_utils/replay_buffer.py sha256=q2dJY9DG2w7Y2WTCXrq94eG2sRJd5bxwj5Jx8TQiuow 7598
openrlhf-0.5.6.data/purelib/openrlhf/trainer/ray/__init__.py sha256=cUTmBbbH-QbbkTixLtEsXZoJDe5cNp65UNth4-6PwiI 449
openrlhf-0.5.6.data/purelib/openrlhf/trainer/ray/launcher.py sha256=NEw4mERTuqQkJv06k0P2wm6zSCFcBRbgQfht82de1tk 12546
openrlhf-0.5.6.data/purelib/openrlhf/trainer/ray/ppo_actor.py sha256=DWIWV5u92L8HVWST7OLjbHpY9TeP0Ynh57ofWBu9jho 15133
openrlhf-0.5.6.data/purelib/openrlhf/trainer/ray/ppo_critic.py sha256=VDaYF3kn53uxWGasBdfuu3nC_DPDWqFzlCmJ4-xamqc 7138
openrlhf-0.5.6.data/purelib/openrlhf/trainer/ray/utils.py sha256=cckNw8B9Yvm1Sw5g3ysqtpfRuFXnAYZJngLPh2vXqe0 1585
openrlhf-0.5.6.data/purelib/openrlhf/trainer/ray/vllm_engine.py sha256=IALFv7sf3mMzkHIzKh7SyDD8Q1J-fZFKY-nAzoWxHu4 5557
openrlhf-0.5.6.data/purelib/openrlhf/trainer/ray/vllm_worker_wrap.py sha256=U4ga5KMrqc8lQ58lNjf5Wj8SbHazR8_FUejuqyZntxY 1840
openrlhf-0.5.6.data/purelib/openrlhf/utils/__init__.py sha256=gvChatVozgw_6V3syLWiNa1UxgXWMWvbhzROuJU5sNo 255
openrlhf-0.5.6.data/purelib/openrlhf/utils/distributed_sampler.py sha256=WgmRlcY-R19C_RfkO0xA7REzrDI39iNBC-__zJAFzac 6482
openrlhf-0.5.6.data/purelib/openrlhf/utils/distributed_util.py sha256=_lfyFjK6od93L8e2ilaaBwrX8irpYWsFJXmntg99b9o 2321
openrlhf-0.5.6.data/purelib/openrlhf/utils/logging_utils.py sha256=Ph1HPTiuqllCugM5jXCxB_3Ts-LnGEED2AYCo8eGBto 1796
openrlhf-0.5.6.data/purelib/openrlhf/utils/processor.py sha256=3n9ya135UGqr2ey5uzxlfFPV7vhODekxyVmJAgm1e-k 3093
openrlhf-0.5.6.data/purelib/openrlhf/utils/remote_rm_utils.py sha256=NX-M-JMlgOJlyCvNrQUJDzd8xNVhO7msQmVJVH82kvs 1737
openrlhf-0.5.6.data/purelib/openrlhf/utils/utils.py sha256=QAJYkxUzQayYNW0u07PVHsPIMRJBnXtnIE5g2OVapNw 4559
openrlhf-0.5.6.data/purelib/openrlhf/utils/deepspeed/__init__.py sha256=yA06KP9cJZR_LEqLol0DX87RgXIdQawPtAqrX5dLF_4 81
openrlhf-0.5.6.data/purelib/openrlhf/utils/deepspeed/deepspeed.py sha256=OM0LenFDXzOatNwHUdWxA834Skp64Bii7pRwWvCBc18 17277
openrlhf-0.5.6.data/purelib/openrlhf/utils/deepspeed/deepspeed_utils.py sha256=LcbtXn9z8oRfSf_Ng1U7zAWK5MXirTjty-PkEpsl7xM 2940
openrlhf-0.5.6.dist-info/LICENSE sha256=QwcOLU5TJoTeUhuIXzhdCEEDDvorGiC6-3YTOl4TecE 11356
openrlhf-0.5.6.dist-info/METADATA sha256=EoSi93_oRcSmGzWms-D8gy8mZWTeIj7HSpEiHs4h6mk 22560
openrlhf-0.5.6.dist-info/WHEEL sha256=6GGaUuu07pzjkTYE39hugrrNVQwFmiPXwEWe_OwpsFE 110
openrlhf-0.5.6.dist-info/top_level.txt sha256=PKhp5t7FXoRFbYrUoMcbRiF_qVRlj4NRLGQYc4M3axY 9
openrlhf-0.5.6.dist-info/RECORD

top_level.txt

openrlhf