oat-llm

View on PyPI | Reverse Dependencies (0)

0.0.9 oat_llm-0.0.9-py3-none-any.whl

Wheel Details

Project: oat-llm
Version: 0.0.9
Filename: oat_llm-0.0.9-py3-none-any.whl
Download: [link]
Size: 123038
MD5: f1d8cadef10000c88557e6fb13c0e387
SHA256: 4a7419d044188f978350b5ea84447b13fefd2a4579415feed3d7419a0b050917
Uploaded: 2025-03-21 09:43:15 +0000

dist-info

METADATA

Metadata-Version: 2.1
Name: oat-llm
Version: 0.0.9
Summary: Online AlignmenT (OAT) for LLMs.
Author: Zichen Liu
Author-Email: Zichen Liu <liuzc[at]sea.com>, Changyu Chen <chency[at]sea.com>
Home-Page: https://github.com/sail-sg/oat
Project-Url: Documentation, https://github.com/sail-sg/oat#readme
Project-Url: Issues, https://github.com/sail-sg/oat/issues
Project-Url: Source, https://github.com/sail-sg/oat
License: Apache-2.0
Keywords: rlhf,llm reasoning,llm,ai-alignment,rl,bandit,ai,sample-efficiency
Classifier: Development Status :: 4 - Beta
Classifier: Programming Language :: Python
Classifier: Programming Language :: Python :: 3.8
Classifier: Programming Language :: Python :: 3.9
Classifier: Programming Language :: Python :: 3.10
Classifier: Programming Language :: Python :: Implementation :: CPython
Classifier: Programming Language :: Python :: Implementation :: PyPy
Requires-Python: >=3.8, <3.11
Requires-Dist: accelerate
Requires-Dist: bitsandbytes
Requires-Dist: datasets
Requires-Dist: deepspeed (==0.16.3)
Requires-Dist: dm-launchpad[tensorflow]
Requires-Dist: einops
Requires-Dist: flash-attn (==2.7.0.post2)
Requires-Dist: fire
Requires-Dist: httpx
Requires-Dist: jsonlines
Requires-Dist: llm-blender (==0.0.2)
Requires-Dist: loralib
Requires-Dist: ml-collections
Requires-Dist: mosec
Requires-Dist: msgspec
Requires-Dist: optimum
Requires-Dist: packaging
Requires-Dist: peft
Requires-Dist: protobuf (==3.20.0)
Requires-Dist: pyarrow (<12,>=0.6.1)
Requires-Dist: python-Levenshtein (==0.25.1)
Requires-Dist: scipy
Requires-Dist: torchmetrics
Requires-Dist: tqdm
Requires-Dist: tyro
Requires-Dist: transformers (==4.48.2)
Requires-Dist: transformers-stream-generator
Requires-Dist: vllm (==0.7.2)
Requires-Dist: wandb
Requires-Dist: wheel
Description-Content-Type: text/markdown
License-File: LICENSE
[Description omitted; length: 6012 characters]

WHEEL

Wheel-Version: 1.0
Generator: setuptools (75.1.0)
Root-Is-Purelib: true
Tag: py3-none-any

RECORD

Path Digest Size
oat/__about__.py sha256=_ilw_kxPzYYRi7GBrXJ8OMw6FbgCZnHVSzEEw9EgFPM 631
oat/__init__.py sha256=1qFdHw5d-gq-rUaVGMqwzZxyExAbrz4XJ6jQNrqu450 594
oat/args.py sha256=X79l6un9p03woZZXxygT4l_CZMddR_4-j8EJVoOvSSg 8525
oat/exploration.py sha256=WgoFXXd0FLIAklCdizENz8CMYP7CuxbPMrIzsl3mwvs 14761
oat/interface.py sha256=oXfRIvNJkRy-GNBiKWDJfNJ9O0QWgeOO_Nv6Vti9xuM 3911
oat/model.py sha256=l4nsxK5PJUeNPO7_Y_onlpdbiJG5ZmE7hEGyLBEKg4A 11362
oat/multistep.py sha256=sm7pvNUggNNnd6dl1j0oI9C9pddSQ1oMXetS7hWvlJY 4242
oat/prompts.py sha256=rm5WFoquTASjzTMgTVPklqDBdAh3xlWHrM_Cxo9ebUU 5660
oat/types.py sha256=SnQFe_MYRwKqxvcQGQbKao1h_cVXDkv5gt1XVqm0H78 1579
oat/actors/__init__.py sha256=ip78PkydUg-ELAmshbyNGZ1RTDjb53DT3fD3vsmjsg8 733
oat/actors/base.py sha256=6ISkd46cRcFDcAewG8jCSn_1Hn3xFZzNybD0jlVLdV0 7502
oat/actors/preference.py sha256=FVCfjtLFx09ybWN8xcotuhvft_K8hFm22g6OJ7Ob8xg 9708
oat/actors/reward.py sha256=IQgj8HU3VLjN_0ilNbERzEuvk2x4AbgWT8DnC0UFg7Q 5187
oat/algorithms/__init__.py sha256=1qFdHw5d-gq-rUaVGMqwzZxyExAbrz4XJ6jQNrqu450 594
oat/algorithms/apl.py sha256=TQY2SxJVb3ixNcZi200aSmxcdLBlkVTwtyhU3qGIb10 16254
oat/algorithms/ppo.py sha256=86bz0nkVMlR7HWI3707UTT4HFMqJ6Puq0nshpg4iZ_Q 28817
oat/algorithms/rft.py sha256=Zb0OQY7UW7iJaTQyfZ9RUf5X2uMNaIq5zBlu-z7bhPw 3585
oat/algorithms/xpo.py sha256=RZDxTzMVbVNSX8tYnKsP83axezAfMKr-j5QeKOxC--8 5088
oat/collectors/__init__.py sha256=ga3mgI4jO55ExaCpVn0swrJQPM9u6AFKO2ZBSKmilCA 767
oat/collectors/asynchronous.py sha256=yHbsaCmR5-PqgoB0tQgojt714jNfz65Cb6OZushMrTg 2227
oat/collectors/base.py sha256=WSfQdkKDZo92Hpz-PBPu8S1tr2zdaGivX3wd72luIEA 3627
oat/experiment/__init__.py sha256=1qFdHw5d-gq-rUaVGMqwzZxyExAbrz4XJ6jQNrqu450 594
oat/experiment/main.py sha256=QsUJi9EwUtVDvWNjaoHU24RnuvvE0XvHA1hruL_3wQE 1342
oat/experiment/run_apl.py sha256=z-DBKM0V5kFVOrWpcw2gc2zTAtU2b6Z-sfbbvtqTvBk 1218
oat/experiment/run_offline.py sha256=8p_7VexJBzQAyHZuYZRL6yxJ-BzFJRBbtBLTvCxBGvU 1727
oat/experiment/run_offline_lp.py sha256=sd2cE3TZFdfoHxXX48r_V1rhI74mfj8hb75UoZLKmvU 1823
oat/experiment/run_offline_ppo.py sha256=YIUBAWYK6TaQxkWN73qQE_bafIjoOT0XizCp60JkLi8 1333
oat/experiment/run_ppo.py sha256=8XpW7Dhx5CapWZnqqBk0vbgnn7FKdu5wc3B2wxWdHsI 1347
oat/experiment/run_xpo.py sha256=8_t65gh7GzVSdOERKdTnUclwDk8QunV7NdP-1Z4l1mE 1153
oat/learners/__init__.py sha256=6DW6oUFlfxJ59COBTuDzAz5lj_OLDvxYsgQkLFGDlXk 1149
oat/learners/base.py sha256=80Mhs3I7pf2BvLXfKnr5vzf4WAInFN9I_BkixcssUQY 25813
oat/learners/dap.py sha256=gH8zV0U78jMoMJh78IPvK1oHGvzpPRawVI32u34q560 13915
oat/learners/dap_with_rm.py sha256=RjSMCGQpq75j5qh9Zu-7IOfBK0jrjCBAI_D8LPSA7ZA 4780
oat/learners/loss.py sha256=zMQHZcyJasbqN3gnqlnx4mkaMIpgTvXMZArAe1qbGFA 6631
oat/learners/ntp.py sha256=wIDRE1DjYlzxFhGnpzEw3IL9X1vg5aB4j34E5gNvbls 3581
oat/learners/offline.py sha256=kps1nT00ICnVB3byc6tvrf0U0CskNd2Fbdn9I8r9lQg 2540
oat/learners/offline_dap.py sha256=fstjbBL-9OriF-jM3k9vHTFL03kGh8YpRZPyr_CRudY 4262
oat/learners/rl.py sha256=Mf9hQ926YqyjqPQAaZlRheunRT0o_sAIzmY8Qa0lG-I 7438
oat/learners/sft.py sha256=KrXsubhyjRHmPVEnFrF2UpHNTgBWaszV6XXEyY4_StQ 2053
oat/oracles/__init__.py sha256=t2aEpwk9HT25HVlok0M4LQ7CAGF_cUxvR-t79oRw374 1213
oat/oracles/base.py sha256=nerRGHXMILptHPd3NTTzdNLapf0fS41EWE4MVnUMQ1M 2413
oat/oracles/countdown.py sha256=ohgiYOIJsZ_9hHMn0DagspIF4pyQ8if7P5puv7QoLBc 5394
oat/oracles/gpt.py sha256=w4zwX1q_lbC8r0l9Z199hnXpz27vFWitljc1bI-3C_w 6274
oat/oracles/gsm8k.py sha256=S23srHIi2thkfyBnwmMIl6SGoxrsriT-gyCB2j777zA 3256
oat/oracles/pair.py sha256=NWRj-4evuXWAhgAmZ_-5TE7q5nCA425ouAL92-3rCQI 1601
oat/oracles/remote/__init__.py sha256=1qFdHw5d-gq-rUaVGMqwzZxyExAbrz4XJ6jQNrqu450 594
oat/oracles/remote/client.py sha256=OLqE6HHPwfod20gSY1Gyu46I1Jg9gqrDNpeyEainCYA 6143
oat/oracles/remote/server.py sha256=GinoMzaIKujthGwgGhq_pwK_6Gf_t1d70AaWKOAnsx4 5829
oat/rm/__init__.py sha256=1qFdHw5d-gq-rUaVGMqwzZxyExAbrz4XJ6jQNrqu450 594
oat/rm/backbone.py sha256=kdD3fRmpZL9RTuMPGNRAT0LygCsv3S9g2ZRZannOc5w 8514
oat/rm/model.py sha256=5Lgt5_XhIXP-Bk77d6b_XkAEwCbPReTNfMeILhTiCNg 10247
oat/rm/networks.py sha256=t_hEFCIvWOb2blZnqGhWDUtc7szu_nDEs99hINnmj3k 4628
oat/rm/uncertainty.py sha256=mYyl-kzuCqJ11b8IoHlgw_z_O4Sx79vL63l4tPSsSWk 2799
oat/utils/__init__.py sha256=1qFdHw5d-gq-rUaVGMqwzZxyExAbrz4XJ6jQNrqu450 594
oat/utils/buffer.py sha256=UzLam3S9fR9VJdKyJ5eS1KqL0t9A_qmcH21QzGubRZw 2195
oat/utils/data.py sha256=Khus9C_TU1bml1-3Bc5ckQ5CPrz-iLdaptVEohvTTXo 16575
oat/utils/deepspeed.py sha256=TTslAXHP3osu0sNDbkc4AIG0Pu5wY7Hs4qtooNUNB6A 25673
oat/utils/distributed.py sha256=eWqt5f4qIGEGwLeYdaq9Na_QKfXzKwTyx4oS2Pl3czA 6616
oat/utils/ipc.py sha256=1t-f6TxsXVdHlN_rtF9IUojGyXZ7bSPr9DuKuUS2r54 2969
oat/utils/launcher.py sha256=_0e164FG8rSFUsyPeksLOQSFiRgcQeR5w6YJCcojJ2g 1574
oat/utils/ops.py sha256=uR7RVsw56KENbNx9dsp8iIhrb7EXZMS6YjeKtXvFwJs 2718
oat/utils/slicer.py sha256=RqY9is8gA54OADDfCQFnNGUDXAM_sTUcIWlYtr4_nkI 3456
oat_llm-0.0.9.dist-info/LICENSE sha256=ITvk9LYfj913BttV6IpAgfbDx-tp10FTgQOtZMXDH5k 11358
oat_llm-0.0.9.dist-info/METADATA sha256=Q-u5Ejjaym_BPveuG1d8prW3lgDY0FeUyqmT4y_4fl8 7818
oat_llm-0.0.9.dist-info/WHEEL sha256=GV9aMThwP_4oNCtvEC2ec3qUYutgWeAzklro_0m4WJQ 91
oat_llm-0.0.9.dist-info/top_level.txt sha256=DDLx4L-7a-XNurRXMHbz5QX0avtmuu3x7jR0E4wTCmk 4
oat_llm-0.0.9.dist-info/RECORD

top_level.txt

oat