rewardbench

View on PyPI | Reverse Dependencies (0)

0.1.3 rewardbench-0.1.3-py3-none-any.whl

Wheel Details

Project: rewardbench
Version: 0.1.3
Filename: rewardbench-0.1.3-py3-none-any.whl
Download: [link]
Size: 139699
MD5: a93845402c9cc3f73dcfd41a48c00842
SHA256: 3f26eb1102cdac329ef98d9a35780517c377790b3e0ab80e59df93286df5d488
Uploaded: 2024-10-04 23:28:33 +0000

dist-info

METADATA

Metadata-Version: 2.1
Name: rewardbench
Version: 0.1.3
Summary: Tools for evaluating reward models
Author: Nathan Lambert
Author-Email: nathanl[at]allenai.org
Home-Page: https://github.com/allenai/rewardbench
Classifier: Programming Language :: Python :: 3
Classifier: License :: OSI Approved :: Apache Software License
Classifier: Operating System :: OS Independent
Requires-Python: >=3.10
Requires-Dist: accelerate
Requires-Dist: bitsandbytes
Requires-Dist: black
Requires-Dist: datasets
Requires-Dist: deepspeed
Requires-Dist: einops
Requires-Dist: flake8 (>=6.0)
Requires-Dist: fschat
Requires-Dist: huggingface-hub
Requires-Dist: hf-transfer
Requires-Dist: isort (>=5.12.0)
Requires-Dist: pandas
Requires-Dist: peft
Requires-Dist: pytest
Requires-Dist: scipy
Requires-Dist: sentencepiece
Requires-Dist: tabulate
Requires-Dist: tokenizers
Requires-Dist: torch
Requires-Dist: tiktoken (==0.6.0)
Requires-Dist: transformers (==4.43.4)
Requires-Dist: trl (>=0.8.2)
Requires-Dist: wandb
Requires-Dist: vllm (==0.5.5); extra == "generative"
Requires-Dist: openai; extra == "generative"
Requires-Dist: anthropic; extra == "generative"
Requires-Dist: together; extra == "generative"
Provides-Extra: generative
Description-Content-Type: text/markdown
License-File: LICENSE
[Description omitted; length: 13329 characters]

WHEEL

Wheel-Version: 1.0
Generator: bdist_wheel (0.41.2)
Root-Is-Purelib: true
Tag: py3-none-any

RECORD

Path Digest Size
analysis/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
analysis/bon_to_alpacaeval.py sha256=Y1wXHkwEQUhOg3fplyXMXUwf6AE0Pe-0tE4wl09ErSo 3818
analysis/draw_model_histogram.py sha256=v8RTKKmuOCQFqLtxa-BjBVyybKkIMVRhK8FP75SPy-A 2421
analysis/draw_mtbench_analysis.py sha256=sXyTnlmrOi5mgvqqapnjLFjmWv0DMAz8hpZiAMoKC3Y 1648
analysis/draw_per_token_reward.py sha256=6IGOzqOlo5snjVLLwuBkVkWH_4msedwi79W6al2U3fU 3987
analysis/draw_subtoken_statistics.py sha256=1bsiz77f9QW-Jp9VmfPRckFSC73-mnGEUoBZ5poHd5Q 2040
analysis/get_benchmark_results.py sha256=gqV2GlWLrg3oAYaO9gW9HcR1pandEnmwwPMkErZQNxY 10122
analysis/get_dpo_ref_free_results.py sha256=DLl6GbQZiON_LhmXwsfAquzBzgmAGqTsGry3vQU6u7E 9058
analysis/get_per_token_reward.py sha256=QhlgHN-0iH0eWgMJdLwogI_tAK_zuGCOS3Xzo1w-2Ks 15447
analysis/get_subtoken_statistics.py sha256=IgX2zlNGO65v7BKHefoFdpg1X4Fs74pWER8adDMLZh0 6176
analysis/plot_per_model_dist.py sha256=c3oI35UIFIkUMoueuiLgFx4eJ-O7JMBTna3bvHjObLU 6527
analysis/plot_per_subset_dist.py sha256=YuTMXVa_YtdJG-_sih6hEakv70cTEqN0P1wYMR2GWk4 6542
analysis/run_ensemble_offline.py sha256=MDxYjjF4HuUcpiRjJK22dZB_xQtqhfmrDHHbrc6Bxbw 7085
analysis/utils.py sha256=7ElHjzHOGU7Wgc0DEM6OvBTHF9IutUl0-AMW_qdU0rg 5824
analysis/visualization.py sha256=_Q0ZqEDfcFCFtV-R3epfmBMbHQg50Z_hQhofePa7Ses 17157
rewardbench/__init__.py sha256=wlp5n_-zNzK4bEy3qHT3GyoHScedes5mDwE9HGkaa3s 1266
rewardbench/__main__.py sha256=6Z-9d13BK60d8OzGRTcX7svk98A1RIxKSf5DRAR5LdE 12284
rewardbench/chattemplates.py sha256=gIiML-QNBIhDSC7329IxZ4LFo2Npi6mYhk-QMycmpEg 2175
rewardbench/constants.py sha256=TDZhtIsYl4O53D7VQk-OLQ4kqe4_0sNTFxPiEt2dIn0 4067
rewardbench/dpo.py sha256=l4XgbXo8skZi3HD-wAGbWXlm18fs3icjVxB2Xg9AOVY 19382
rewardbench/generative.py sha256=dUrjUImU8-9_2_7mOF8f8oFzrP5qMvxTyasHm-j48zw 26623
rewardbench/rewardbench.py sha256=mwXAHIW3FOED7_L1zvAD-U6BRz6MZ2hRpG0c5K0nnc0 26597
rewardbench/utils.py sha256=V6QoqNiGWKb3AfZsFmq5E7ECstOsD5chv1YkLVU9rUs 27790
rewardbench/models/__init__.py sha256=DPOLULscHS-g6fNmIdKO34XpIJt7Pe7BPxD3cUhqnLY 7338
rewardbench/models/armorm.py sha256=n7BRePA3YH9CvqWYXONnHe2itK_Pnb4S7sefoGkUj2M 2072
rewardbench/models/beaver.py sha256=H5TxtRlGL8WDE6Jk2Y3VSHvpzQwZQcCexo-lnQtYlxo 18441
rewardbench/models/betterpairrm.py sha256=XKxlDGcCH7RhT2rOhIjhSbxUU2c1YqQkXESIq7pqCOs 5399
rewardbench/models/grm.py sha256=b8yA3v99v_skIJgbba3MTCwmcZGrp6J_hEj-QmpDgFs 4862
rewardbench/models/internlm.py sha256=zC4VmAl0LWUT8vnRrbnT8rGmbrCceY2Yq7pY6EKuhhk 2555
rewardbench/models/openassistant.py sha256=LTsf5cfSsX6nGv4vWXotho9JT3Ovv5QYza-GgFNpLe8 3411
rewardbench/models/openbmb.py sha256=ALbv0F0Vb6ZqrCRqpY0oD0hCSJiMmVsX0QerkyafLi4 2791
rewardbench/models/pairrm.py sha256=KcRPczdAqoOFQPjmu7vctyWNfdqyUmtemDETo1jz-io 10357
rewardbench/models/pipeline.py sha256=qAnYrq0ARXmewvsMq0pnnzZLZJdSLrWurrTvG13U-uo 3360
rewardbench/models/shp.py sha256=DMSZouHh6K9RP2REW_MLRmi4oC8bknJLv8rsR_Rcflc 5374
rewardbench/models/slicpairpm.py sha256=LM0q1zahbvnyXS8ZgsBT_C7JKEl-i6_nK7XQ5Lmr1S0 3594
rewardbench/models/starling.py sha256=nveBi61T15GS5H3aLjim_hc_2kZAd0V-j2mEMFEjm2U 6232
rewardbench/models/ziya.py sha256=vin63B0AiREh1VLT4tBcQtdGzU4E9Man7NzuSXwdrdo 1397
scripts/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
scripts/run_bon.py sha256=Dq2QppLUbfLQbOCegjr3PCLZmS-cdcbYiQptgsRpHhM 12428
scripts/run_dpo.py sha256=XiBoZ81PxhKREBcAEV4qrJ_TPfCEP7HFCYVB8EC-CAI 12347
scripts/run_generative.py sha256=uGNvOusyNi6pvilkBHBuVsR5cmeHS5vFHIl1CCHST1E 15892
scripts/run_rm.py sha256=M1-ff8aRdNr7Mv6_EkaVp71DR_1fuEi3NBGXpiHdTDY 16710
scripts/submit_eval_jobs.py sha256=5LRnAnXgQHzqZ66ZExTvncLMvUzrQhaBo6j9EsJlcDw 7205
scripts/submit_train_jobs.py sha256=7VIHAh3is04LIhPdPMVNfxHYZez8LimHq7qEJJFt5WU 3843
scripts/train_rm.py sha256=9sxHIR5Bs2bjI0NUUP72UsvAYS4kq77OuID8BEMPZzI 16889
tests/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
tests/test_data.py sha256=Z-vi5QRpH52BgVB481_kDHzd4sCwGNe2ka0Yt9QCPgM 12800
tests/test_package.py sha256=nmj_6k0BVPFbatWWroL1gBF0l-cxVHUFkYHg4baXyyE 1979
tests/test_utils.py sha256=UIjOZO8DbjqXIkLPdaBhW0y9uw4nTt1Kh8BgUZB5oV4 1544
rewardbench-0.1.3.dist-info/LICENSE sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ 11357
rewardbench-0.1.3.dist-info/METADATA sha256=4Ap5q9WDcl-jOKPV6Qr2Ch3LndYeStR4ODLytkblVyw 14675
rewardbench-0.1.3.dist-info/WHEEL sha256=yQN5g4mg4AybRjkgi-9yy4iQEFibGQmlz78Pik5Or-A 92
rewardbench-0.1.3.dist-info/entry_points.txt sha256=4yMfP0piyPClWFqJQ6PXcmGUl-IlD-WD6yZcFOE58j0 107
rewardbench-0.1.3.dist-info/top_level.txt sha256=_plLZM-jHyDonj3-MP5LPFMpYF2AR_Q5KbvyfZVb5NU 35
rewardbench-0.1.3.dist-info/RECORD

top_level.txt

analysis
rewardbench
scripts
tests

entry_points.txt

rewardbench = rewardbench.rewardbench:main
rewardbench-gen = scripts.run_generative:main