shtec-rlhf

View on PyPIReverse Dependencies (0)

1.0.5 shtec_rlhf-1.0.5-py3-none-any.whl

Wheel Details

Project: shtec-rlhf
Version: 1.0.5
Filename: shtec_rlhf-1.0.5-py3-none-any.whl
Download: [link]
Size: 301429
MD5: 6f8043a3f8a2fa8eb796e9a4b6dddea4
SHA256: 2c211da6704b7d4f922b943f6ddcc8ae8739e59fecf7d861c3b4c5b825989eaf
Uploaded: 2024-06-24 05:55:05 +0000

dist-info

METADATA

Metadata-Version: 2.1
Name: shtec-rlhf
Version: 1.0.5
Summary: shtec-rlhf: Safe Reinforcement Learning from Human Feedback
Author: PKU-Alignment Team
Project-Url: Homepage, https://github.com/PKU-Alignment/shtec-rlhf
Project-Url: Repository, https://github.com/PKU-Alignment/shtec-rlhf
Project-Url: Documentation, https://shtec-rlhf.readthedocs.io
Project-Url: Bug Report, https://github.com/PKU-Alignment/shtec-rlhf
License: Apache License, Version 2.0
Keywords: Reinforcement Learning,Safe Reinforcement Learning,Reinforcement Learning from Human Feedback,Safe Reinforcement Learning from Human Feedback,Large Language Model,Language Model,RLHF,Safe RLHF,LLM
Classifier: Development Status :: 4 - Beta
Classifier: License :: OSI Approved :: Apache Software License
Classifier: Programming Language :: Python :: 3
Classifier: Programming Language :: Python :: 3.8
Classifier: Programming Language :: Python :: 3.9
Classifier: Programming Language :: Python :: 3.10
Classifier: Programming Language :: Python :: 3.11
Classifier: Intended Audience :: Science/Research
Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
Classifier: Topic :: Software Development :: Libraries :: Python Modules
Requires-Python: >=3.8
Requires-Dist: torch (>=1.13)
Requires-Dist: transformers (>=4.37)
Requires-Dist: datasets
Requires-Dist: tokenizers (>=0.13.3)
Requires-Dist: accelerate
Requires-Dist: deepspeed
Requires-Dist: numpy
Requires-Dist: scipy
Requires-Dist: sentencepiece
Requires-Dist: wandb
Requires-Dist: tensorboard
Requires-Dist: optree
Requires-Dist: matplotlib
Requires-Dist: tqdm
Requires-Dist: rich
Requires-Dist: isort (>=5.11.0); extra == "lint"
Requires-Dist: black (>=23.1.0); extra == "lint"
Requires-Dist: pylint[spelling] (>=2.15.0); extra == "lint"
Requires-Dist: mypy (>=1.0); extra == "lint"
Requires-Dist: flake8; extra == "lint"
Requires-Dist: flake8-bugbear; extra == "lint"
Requires-Dist: flake8-comprehensions; extra == "lint"
Requires-Dist: flake8-docstrings; extra == "lint"
Requires-Dist: flake8-pyi; extra == "lint"
Requires-Dist: flake8-simplify; extra == "lint"
Requires-Dist: ruff; extra == "lint"
Requires-Dist: doc8; extra == "lint"
Requires-Dist: pydocstyle[toml]; extra == "lint"
Requires-Dist: pyenchant; extra == "lint"
Requires-Dist: pre-commit; extra == "lint"
Provides-Extra: lint
Description-Content-Type: text/markdown
License-File: LICENSE
[Description omitted; length: 98 characters]

WHEEL

Wheel-Version: 1.0
Generator: bdist_wheel (0.38.4)
Root-Is-Purelib: true
Tag: py3-none-any

RECORD

Path Digest Size
safe_rlhf/__init__.py sha256=MTigF4tRYjECn1il1j7InHFX1oQAy-WTqUkIZyQWaOo 1388
safe_rlhf/logger.py sha256=ORwAiz2hoWAhgX-m2tcvrVSqQnnw1GE3D9aYcMdfsDU 7955
safe_rlhf/utils.py sha256=KO1mjEIT6YRjrXExkfs8rtlkLpzOMw9COG7rVj1hY58 9576
safe_rlhf/version.py sha256=yoww-bab4S0sGD9iWVzgcBbaYR_RfUzdm1lr8gtxBB4 1821
safe_rlhf/algorithms/__init__.py sha256=ABXxt48HMhg57WS2WMxUDQuKKP7_3xUUM4zYE8mhdO0 974
safe_rlhf/algorithms/dpo/__init__.py sha256=KDkxqfTtok6gBDP1o3dTY6zWz0tc66EYOvvXYTr3QCc 833
safe_rlhf/algorithms/dpo/__main__.py sha256=dhAIrXefIKp5i6zWaGoES4lP38bk4jEozcN_1upmp-E 858
safe_rlhf/algorithms/dpo/main.py sha256=oYMAR3e1yA4qPxRF_hPnm7y9Wy8uEAwySmttUcEE2To 9634
safe_rlhf/algorithms/dpo/trainer.py sha256=f1mtMaQ7n8U3L1FBkw2pzXaonIO8QrqT-930LTjnkNg 10432
safe_rlhf/algorithms/ppo/__init__.py sha256=yISCKfVJKBW62MRtJuo7kcpMnw7sb0dB9k9c74UReZI 806
safe_rlhf/algorithms/ppo/__main__.py sha256=byDaymRuRlZXSi0Vb7v51BgWTvruEj7XKTFaRDTVrXc 867
safe_rlhf/algorithms/ppo/main.py sha256=GlBFVoWBpF0dcUqkjjNRK6OvYJI1XUzLlOQj3WOwVYQ 14063
safe_rlhf/algorithms/ppo/trainer.py sha256=5Czlf_975-S0U498HDCWyEbN1nGzBqPn8G95pojaW5o 9401
safe_rlhf/algorithms/ppo_lag/__init__.py sha256=OfrOywqWmDdMgDTy2KcVK6Ense6bM76uHtRqY8qVo7I 831
safe_rlhf/algorithms/ppo_lag/__main__.py sha256=ge0-TPnqgbqsbnv9B8vWTCu3Bo1hbQHs6cf4_oLAh6E 886
safe_rlhf/algorithms/ppo_lag/main.py sha256=arnsOSYtBPgYbHUh4adG_NqbhG69LsFyDFzinf0kSfs 15752
safe_rlhf/algorithms/ppo_lag/trainer.py sha256=3vtpfbcTN-WzoLma_NriWf60g4P24A-ITl_VQBuKCH8 18909
safe_rlhf/algorithms/ppo_reward_shaping/__init__.py sha256=srYpPK7-zDcQlwm-L-LOHFu6I0Lo9FFWxXcn_txmpDc 872
safe_rlhf/algorithms/ppo_reward_shaping/__main__.py sha256=Vc5Ocmz0sMuJGh_RqRoROFC3AGydtkVvYlrm_yUuYTk 908
safe_rlhf/algorithms/ppo_reward_shaping/main.py sha256=NxJxCapcL4kDQf2P53IA0KqtpinhGIIUF41fskRQPq8 14853
safe_rlhf/algorithms/ppo_reward_shaping/trainer.py sha256=7itZ2MrJYM02wiSP0bzXAQkohQ0hZ2qVwfennDa0aSw 11900
safe_rlhf/configs/__init__.py sha256=lw1JdY-cxOFaUI8nTelz-vToKBoJMpncHVwYRRFHimQ 1085
safe_rlhf/configs/constants.py sha256=ZrHeDlKsJML7aupCmpF6a03_g0yHfZqBZ1ekREwLjTk 1616
safe_rlhf/configs/deepspeed_config.py sha256=91JRIPOPb0PlVryWaZ8DrOvcG9QVd6DEovSfQW_z7vQ 5409
safe_rlhf/configs/ds_eval_config_template.json sha256=ACWig0lsY2L_GFxssLwasV0lv0wtJjvFBk6y10JkICk 443
safe_rlhf/configs/ds_train_config_template.json sha256=OVtNwtzZ666CfNZbIB8WZzSrPCSB23f0uxAT5HSA9XI 872
safe_rlhf/configs/fsdp_config.json sha256=LxAyJZsiCiuDYJh_96KLBDslLs3iUwV-6zhkdfIYCzo 66
safe_rlhf/datasets/__init__.py sha256=eUXvdQ1mAmH_BE4S-UL84HEL4NbF3xCLnaWUgjdxcYA 2468
safe_rlhf/datasets/base.py sha256=nnN_c-6PfZAWWC0jLk9GZE0fePIZRWSxsaS30B3nF9Q 15819
safe_rlhf/datasets/preference.py sha256=v94mp_orFbNNOUv7HsyQdCLKp4CsF3NY2RyB92B-spc 4184
safe_rlhf/datasets/prompt_only.py sha256=9qvUzmeA6HysbsqBi5YJ0saZ7Urhve-UcXH8-RCCxdw 3031
safe_rlhf/datasets/safety_preference.py sha256=ipWlte_G2wZzukS1ulVI-uxYD9BMWw7ifrmN8vbCbeE 5735
safe_rlhf/datasets/supervised.py sha256=pguM2pyf8G_qQGl6Elokj_psKyed9vXRriDHK8jqi5A 4308
safe_rlhf/datasets/utils.py sha256=QkXo9PvWZSVuwVc5t7Ntdp3yxdjx7a3DxBhvGDNCovg 2057
safe_rlhf/datasets/raw/__init__.py sha256=LIJ4KQHsRo5-E2Tax1q-3adHvRK7Y0yyCYj7mfXZCpk 1611
safe_rlhf/datasets/raw/alpaca.py sha256=2rCqDXv0Jn5T0V1hV3kk14vvO1LyeXhHUPdnpRhmmRE 1563
safe_rlhf/datasets/raw/firefly.py sha256=RTSYfOcDqz1XWju0ln35MHEaG6-XW0H2ZWi6X8F18WE 1344
safe_rlhf/datasets/raw/hh_rlhf.py sha256=_XkNkGkTUvZVoJA9Ma-tchaLCabgCf0DosVZav87RyM 4811
safe_rlhf/datasets/raw/moss.py sha256=wakJg51Gsr-2EeSjyVnX42pU461dz-LQGUoandT8HEQ 4588
safe_rlhf/datasets/raw/safe_rlhf.py sha256=gcT3pdBqKngXb228lA60eRq9z0L2cMN2NKevJ3aPoDY 2965
safe_rlhf/evaluate/__init__.py sha256=d4peV74_KVADiKGlS7490jDsPRZ2ip3cN0lUQQnOz7Q 690
safe_rlhf/evaluate/arena.py sha256=xtjwohxwBPS0SEhoJDfQEpO5_sjEyneDh0WiyeGPgj8 19900
safe_rlhf/evaluate/cost.py sha256=CaOqLyS38E3oXvLOJLKyIunrliBNZokxAVHEoDqy9rs 13767
safe_rlhf/evaluate/reward.py sha256=H1_FlONUy06f5Bp9fiWv2Sq819hgen7EUH5dRcv9LZw 10038
safe_rlhf/evaluate/bigbench/__init__.py sha256=d4peV74_KVADiKGlS7490jDsPRZ2ip3cN0lUQQnOz7Q 690
safe_rlhf/evaluate/bigbench/__main__.py sha256=MqsbUS5Ndq8Ntq-Hv2c-mXrs1AtPWhGX35W3S4TE7-U 804
safe_rlhf/evaluate/bigbench/eval.py sha256=LsnbDk8TNmZlu2kIf4jEndEfeVP8JYNJgfnFxXY51oc 6846
safe_rlhf/evaluate/bigbench/model.py sha256=Uv5z0yFTk_FVRk0DKNadw8NZnq9mXgbRowrFhMu_f5Q 7018
safe_rlhf/evaluate/gpt4/__init__.py sha256=d4peV74_KVADiKGlS7490jDsPRZ2ip3cN0lUQQnOz7Q 690
safe_rlhf/evaluate/gpt4/__main__.py sha256=kN2NiNNtpsMmmjV6aKyNNrM_rP1PUsM_eT0N18HzqCQ 800
safe_rlhf/evaluate/gpt4/eval.py sha256=Z9bUZ_HdCI_OkjFjDJezpxSF-7hix0HQIyq-IjpLZmo 6184
safe_rlhf/evaluate/gpt4/problem.json sha256=EbcJd9s49jhQDH3Yb3hqzspKHOl2iOzBvElHssbOcTI 13213
safe_rlhf/finetune/__init__.py sha256=QuvRQwdeOtfQWQMG4wCcEXioT8HDs9uzVfgpqUNc01g 835
safe_rlhf/finetune/__main__.py sha256=PvPRfoHEw6deIDJ14-nCxl1n8aaRQKMlZKGoox6Aw40 858
safe_rlhf/finetune/deepspeed.py sha256=MbvldFExVTtmlLrMN--D_b05Q5KGn6w2h9D9wt2m6TU 9232
safe_rlhf/finetune/huggingface.py sha256=YFnD8KpEOvtFI6Bx-1aFlbvX0t8BHrym6FJUeah7hJ0 3205
safe_rlhf/finetune/main.py sha256=XSXkiCzenf0I9vhHrkSXY4kZO41iGa75O5DgnMJguG4 841
safe_rlhf/finetune/trainer.py sha256=jR3qAWEMp4G0yLlrlb3Gr6essjfyGPvy5Nf9jpvcKNI 2778
safe_rlhf/models/__init__.py sha256=fdWLaxdIOLW52_9QRid6ol2Izb4dAPtDG7SIhcyecQ8 967
safe_rlhf/models/normalizer.py sha256=dCTVXun0K5zTe6FlVJlqNTbZ3dO00GVJVhOnzVVFLF0 6948
safe_rlhf/models/pretrained.py sha256=KRGoY6IGhgH7__FO7DkEcXQJYIVU8ZKOu7dj2bVYd14 7822
safe_rlhf/models/score_model/__init__.py sha256=nOereYT307lCpTNdsAuY4ZyDpS1NTvnfFt2NGYA_Rvs 9709
safe_rlhf/models/score_model/bloom/__init__.py sha256=wk_CAgMS9B5TtyCkf33ka_j94j-z_U-9_XvGHV3sOkI 768
safe_rlhf/models/score_model/bloom/modeling_bloom.py sha256=RwoxCHhv7bJz1h5GD1vB7JmjT1ArvuxwF6iFInVRw0I 4526
safe_rlhf/models/score_model/gemma/__init__.py sha256=zjoP0s9i7Ak6Yfg8b8p9KARneP_IU_WoyAZE-NNAyfs 768
safe_rlhf/models/score_model/gemma/modeling_gemma.py sha256=m_QdzKOBorur4dSOxQufEei2EE1Z2Yfesv8QSRrUzIk 4034
safe_rlhf/models/score_model/gpt2/__init__.py sha256=HoQbNr0t9iCgnpgXvtcDlF5DTiSKLFxTRc6wSmfAu_w 765
safe_rlhf/models/score_model/gpt2/modeling_gpt2.py sha256=jTgmaQYqtvI_Yu6C9t6elJIVhwzn1jl5-6YiZIQ0Ty8 6520
safe_rlhf/models/score_model/gpt_neo/__init__.py sha256=qwYBDatLN1Va7iUW0dXxv_EvfjRZJeEh-jLNA964aGY 773
safe_rlhf/models/score_model/gpt_neo/modeling_gpt_neo.py sha256=Dj5KxF97RWqAjpr9fmVrEa_ceDIIJz0GTbRspXfLUaY 4302
safe_rlhf/models/score_model/gpt_neox/__init__.py sha256=IodGU0Sp19BV8bu5HuYmk0gJshvzohtL5ns5fWxzOkE 776
safe_rlhf/models/score_model/gpt_neox/modeling_gpt_neox.py sha256=1UmZsPR6JU5qHzpCBnXGyJLsoXRQQ81ZZwEnQ8t1cys 4012
safe_rlhf/models/score_model/gptj/__init__.py sha256=I4fi4xOqJjLH32DgVGbhIaj2Xh3DFTWVPEf1AYLriHc 765
safe_rlhf/models/score_model/gptj/modeling_gptj.py sha256=HnZkLlFXSWn3dJ_k-0UjEiqJQHo7d4It1LhpVu5-kIM 6250
safe_rlhf/models/score_model/llama/__init__.py sha256=osPYp4TzZneVPMvRrpWKodhjZBHpLLWe9i0VqeCoMTU 768
safe_rlhf/models/score_model/llama/modeling_llama.py sha256=-3R0wpBVoWK3irngoSNLhIswSxN0HA7njcUrvwz2HDQ 4034
safe_rlhf/models/score_model/mistral/__init__.py sha256=uh41PCpTSzGM4Pb6W6qcNoEwcrwdG6zencE54ww0ouc 774
safe_rlhf/models/score_model/mistral/modeling_mistral.py sha256=HMIgyCQf_I8_md96vYjWgybaeED91g6f8GLM6_D6cqs 4052
safe_rlhf/models/score_model/opt/__init__.py sha256=41x9QUS84yvyZJEol9NS5yJNwFFqiaTY6S7KoyjxHy8 762
safe_rlhf/models/score_model/opt/modeling_opt.py sha256=r6ZYwXvECW_khuDCJsiNB6qDOHJPNvE75UUdkP8wTwQ 4035
safe_rlhf/models/score_model/phi/__init__.py sha256=KsexlzbKKAGF_bpEOjgR3dN1orMn_q7gIAtQoqh0sKY 762
safe_rlhf/models/score_model/phi/modeling_phi.py sha256=AE1Iqk_X9t41_rNNVlhdxoT5_j3dteoUHkAxhvP0APU 4016
safe_rlhf/models/score_model/qwen2/__init__.py sha256=VFEbKgdMuEldRjA2YBnh8l6TWHTYYYxxE-VcAoFinnI 768
safe_rlhf/models/score_model/qwen2/modeling_qwen2.py sha256=LRlK5Th7kRq3TRA2xTXiX_NLRPh6ttn7i9xpDNwsq2I 4228
safe_rlhf/serve/__init__.py sha256=d4peV74_KVADiKGlS7490jDsPRZ2ip3cN0lUQQnOz7Q 690
safe_rlhf/serve/arena.py sha256=gIEZeK1auz6_9FgN63SoLSHLpfwtjIz_9GmMFHqo7CI 3494
safe_rlhf/serve/chatbot.py sha256=2pO6ATtEuS5o-c2QUMJin4ZHdVCfByJupKwAfX7BrBo 12499
safe_rlhf/serve/cli.py sha256=rg-vvvk3D-O9ZQcgkg3XiE20GA5QtRBxG-WOckeA0lc 9349
safe_rlhf/trainers/__init__.py sha256=C-52MkZ3C9XFbKBEFc7cfZlKeKqShfz4RfBK5XtsEAo 952
safe_rlhf/trainers/base.py sha256=7nppBM2Anwx-j4xjcfbkwVPLtyxJqyM2NEI62cp3uDc 5039
safe_rlhf/trainers/rl_trainer.py sha256=E5tf3xcaMzd7bq5fxVyPUL50mL83uVQbIvlPWn5yiPc 26388
safe_rlhf/trainers/supervised_trainer.py sha256=K4GxwHDQL9ha0G-tnjQaDhGYh_kxT5UMOlshLXRnh5U 9225
safe_rlhf/values/__init__.py sha256=5Tzvf_PHWAx8Rhq0Prj1Vd6xJ_cwYAeTI3QqOl7izbM 869
safe_rlhf/values/cost/__init__.py sha256=rrfiIKRsscwq3fddZPGjyPjhUBticz-u_NaKQMeLlWg 774
safe_rlhf/values/cost/__main__.py sha256=odqMBMkpmMCKtfx-SrFbzh7Iqrdasy1DXwXO42e851w 866
safe_rlhf/values/cost/main.py sha256=Le81EiJrPWsfOGN-xufONN30nn1g5IGEHDnabvcj4-U 10422
safe_rlhf/values/cost/trainer.py sha256=RSn9K_C0cwdLCOK1dsqPBJAEoGTi34J-ttfSi11LtUA 14402
safe_rlhf/values/reward/__init__.py sha256=KBOuaK6LTCJx8VWNPZZTf9_sKYxAjND1DDs6VvBmj_w 780
safe_rlhf/values/reward/__main__.py sha256=EmaGmlNO_y5VKeEmmXETZrISTpdK1mE-ls_OAhNdi8k 870
safe_rlhf/values/reward/main.py sha256=7oV8aci9e6gSMSaYNhbzdbqdkd3ZvNZlrMi9U-ZqccQ 10442
safe_rlhf/values/reward/trainer.py sha256=RVLRx7O0U3bY6MKF86k7tAKDin1vqpEdYBa2Xbos0KM 11127
shtec_rlhf/__init__.py sha256=Hx3fU_J_IdXdaFQ-E22R1S7mOjaOYiYZtnKwj_niDzo 1226
shtec_rlhf/logger.py sha256=ORwAiz2hoWAhgX-m2tcvrVSqQnnw1GE3D9aYcMdfsDU 7955
shtec_rlhf/utils.py sha256=KO1mjEIT6YRjrXExkfs8rtlkLpzOMw9COG7rVj1hY58 9576
shtec_rlhf/version.py sha256=2Hk1fL8Gk3cVrUxJbJ01oKjZnfqZQQ6K3nKfhB7ukfY 1818
shtec_rlhf/algorithms/__init__.py sha256=ABXxt48HMhg57WS2WMxUDQuKKP7_3xUUM4zYE8mhdO0 974
shtec_rlhf/algorithms/dpo/__init__.py sha256=KDkxqfTtok6gBDP1o3dTY6zWz0tc66EYOvvXYTr3QCc 833
shtec_rlhf/algorithms/dpo/__main__.py sha256=dhAIrXefIKp5i6zWaGoES4lP38bk4jEozcN_1upmp-E 858
shtec_rlhf/algorithms/dpo/main.py sha256=Lj025fhVZ4bwtuY6g4idqGotrFDr-XivO2CwJ6u3SCw 9588
shtec_rlhf/algorithms/dpo/trainer.py sha256=8ZzBam-Sq6nZppejEcxIHiDjJF4zx__kKKpir5XtVsw 10300
shtec_rlhf/algorithms/ppo/__init__.py sha256=yISCKfVJKBW62MRtJuo7kcpMnw7sb0dB9k9c74UReZI 806
shtec_rlhf/algorithms/ppo/__main__.py sha256=byDaymRuRlZXSi0Vb7v51BgWTvruEj7XKTFaRDTVrXc 867
shtec_rlhf/algorithms/ppo/main.py sha256=NQmDJp4qukR6ZBwgVnPNu-M-g1mLtHyfIsJGiGLMDpY 14017
shtec_rlhf/algorithms/ppo/trainer.py sha256=HDcU0Soa3eU5vzLVc1VzILNuAPxfOcM9vV6z6rlmdY4 9350
shtec_rlhf/algorithms/ppo_lag/__init__.py sha256=OfrOywqWmDdMgDTy2KcVK6Ense6bM76uHtRqY8qVo7I 831
shtec_rlhf/algorithms/ppo_lag/__main__.py sha256=ge0-TPnqgbqsbnv9B8vWTCu3Bo1hbQHs6cf4_oLAh6E 886
shtec_rlhf/algorithms/ppo_lag/main.py sha256=HUd8piPP_sUJuNWdS-0T6rGOvDbuVbV6PBmygkFp9hs 15708
shtec_rlhf/algorithms/ppo_lag/trainer.py sha256=ynxO4F4wBsszzXM72TYgobdXhYl8WAt8s5c51ANFnFk 18858
shtec_rlhf/algorithms/ppo_reward_shaping/__init__.py sha256=srYpPK7-zDcQlwm-L-LOHFu6I0Lo9FFWxXcn_txmpDc 872
shtec_rlhf/algorithms/ppo_reward_shaping/__main__.py sha256=Vc5Ocmz0sMuJGh_RqRoROFC3AGydtkVvYlrm_yUuYTk 908
shtec_rlhf/algorithms/ppo_reward_shaping/main.py sha256=-2TEzGVVUCWyn3mRz4fIlzflz5zus2kRKEze6q9r1iM 14809
shtec_rlhf/algorithms/ppo_reward_shaping/trainer.py sha256=7itZ2MrJYM02wiSP0bzXAQkohQ0hZ2qVwfennDa0aSw 11900
shtec_rlhf/configs/__init__.py sha256=lw1JdY-cxOFaUI8nTelz-vToKBoJMpncHVwYRRFHimQ 1085
shtec_rlhf/configs/constants.py sha256=ZrHeDlKsJML7aupCmpF6a03_g0yHfZqBZ1ekREwLjTk 1616
shtec_rlhf/configs/deepspeed_config.py sha256=91JRIPOPb0PlVryWaZ8DrOvcG9QVd6DEovSfQW_z7vQ 5409
shtec_rlhf/configs/ds_eval_config_template.json sha256=ACWig0lsY2L_GFxssLwasV0lv0wtJjvFBk6y10JkICk 443
shtec_rlhf/configs/ds_train_config_template.json sha256=OVtNwtzZ666CfNZbIB8WZzSrPCSB23f0uxAT5HSA9XI 872
shtec_rlhf/configs/fsdp_config.json sha256=LxAyJZsiCiuDYJh_96KLBDslLs3iUwV-6zhkdfIYCzo 66
shtec_rlhf/evaluate/__init__.py sha256=d4peV74_KVADiKGlS7490jDsPRZ2ip3cN0lUQQnOz7Q 690
shtec_rlhf/evaluate/arena.py sha256=weDXgqlCZYi-QQz7Q0XbcL-Dhi0zFXIS3V3pSqOeEQM 19835
shtec_rlhf/evaluate/cost.py sha256=RggEIwT8ljscMexKHHXFkw89RAXnIDdKPRN1rMrEO_g 13640
shtec_rlhf/evaluate/reward.py sha256=I5cHtZ7FydnvHp-CWK82DLKBTRrVNl-y-t4J_LC-xoQ 9923
shtec_rlhf/evaluate/bigbench/__init__.py sha256=d4peV74_KVADiKGlS7490jDsPRZ2ip3cN0lUQQnOz7Q 690
shtec_rlhf/evaluate/bigbench/__main__.py sha256=MqsbUS5Ndq8Ntq-Hv2c-mXrs1AtPWhGX35W3S4TE7-U 804
shtec_rlhf/evaluate/bigbench/eval.py sha256=LsnbDk8TNmZlu2kIf4jEndEfeVP8JYNJgfnFxXY51oc 6846
shtec_rlhf/evaluate/bigbench/model.py sha256=Uv5z0yFTk_FVRk0DKNadw8NZnq9mXgbRowrFhMu_f5Q 7018
shtec_rlhf/evaluate/gpt4/__init__.py sha256=d4peV74_KVADiKGlS7490jDsPRZ2ip3cN0lUQQnOz7Q 690
shtec_rlhf/evaluate/gpt4/__main__.py sha256=kN2NiNNtpsMmmjV6aKyNNrM_rP1PUsM_eT0N18HzqCQ 800
shtec_rlhf/evaluate/gpt4/eval.py sha256=Z9bUZ_HdCI_OkjFjDJezpxSF-7hix0HQIyq-IjpLZmo 6184
shtec_rlhf/evaluate/gpt4/problem.json sha256=EbcJd9s49jhQDH3Yb3hqzspKHOl2iOzBvElHssbOcTI 13213
shtec_rlhf/models/__init__.py sha256=fdWLaxdIOLW52_9QRid6ol2Izb4dAPtDG7SIhcyecQ8 967
shtec_rlhf/models/normalizer.py sha256=dCTVXun0K5zTe6FlVJlqNTbZ3dO00GVJVhOnzVVFLF0 6948
shtec_rlhf/models/pretrained.py sha256=KRGoY6IGhgH7__FO7DkEcXQJYIVU8ZKOu7dj2bVYd14 7822
shtec_rlhf/models/score_model/__init__.py sha256=nOereYT307lCpTNdsAuY4ZyDpS1NTvnfFt2NGYA_Rvs 9709
shtec_rlhf/models/score_model/bloom/__init__.py sha256=wk_CAgMS9B5TtyCkf33ka_j94j-z_U-9_XvGHV3sOkI 768
shtec_rlhf/models/score_model/bloom/modeling_bloom.py sha256=RwoxCHhv7bJz1h5GD1vB7JmjT1ArvuxwF6iFInVRw0I 4526
shtec_rlhf/models/score_model/gemma/__init__.py sha256=zjoP0s9i7Ak6Yfg8b8p9KARneP_IU_WoyAZE-NNAyfs 768
shtec_rlhf/models/score_model/gemma/modeling_gemma.py sha256=m_QdzKOBorur4dSOxQufEei2EE1Z2Yfesv8QSRrUzIk 4034
shtec_rlhf/models/score_model/gpt2/__init__.py sha256=HoQbNr0t9iCgnpgXvtcDlF5DTiSKLFxTRc6wSmfAu_w 765
shtec_rlhf/models/score_model/gpt2/modeling_gpt2.py sha256=jTgmaQYqtvI_Yu6C9t6elJIVhwzn1jl5-6YiZIQ0Ty8 6520
shtec_rlhf/models/score_model/gpt_neo/__init__.py sha256=qwYBDatLN1Va7iUW0dXxv_EvfjRZJeEh-jLNA964aGY 773
shtec_rlhf/models/score_model/gpt_neo/modeling_gpt_neo.py sha256=Dj5KxF97RWqAjpr9fmVrEa_ceDIIJz0GTbRspXfLUaY 4302
shtec_rlhf/models/score_model/gpt_neox/__init__.py sha256=IodGU0Sp19BV8bu5HuYmk0gJshvzohtL5ns5fWxzOkE 776
shtec_rlhf/models/score_model/gpt_neox/modeling_gpt_neox.py sha256=1UmZsPR6JU5qHzpCBnXGyJLsoXRQQ81ZZwEnQ8t1cys 4012
shtec_rlhf/models/score_model/gptj/__init__.py sha256=I4fi4xOqJjLH32DgVGbhIaj2Xh3DFTWVPEf1AYLriHc 765
shtec_rlhf/models/score_model/gptj/modeling_gptj.py sha256=HnZkLlFXSWn3dJ_k-0UjEiqJQHo7d4It1LhpVu5-kIM 6250
shtec_rlhf/models/score_model/llama/__init__.py sha256=osPYp4TzZneVPMvRrpWKodhjZBHpLLWe9i0VqeCoMTU 768
shtec_rlhf/models/score_model/llama/modeling_llama.py sha256=-3R0wpBVoWK3irngoSNLhIswSxN0HA7njcUrvwz2HDQ 4034
shtec_rlhf/models/score_model/mistral/__init__.py sha256=uh41PCpTSzGM4Pb6W6qcNoEwcrwdG6zencE54ww0ouc 774
shtec_rlhf/models/score_model/mistral/modeling_mistral.py sha256=HMIgyCQf_I8_md96vYjWgybaeED91g6f8GLM6_D6cqs 4052
shtec_rlhf/models/score_model/opt/__init__.py sha256=41x9QUS84yvyZJEol9NS5yJNwFFqiaTY6S7KoyjxHy8 762
shtec_rlhf/models/score_model/opt/modeling_opt.py sha256=r6ZYwXvECW_khuDCJsiNB6qDOHJPNvE75UUdkP8wTwQ 4035
shtec_rlhf/models/score_model/phi/__init__.py sha256=KsexlzbKKAGF_bpEOjgR3dN1orMn_q7gIAtQoqh0sKY 762
shtec_rlhf/models/score_model/phi/modeling_phi.py sha256=AE1Iqk_X9t41_rNNVlhdxoT5_j3dteoUHkAxhvP0APU 4016
shtec_rlhf/models/score_model/qwen2/__init__.py sha256=VFEbKgdMuEldRjA2YBnh8l6TWHTYYYxxE-VcAoFinnI 768
shtec_rlhf/models/score_model/qwen2/modeling_qwen2.py sha256=LRlK5Th7kRq3TRA2xTXiX_NLRPh6ttn7i9xpDNwsq2I 4228
shtec_rlhf/serve/__init__.py sha256=d4peV74_KVADiKGlS7490jDsPRZ2ip3cN0lUQQnOz7Q 690
shtec_rlhf/serve/arena.py sha256=gIEZeK1auz6_9FgN63SoLSHLpfwtjIz_9GmMFHqo7CI 3494
shtec_rlhf/serve/chatbot.py sha256=2pO6ATtEuS5o-c2QUMJin4ZHdVCfByJupKwAfX7BrBo 12499
shtec_rlhf/serve/cli.py sha256=rg-vvvk3D-O9ZQcgkg3XiE20GA5QtRBxG-WOckeA0lc 9349
shtec_rlhf/values/__init__.py sha256=5Tzvf_PHWAx8Rhq0Prj1Vd6xJ_cwYAeTI3QqOl7izbM 869
shtec_rlhf/values/cost/__init__.py sha256=rrfiIKRsscwq3fddZPGjyPjhUBticz-u_NaKQMeLlWg 774
shtec_rlhf/values/cost/__main__.py sha256=odqMBMkpmMCKtfx-SrFbzh7Iqrdasy1DXwXO42e851w 866
shtec_rlhf/values/cost/main.py sha256=TCsZQxEUc7w9h0xmjCV1-BXLxiXZLJUhEu6Y8xxpalw 10377
shtec_rlhf/values/cost/trainer.py sha256=iw1XCjrDr_sKaIpjgDTQHT7rtLa3XeWwStpj9qx1Nmw 14258
shtec_rlhf/values/reward/__init__.py sha256=KBOuaK6LTCJx8VWNPZZTf9_sKYxAjND1DDs6VvBmj_w 780
shtec_rlhf/values/reward/__main__.py sha256=EmaGmlNO_y5VKeEmmXETZrISTpdK1mE-ls_OAhNdi8k 870
shtec_rlhf/values/reward/main.py sha256=GFGIntABBQyP3jf3BBnDdXdPy1RgtruRqNkpq5PvhZs 10397
shtec_rlhf/values/reward/trainer.py sha256=1Fee7pNavkHaBNEYMttwHtrA1rLe-Mj6oMj1T8WK4-g 10995
shtec_rlhf-1.0.5.dist-info/LICENSE sha256=1qqHIb4EWxMrQ29OsxB6OBiewW_eb9WsLbGF1oEyN2Y 11380
shtec_rlhf-1.0.5.dist-info/METADATA sha256=rpHQJJtCUNqvk6CGL2iAd3b096Gc75WO_CzlDKuAmzY 2509
shtec_rlhf-1.0.5.dist-info/WHEEL sha256=2wepM1nk4DS4eFpYrW1TTqPcoGNfHhhO_i5m4cOimbo 92
shtec_rlhf-1.0.5.dist-info/top_level.txt sha256=2HJwowMnZse7nGlMq36TDAFJT8pat6ikEOmBDkHgKBI 11
shtec_rlhf-1.0.5.dist-info/RECORD

top_level.txt

shtec_rlhf