Path |
Digest |
Size |
safe_rlhf/__init__.py |
sha256=MTigF4tRYjECn1il1j7InHFX1oQAy-WTqUkIZyQWaOo
|
1388 |
safe_rlhf/logger.py |
sha256=ORwAiz2hoWAhgX-m2tcvrVSqQnnw1GE3D9aYcMdfsDU
|
7955 |
safe_rlhf/utils.py |
sha256=KO1mjEIT6YRjrXExkfs8rtlkLpzOMw9COG7rVj1hY58
|
9576 |
safe_rlhf/version.py |
sha256=yoww-bab4S0sGD9iWVzgcBbaYR_RfUzdm1lr8gtxBB4
|
1821 |
safe_rlhf/algorithms/__init__.py |
sha256=ABXxt48HMhg57WS2WMxUDQuKKP7_3xUUM4zYE8mhdO0
|
974 |
safe_rlhf/algorithms/dpo/__init__.py |
sha256=KDkxqfTtok6gBDP1o3dTY6zWz0tc66EYOvvXYTr3QCc
|
833 |
safe_rlhf/algorithms/dpo/__main__.py |
sha256=dhAIrXefIKp5i6zWaGoES4lP38bk4jEozcN_1upmp-E
|
858 |
safe_rlhf/algorithms/dpo/main.py |
sha256=oYMAR3e1yA4qPxRF_hPnm7y9Wy8uEAwySmttUcEE2To
|
9634 |
safe_rlhf/algorithms/dpo/trainer.py |
sha256=f1mtMaQ7n8U3L1FBkw2pzXaonIO8QrqT-930LTjnkNg
|
10432 |
safe_rlhf/algorithms/ppo/__init__.py |
sha256=yISCKfVJKBW62MRtJuo7kcpMnw7sb0dB9k9c74UReZI
|
806 |
safe_rlhf/algorithms/ppo/__main__.py |
sha256=byDaymRuRlZXSi0Vb7v51BgWTvruEj7XKTFaRDTVrXc
|
867 |
safe_rlhf/algorithms/ppo/main.py |
sha256=GlBFVoWBpF0dcUqkjjNRK6OvYJI1XUzLlOQj3WOwVYQ
|
14063 |
safe_rlhf/algorithms/ppo/trainer.py |
sha256=5Czlf_975-S0U498HDCWyEbN1nGzBqPn8G95pojaW5o
|
9401 |
safe_rlhf/algorithms/ppo_lag/__init__.py |
sha256=OfrOywqWmDdMgDTy2KcVK6Ense6bM76uHtRqY8qVo7I
|
831 |
safe_rlhf/algorithms/ppo_lag/__main__.py |
sha256=ge0-TPnqgbqsbnv9B8vWTCu3Bo1hbQHs6cf4_oLAh6E
|
886 |
safe_rlhf/algorithms/ppo_lag/main.py |
sha256=arnsOSYtBPgYbHUh4adG_NqbhG69LsFyDFzinf0kSfs
|
15752 |
safe_rlhf/algorithms/ppo_lag/trainer.py |
sha256=3vtpfbcTN-WzoLma_NriWf60g4P24A-ITl_VQBuKCH8
|
18909 |
safe_rlhf/algorithms/ppo_reward_shaping/__init__.py |
sha256=srYpPK7-zDcQlwm-L-LOHFu6I0Lo9FFWxXcn_txmpDc
|
872 |
safe_rlhf/algorithms/ppo_reward_shaping/__main__.py |
sha256=Vc5Ocmz0sMuJGh_RqRoROFC3AGydtkVvYlrm_yUuYTk
|
908 |
safe_rlhf/algorithms/ppo_reward_shaping/main.py |
sha256=NxJxCapcL4kDQf2P53IA0KqtpinhGIIUF41fskRQPq8
|
14853 |
safe_rlhf/algorithms/ppo_reward_shaping/trainer.py |
sha256=7itZ2MrJYM02wiSP0bzXAQkohQ0hZ2qVwfennDa0aSw
|
11900 |
safe_rlhf/configs/__init__.py |
sha256=lw1JdY-cxOFaUI8nTelz-vToKBoJMpncHVwYRRFHimQ
|
1085 |
safe_rlhf/configs/constants.py |
sha256=ZrHeDlKsJML7aupCmpF6a03_g0yHfZqBZ1ekREwLjTk
|
1616 |
safe_rlhf/configs/deepspeed_config.py |
sha256=91JRIPOPb0PlVryWaZ8DrOvcG9QVd6DEovSfQW_z7vQ
|
5409 |
safe_rlhf/configs/ds_eval_config_template.json |
sha256=ACWig0lsY2L_GFxssLwasV0lv0wtJjvFBk6y10JkICk
|
443 |
safe_rlhf/configs/ds_train_config_template.json |
sha256=OVtNwtzZ666CfNZbIB8WZzSrPCSB23f0uxAT5HSA9XI
|
872 |
safe_rlhf/configs/fsdp_config.json |
sha256=LxAyJZsiCiuDYJh_96KLBDslLs3iUwV-6zhkdfIYCzo
|
66 |
safe_rlhf/datasets/__init__.py |
sha256=eUXvdQ1mAmH_BE4S-UL84HEL4NbF3xCLnaWUgjdxcYA
|
2468 |
safe_rlhf/datasets/base.py |
sha256=nnN_c-6PfZAWWC0jLk9GZE0fePIZRWSxsaS30B3nF9Q
|
15819 |
safe_rlhf/datasets/preference.py |
sha256=v94mp_orFbNNOUv7HsyQdCLKp4CsF3NY2RyB92B-spc
|
4184 |
safe_rlhf/datasets/prompt_only.py |
sha256=9qvUzmeA6HysbsqBi5YJ0saZ7Urhve-UcXH8-RCCxdw
|
3031 |
safe_rlhf/datasets/safety_preference.py |
sha256=ipWlte_G2wZzukS1ulVI-uxYD9BMWw7ifrmN8vbCbeE
|
5735 |
safe_rlhf/datasets/supervised.py |
sha256=pguM2pyf8G_qQGl6Elokj_psKyed9vXRriDHK8jqi5A
|
4308 |
safe_rlhf/datasets/utils.py |
sha256=QkXo9PvWZSVuwVc5t7Ntdp3yxdjx7a3DxBhvGDNCovg
|
2057 |
safe_rlhf/datasets/raw/__init__.py |
sha256=LIJ4KQHsRo5-E2Tax1q-3adHvRK7Y0yyCYj7mfXZCpk
|
1611 |
safe_rlhf/datasets/raw/alpaca.py |
sha256=2rCqDXv0Jn5T0V1hV3kk14vvO1LyeXhHUPdnpRhmmRE
|
1563 |
safe_rlhf/datasets/raw/firefly.py |
sha256=RTSYfOcDqz1XWju0ln35MHEaG6-XW0H2ZWi6X8F18WE
|
1344 |
safe_rlhf/datasets/raw/hh_rlhf.py |
sha256=_XkNkGkTUvZVoJA9Ma-tchaLCabgCf0DosVZav87RyM
|
4811 |
safe_rlhf/datasets/raw/moss.py |
sha256=wakJg51Gsr-2EeSjyVnX42pU461dz-LQGUoandT8HEQ
|
4588 |
safe_rlhf/datasets/raw/safe_rlhf.py |
sha256=gcT3pdBqKngXb228lA60eRq9z0L2cMN2NKevJ3aPoDY
|
2965 |
safe_rlhf/evaluate/__init__.py |
sha256=d4peV74_KVADiKGlS7490jDsPRZ2ip3cN0lUQQnOz7Q
|
690 |
safe_rlhf/evaluate/arena.py |
sha256=xtjwohxwBPS0SEhoJDfQEpO5_sjEyneDh0WiyeGPgj8
|
19900 |
safe_rlhf/evaluate/cost.py |
sha256=CaOqLyS38E3oXvLOJLKyIunrliBNZokxAVHEoDqy9rs
|
13767 |
safe_rlhf/evaluate/reward.py |
sha256=H1_FlONUy06f5Bp9fiWv2Sq819hgen7EUH5dRcv9LZw
|
10038 |
safe_rlhf/evaluate/bigbench/__init__.py |
sha256=d4peV74_KVADiKGlS7490jDsPRZ2ip3cN0lUQQnOz7Q
|
690 |
safe_rlhf/evaluate/bigbench/__main__.py |
sha256=MqsbUS5Ndq8Ntq-Hv2c-mXrs1AtPWhGX35W3S4TE7-U
|
804 |
safe_rlhf/evaluate/bigbench/eval.py |
sha256=LsnbDk8TNmZlu2kIf4jEndEfeVP8JYNJgfnFxXY51oc
|
6846 |
safe_rlhf/evaluate/bigbench/model.py |
sha256=Uv5z0yFTk_FVRk0DKNadw8NZnq9mXgbRowrFhMu_f5Q
|
7018 |
safe_rlhf/evaluate/gpt4/__init__.py |
sha256=d4peV74_KVADiKGlS7490jDsPRZ2ip3cN0lUQQnOz7Q
|
690 |
safe_rlhf/evaluate/gpt4/__main__.py |
sha256=kN2NiNNtpsMmmjV6aKyNNrM_rP1PUsM_eT0N18HzqCQ
|
800 |
safe_rlhf/evaluate/gpt4/eval.py |
sha256=Z9bUZ_HdCI_OkjFjDJezpxSF-7hix0HQIyq-IjpLZmo
|
6184 |
safe_rlhf/evaluate/gpt4/problem.json |
sha256=EbcJd9s49jhQDH3Yb3hqzspKHOl2iOzBvElHssbOcTI
|
13213 |
safe_rlhf/finetune/__init__.py |
sha256=QuvRQwdeOtfQWQMG4wCcEXioT8HDs9uzVfgpqUNc01g
|
835 |
safe_rlhf/finetune/__main__.py |
sha256=PvPRfoHEw6deIDJ14-nCxl1n8aaRQKMlZKGoox6Aw40
|
858 |
safe_rlhf/finetune/deepspeed.py |
sha256=MbvldFExVTtmlLrMN--D_b05Q5KGn6w2h9D9wt2m6TU
|
9232 |
safe_rlhf/finetune/huggingface.py |
sha256=YFnD8KpEOvtFI6Bx-1aFlbvX0t8BHrym6FJUeah7hJ0
|
3205 |
safe_rlhf/finetune/main.py |
sha256=XSXkiCzenf0I9vhHrkSXY4kZO41iGa75O5DgnMJguG4
|
841 |
safe_rlhf/finetune/trainer.py |
sha256=jR3qAWEMp4G0yLlrlb3Gr6essjfyGPvy5Nf9jpvcKNI
|
2778 |
safe_rlhf/models/__init__.py |
sha256=fdWLaxdIOLW52_9QRid6ol2Izb4dAPtDG7SIhcyecQ8
|
967 |
safe_rlhf/models/normalizer.py |
sha256=dCTVXun0K5zTe6FlVJlqNTbZ3dO00GVJVhOnzVVFLF0
|
6948 |
safe_rlhf/models/pretrained.py |
sha256=KRGoY6IGhgH7__FO7DkEcXQJYIVU8ZKOu7dj2bVYd14
|
7822 |
safe_rlhf/models/score_model/__init__.py |
sha256=nOereYT307lCpTNdsAuY4ZyDpS1NTvnfFt2NGYA_Rvs
|
9709 |
safe_rlhf/models/score_model/bloom/__init__.py |
sha256=wk_CAgMS9B5TtyCkf33ka_j94j-z_U-9_XvGHV3sOkI
|
768 |
safe_rlhf/models/score_model/bloom/modeling_bloom.py |
sha256=RwoxCHhv7bJz1h5GD1vB7JmjT1ArvuxwF6iFInVRw0I
|
4526 |
safe_rlhf/models/score_model/gemma/__init__.py |
sha256=zjoP0s9i7Ak6Yfg8b8p9KARneP_IU_WoyAZE-NNAyfs
|
768 |
safe_rlhf/models/score_model/gemma/modeling_gemma.py |
sha256=m_QdzKOBorur4dSOxQufEei2EE1Z2Yfesv8QSRrUzIk
|
4034 |
safe_rlhf/models/score_model/gpt2/__init__.py |
sha256=HoQbNr0t9iCgnpgXvtcDlF5DTiSKLFxTRc6wSmfAu_w
|
765 |
safe_rlhf/models/score_model/gpt2/modeling_gpt2.py |
sha256=jTgmaQYqtvI_Yu6C9t6elJIVhwzn1jl5-6YiZIQ0Ty8
|
6520 |
safe_rlhf/models/score_model/gpt_neo/__init__.py |
sha256=qwYBDatLN1Va7iUW0dXxv_EvfjRZJeEh-jLNA964aGY
|
773 |
safe_rlhf/models/score_model/gpt_neo/modeling_gpt_neo.py |
sha256=Dj5KxF97RWqAjpr9fmVrEa_ceDIIJz0GTbRspXfLUaY
|
4302 |
safe_rlhf/models/score_model/gpt_neox/__init__.py |
sha256=IodGU0Sp19BV8bu5HuYmk0gJshvzohtL5ns5fWxzOkE
|
776 |
safe_rlhf/models/score_model/gpt_neox/modeling_gpt_neox.py |
sha256=1UmZsPR6JU5qHzpCBnXGyJLsoXRQQ81ZZwEnQ8t1cys
|
4012 |
safe_rlhf/models/score_model/gptj/__init__.py |
sha256=I4fi4xOqJjLH32DgVGbhIaj2Xh3DFTWVPEf1AYLriHc
|
765 |
safe_rlhf/models/score_model/gptj/modeling_gptj.py |
sha256=HnZkLlFXSWn3dJ_k-0UjEiqJQHo7d4It1LhpVu5-kIM
|
6250 |
safe_rlhf/models/score_model/llama/__init__.py |
sha256=osPYp4TzZneVPMvRrpWKodhjZBHpLLWe9i0VqeCoMTU
|
768 |
safe_rlhf/models/score_model/llama/modeling_llama.py |
sha256=-3R0wpBVoWK3irngoSNLhIswSxN0HA7njcUrvwz2HDQ
|
4034 |
safe_rlhf/models/score_model/mistral/__init__.py |
sha256=uh41PCpTSzGM4Pb6W6qcNoEwcrwdG6zencE54ww0ouc
|
774 |
safe_rlhf/models/score_model/mistral/modeling_mistral.py |
sha256=HMIgyCQf_I8_md96vYjWgybaeED91g6f8GLM6_D6cqs
|
4052 |
safe_rlhf/models/score_model/opt/__init__.py |
sha256=41x9QUS84yvyZJEol9NS5yJNwFFqiaTY6S7KoyjxHy8
|
762 |
safe_rlhf/models/score_model/opt/modeling_opt.py |
sha256=r6ZYwXvECW_khuDCJsiNB6qDOHJPNvE75UUdkP8wTwQ
|
4035 |
safe_rlhf/models/score_model/phi/__init__.py |
sha256=KsexlzbKKAGF_bpEOjgR3dN1orMn_q7gIAtQoqh0sKY
|
762 |
safe_rlhf/models/score_model/phi/modeling_phi.py |
sha256=AE1Iqk_X9t41_rNNVlhdxoT5_j3dteoUHkAxhvP0APU
|
4016 |
safe_rlhf/models/score_model/qwen2/__init__.py |
sha256=VFEbKgdMuEldRjA2YBnh8l6TWHTYYYxxE-VcAoFinnI
|
768 |
safe_rlhf/models/score_model/qwen2/modeling_qwen2.py |
sha256=LRlK5Th7kRq3TRA2xTXiX_NLRPh6ttn7i9xpDNwsq2I
|
4228 |
safe_rlhf/serve/__init__.py |
sha256=d4peV74_KVADiKGlS7490jDsPRZ2ip3cN0lUQQnOz7Q
|
690 |
safe_rlhf/serve/arena.py |
sha256=gIEZeK1auz6_9FgN63SoLSHLpfwtjIz_9GmMFHqo7CI
|
3494 |
safe_rlhf/serve/chatbot.py |
sha256=2pO6ATtEuS5o-c2QUMJin4ZHdVCfByJupKwAfX7BrBo
|
12499 |
safe_rlhf/serve/cli.py |
sha256=rg-vvvk3D-O9ZQcgkg3XiE20GA5QtRBxG-WOckeA0lc
|
9349 |
safe_rlhf/trainers/__init__.py |
sha256=C-52MkZ3C9XFbKBEFc7cfZlKeKqShfz4RfBK5XtsEAo
|
952 |
safe_rlhf/trainers/base.py |
sha256=7nppBM2Anwx-j4xjcfbkwVPLtyxJqyM2NEI62cp3uDc
|
5039 |
safe_rlhf/trainers/rl_trainer.py |
sha256=E5tf3xcaMzd7bq5fxVyPUL50mL83uVQbIvlPWn5yiPc
|
26388 |
safe_rlhf/trainers/supervised_trainer.py |
sha256=K4GxwHDQL9ha0G-tnjQaDhGYh_kxT5UMOlshLXRnh5U
|
9225 |
safe_rlhf/values/__init__.py |
sha256=5Tzvf_PHWAx8Rhq0Prj1Vd6xJ_cwYAeTI3QqOl7izbM
|
869 |
safe_rlhf/values/cost/__init__.py |
sha256=rrfiIKRsscwq3fddZPGjyPjhUBticz-u_NaKQMeLlWg
|
774 |
safe_rlhf/values/cost/__main__.py |
sha256=odqMBMkpmMCKtfx-SrFbzh7Iqrdasy1DXwXO42e851w
|
866 |
safe_rlhf/values/cost/main.py |
sha256=Le81EiJrPWsfOGN-xufONN30nn1g5IGEHDnabvcj4-U
|
10422 |
safe_rlhf/values/cost/trainer.py |
sha256=RSn9K_C0cwdLCOK1dsqPBJAEoGTi34J-ttfSi11LtUA
|
14402 |
safe_rlhf/values/reward/__init__.py |
sha256=KBOuaK6LTCJx8VWNPZZTf9_sKYxAjND1DDs6VvBmj_w
|
780 |
safe_rlhf/values/reward/__main__.py |
sha256=EmaGmlNO_y5VKeEmmXETZrISTpdK1mE-ls_OAhNdi8k
|
870 |
safe_rlhf/values/reward/main.py |
sha256=7oV8aci9e6gSMSaYNhbzdbqdkd3ZvNZlrMi9U-ZqccQ
|
10442 |
safe_rlhf/values/reward/trainer.py |
sha256=RVLRx7O0U3bY6MKF86k7tAKDin1vqpEdYBa2Xbos0KM
|
11127 |
shtec_rlhf/__init__.py |
sha256=Hx3fU_J_IdXdaFQ-E22R1S7mOjaOYiYZtnKwj_niDzo
|
1226 |
shtec_rlhf/logger.py |
sha256=ORwAiz2hoWAhgX-m2tcvrVSqQnnw1GE3D9aYcMdfsDU
|
7955 |
shtec_rlhf/utils.py |
sha256=KO1mjEIT6YRjrXExkfs8rtlkLpzOMw9COG7rVj1hY58
|
9576 |
shtec_rlhf/version.py |
sha256=2Hk1fL8Gk3cVrUxJbJ01oKjZnfqZQQ6K3nKfhB7ukfY
|
1818 |
shtec_rlhf/algorithms/__init__.py |
sha256=ABXxt48HMhg57WS2WMxUDQuKKP7_3xUUM4zYE8mhdO0
|
974 |
shtec_rlhf/algorithms/dpo/__init__.py |
sha256=KDkxqfTtok6gBDP1o3dTY6zWz0tc66EYOvvXYTr3QCc
|
833 |
shtec_rlhf/algorithms/dpo/__main__.py |
sha256=dhAIrXefIKp5i6zWaGoES4lP38bk4jEozcN_1upmp-E
|
858 |
shtec_rlhf/algorithms/dpo/main.py |
sha256=Lj025fhVZ4bwtuY6g4idqGotrFDr-XivO2CwJ6u3SCw
|
9588 |
shtec_rlhf/algorithms/dpo/trainer.py |
sha256=8ZzBam-Sq6nZppejEcxIHiDjJF4zx__kKKpir5XtVsw
|
10300 |
shtec_rlhf/algorithms/ppo/__init__.py |
sha256=yISCKfVJKBW62MRtJuo7kcpMnw7sb0dB9k9c74UReZI
|
806 |
shtec_rlhf/algorithms/ppo/__main__.py |
sha256=byDaymRuRlZXSi0Vb7v51BgWTvruEj7XKTFaRDTVrXc
|
867 |
shtec_rlhf/algorithms/ppo/main.py |
sha256=NQmDJp4qukR6ZBwgVnPNu-M-g1mLtHyfIsJGiGLMDpY
|
14017 |
shtec_rlhf/algorithms/ppo/trainer.py |
sha256=HDcU0Soa3eU5vzLVc1VzILNuAPxfOcM9vV6z6rlmdY4
|
9350 |
shtec_rlhf/algorithms/ppo_lag/__init__.py |
sha256=OfrOywqWmDdMgDTy2KcVK6Ense6bM76uHtRqY8qVo7I
|
831 |
shtec_rlhf/algorithms/ppo_lag/__main__.py |
sha256=ge0-TPnqgbqsbnv9B8vWTCu3Bo1hbQHs6cf4_oLAh6E
|
886 |
shtec_rlhf/algorithms/ppo_lag/main.py |
sha256=HUd8piPP_sUJuNWdS-0T6rGOvDbuVbV6PBmygkFp9hs
|
15708 |
shtec_rlhf/algorithms/ppo_lag/trainer.py |
sha256=ynxO4F4wBsszzXM72TYgobdXhYl8WAt8s5c51ANFnFk
|
18858 |
shtec_rlhf/algorithms/ppo_reward_shaping/__init__.py |
sha256=srYpPK7-zDcQlwm-L-LOHFu6I0Lo9FFWxXcn_txmpDc
|
872 |
shtec_rlhf/algorithms/ppo_reward_shaping/__main__.py |
sha256=Vc5Ocmz0sMuJGh_RqRoROFC3AGydtkVvYlrm_yUuYTk
|
908 |
shtec_rlhf/algorithms/ppo_reward_shaping/main.py |
sha256=-2TEzGVVUCWyn3mRz4fIlzflz5zus2kRKEze6q9r1iM
|
14809 |
shtec_rlhf/algorithms/ppo_reward_shaping/trainer.py |
sha256=7itZ2MrJYM02wiSP0bzXAQkohQ0hZ2qVwfennDa0aSw
|
11900 |
shtec_rlhf/configs/__init__.py |
sha256=lw1JdY-cxOFaUI8nTelz-vToKBoJMpncHVwYRRFHimQ
|
1085 |
shtec_rlhf/configs/constants.py |
sha256=ZrHeDlKsJML7aupCmpF6a03_g0yHfZqBZ1ekREwLjTk
|
1616 |
shtec_rlhf/configs/deepspeed_config.py |
sha256=91JRIPOPb0PlVryWaZ8DrOvcG9QVd6DEovSfQW_z7vQ
|
5409 |
shtec_rlhf/configs/ds_eval_config_template.json |
sha256=ACWig0lsY2L_GFxssLwasV0lv0wtJjvFBk6y10JkICk
|
443 |
shtec_rlhf/configs/ds_train_config_template.json |
sha256=OVtNwtzZ666CfNZbIB8WZzSrPCSB23f0uxAT5HSA9XI
|
872 |
shtec_rlhf/configs/fsdp_config.json |
sha256=LxAyJZsiCiuDYJh_96KLBDslLs3iUwV-6zhkdfIYCzo
|
66 |
shtec_rlhf/evaluate/__init__.py |
sha256=d4peV74_KVADiKGlS7490jDsPRZ2ip3cN0lUQQnOz7Q
|
690 |
shtec_rlhf/evaluate/arena.py |
sha256=weDXgqlCZYi-QQz7Q0XbcL-Dhi0zFXIS3V3pSqOeEQM
|
19835 |
shtec_rlhf/evaluate/cost.py |
sha256=RggEIwT8ljscMexKHHXFkw89RAXnIDdKPRN1rMrEO_g
|
13640 |
shtec_rlhf/evaluate/reward.py |
sha256=I5cHtZ7FydnvHp-CWK82DLKBTRrVNl-y-t4J_LC-xoQ
|
9923 |
shtec_rlhf/evaluate/bigbench/__init__.py |
sha256=d4peV74_KVADiKGlS7490jDsPRZ2ip3cN0lUQQnOz7Q
|
690 |
shtec_rlhf/evaluate/bigbench/__main__.py |
sha256=MqsbUS5Ndq8Ntq-Hv2c-mXrs1AtPWhGX35W3S4TE7-U
|
804 |
shtec_rlhf/evaluate/bigbench/eval.py |
sha256=LsnbDk8TNmZlu2kIf4jEndEfeVP8JYNJgfnFxXY51oc
|
6846 |
shtec_rlhf/evaluate/bigbench/model.py |
sha256=Uv5z0yFTk_FVRk0DKNadw8NZnq9mXgbRowrFhMu_f5Q
|
7018 |
shtec_rlhf/evaluate/gpt4/__init__.py |
sha256=d4peV74_KVADiKGlS7490jDsPRZ2ip3cN0lUQQnOz7Q
|
690 |
shtec_rlhf/evaluate/gpt4/__main__.py |
sha256=kN2NiNNtpsMmmjV6aKyNNrM_rP1PUsM_eT0N18HzqCQ
|
800 |
shtec_rlhf/evaluate/gpt4/eval.py |
sha256=Z9bUZ_HdCI_OkjFjDJezpxSF-7hix0HQIyq-IjpLZmo
|
6184 |
shtec_rlhf/evaluate/gpt4/problem.json |
sha256=EbcJd9s49jhQDH3Yb3hqzspKHOl2iOzBvElHssbOcTI
|
13213 |
shtec_rlhf/models/__init__.py |
sha256=fdWLaxdIOLW52_9QRid6ol2Izb4dAPtDG7SIhcyecQ8
|
967 |
shtec_rlhf/models/normalizer.py |
sha256=dCTVXun0K5zTe6FlVJlqNTbZ3dO00GVJVhOnzVVFLF0
|
6948 |
shtec_rlhf/models/pretrained.py |
sha256=KRGoY6IGhgH7__FO7DkEcXQJYIVU8ZKOu7dj2bVYd14
|
7822 |
shtec_rlhf/models/score_model/__init__.py |
sha256=nOereYT307lCpTNdsAuY4ZyDpS1NTvnfFt2NGYA_Rvs
|
9709 |
shtec_rlhf/models/score_model/bloom/__init__.py |
sha256=wk_CAgMS9B5TtyCkf33ka_j94j-z_U-9_XvGHV3sOkI
|
768 |
shtec_rlhf/models/score_model/bloom/modeling_bloom.py |
sha256=RwoxCHhv7bJz1h5GD1vB7JmjT1ArvuxwF6iFInVRw0I
|
4526 |
shtec_rlhf/models/score_model/gemma/__init__.py |
sha256=zjoP0s9i7Ak6Yfg8b8p9KARneP_IU_WoyAZE-NNAyfs
|
768 |
shtec_rlhf/models/score_model/gemma/modeling_gemma.py |
sha256=m_QdzKOBorur4dSOxQufEei2EE1Z2Yfesv8QSRrUzIk
|
4034 |
shtec_rlhf/models/score_model/gpt2/__init__.py |
sha256=HoQbNr0t9iCgnpgXvtcDlF5DTiSKLFxTRc6wSmfAu_w
|
765 |
shtec_rlhf/models/score_model/gpt2/modeling_gpt2.py |
sha256=jTgmaQYqtvI_Yu6C9t6elJIVhwzn1jl5-6YiZIQ0Ty8
|
6520 |
shtec_rlhf/models/score_model/gpt_neo/__init__.py |
sha256=qwYBDatLN1Va7iUW0dXxv_EvfjRZJeEh-jLNA964aGY
|
773 |
shtec_rlhf/models/score_model/gpt_neo/modeling_gpt_neo.py |
sha256=Dj5KxF97RWqAjpr9fmVrEa_ceDIIJz0GTbRspXfLUaY
|
4302 |
shtec_rlhf/models/score_model/gpt_neox/__init__.py |
sha256=IodGU0Sp19BV8bu5HuYmk0gJshvzohtL5ns5fWxzOkE
|
776 |
shtec_rlhf/models/score_model/gpt_neox/modeling_gpt_neox.py |
sha256=1UmZsPR6JU5qHzpCBnXGyJLsoXRQQ81ZZwEnQ8t1cys
|
4012 |
shtec_rlhf/models/score_model/gptj/__init__.py |
sha256=I4fi4xOqJjLH32DgVGbhIaj2Xh3DFTWVPEf1AYLriHc
|
765 |
shtec_rlhf/models/score_model/gptj/modeling_gptj.py |
sha256=HnZkLlFXSWn3dJ_k-0UjEiqJQHo7d4It1LhpVu5-kIM
|
6250 |
shtec_rlhf/models/score_model/llama/__init__.py |
sha256=osPYp4TzZneVPMvRrpWKodhjZBHpLLWe9i0VqeCoMTU
|
768 |
shtec_rlhf/models/score_model/llama/modeling_llama.py |
sha256=-3R0wpBVoWK3irngoSNLhIswSxN0HA7njcUrvwz2HDQ
|
4034 |
shtec_rlhf/models/score_model/mistral/__init__.py |
sha256=uh41PCpTSzGM4Pb6W6qcNoEwcrwdG6zencE54ww0ouc
|
774 |
shtec_rlhf/models/score_model/mistral/modeling_mistral.py |
sha256=HMIgyCQf_I8_md96vYjWgybaeED91g6f8GLM6_D6cqs
|
4052 |
shtec_rlhf/models/score_model/opt/__init__.py |
sha256=41x9QUS84yvyZJEol9NS5yJNwFFqiaTY6S7KoyjxHy8
|
762 |
shtec_rlhf/models/score_model/opt/modeling_opt.py |
sha256=r6ZYwXvECW_khuDCJsiNB6qDOHJPNvE75UUdkP8wTwQ
|
4035 |
shtec_rlhf/models/score_model/phi/__init__.py |
sha256=KsexlzbKKAGF_bpEOjgR3dN1orMn_q7gIAtQoqh0sKY
|
762 |
shtec_rlhf/models/score_model/phi/modeling_phi.py |
sha256=AE1Iqk_X9t41_rNNVlhdxoT5_j3dteoUHkAxhvP0APU
|
4016 |
shtec_rlhf/models/score_model/qwen2/__init__.py |
sha256=VFEbKgdMuEldRjA2YBnh8l6TWHTYYYxxE-VcAoFinnI
|
768 |
shtec_rlhf/models/score_model/qwen2/modeling_qwen2.py |
sha256=LRlK5Th7kRq3TRA2xTXiX_NLRPh6ttn7i9xpDNwsq2I
|
4228 |
shtec_rlhf/serve/__init__.py |
sha256=d4peV74_KVADiKGlS7490jDsPRZ2ip3cN0lUQQnOz7Q
|
690 |
shtec_rlhf/serve/arena.py |
sha256=gIEZeK1auz6_9FgN63SoLSHLpfwtjIz_9GmMFHqo7CI
|
3494 |
shtec_rlhf/serve/chatbot.py |
sha256=2pO6ATtEuS5o-c2QUMJin4ZHdVCfByJupKwAfX7BrBo
|
12499 |
shtec_rlhf/serve/cli.py |
sha256=rg-vvvk3D-O9ZQcgkg3XiE20GA5QtRBxG-WOckeA0lc
|
9349 |
shtec_rlhf/values/__init__.py |
sha256=5Tzvf_PHWAx8Rhq0Prj1Vd6xJ_cwYAeTI3QqOl7izbM
|
869 |
shtec_rlhf/values/cost/__init__.py |
sha256=rrfiIKRsscwq3fddZPGjyPjhUBticz-u_NaKQMeLlWg
|
774 |
shtec_rlhf/values/cost/__main__.py |
sha256=odqMBMkpmMCKtfx-SrFbzh7Iqrdasy1DXwXO42e851w
|
866 |
shtec_rlhf/values/cost/main.py |
sha256=TCsZQxEUc7w9h0xmjCV1-BXLxiXZLJUhEu6Y8xxpalw
|
10377 |
shtec_rlhf/values/cost/trainer.py |
sha256=iw1XCjrDr_sKaIpjgDTQHT7rtLa3XeWwStpj9qx1Nmw
|
14258 |
shtec_rlhf/values/reward/__init__.py |
sha256=KBOuaK6LTCJx8VWNPZZTf9_sKYxAjND1DDs6VvBmj_w
|
780 |
shtec_rlhf/values/reward/__main__.py |
sha256=EmaGmlNO_y5VKeEmmXETZrISTpdK1mE-ls_OAhNdi8k
|
870 |
shtec_rlhf/values/reward/main.py |
sha256=GFGIntABBQyP3jf3BBnDdXdPy1RgtruRqNkpq5PvhZs
|
10397 |
shtec_rlhf/values/reward/trainer.py |
sha256=1Fee7pNavkHaBNEYMttwHtrA1rLe-Mj6oMj1T8WK4-g
|
10995 |
shtec_rlhf-1.0.5.dist-info/LICENSE |
sha256=1qqHIb4EWxMrQ29OsxB6OBiewW_eb9WsLbGF1oEyN2Y
|
11380 |
shtec_rlhf-1.0.5.dist-info/METADATA |
sha256=rpHQJJtCUNqvk6CGL2iAd3b096Gc75WO_CzlDKuAmzY
|
2509 |
shtec_rlhf-1.0.5.dist-info/WHEEL |
sha256=2wepM1nk4DS4eFpYrW1TTqPcoGNfHhhO_i5m4cOimbo
|
92 |
shtec_rlhf-1.0.5.dist-info/top_level.txt |
sha256=2HJwowMnZse7nGlMq36TDAFJT8pat6ikEOmBDkHgKBI
|
11 |
shtec_rlhf-1.0.5.dist-info/RECORD |
— |
— |