sevals
View on PyPI — Reverse Dependencies (1)
0.0.3 | sevals-0.0.3-py3-none-any.whl |
Wheel Details
Project: | sevals |
Version: | 0.0.3 |
Filename: | sevals-0.0.3-py3-none-any.whl |
Download: | [link] |
Size: | 1267698 |
MD5: | 9558f70d293349a855d505ce14d19ea7 |
SHA256: | bacf6ba311d6ed8c145453c0462f473ebcba91e829c2079d571ecf5eda6da31a |
Uploaded: | 2023-12-30 02:27:58 +0000 |
dist-info
METADATA · WHEEL · RECORD · top_level.txt · entry_points.txt
METADATA
WHEEL
Wheel-Version: | 1.0 |
Generator: | bdist_wheel (0.42.0) |
Root-Is-Purelib: | true |
Tag: | py3-none-any |
RECORD
Path | Digest | Size |
---|---|---|
lm_eval/__init__.py | sha256=9-jqCb66p_m29iqX1zVNpo_MzAIGznMZKNKOZKfEsxI | 49 |
lm_eval/__main__.py | sha256=xtWAPM-GQwTg59zFf0vCE4q0zvu1Ijhfoj16H7iB0dY | 12690 |
lm_eval/config.py | sha256=G4D3I0IbuVeqcQ6fklqiK5HpPmv4ylyd1Mesq9Q8O-k | 1691 |
lm_eval/evaluator.py | sha256=q4YqGvU3SGUCfes-5U7GKAYgEM9COONkUcsJLwwGnxM | 25019 |
lm_eval/logger.py | sha256=sbzhLS9KTYWHvoGTiDjlc62aA-QW7ARQp_DjmFhjhEw | 1886 |
lm_eval/scholar_api.py | sha256=CavfGqnDEMwq4On3W6ZyLIMX2FEhTm4aRpWyUQJOswk | 14384 |
lm_eval/utils.py | sha256=0gfz4PtiDI7wHHhf_XeMpROhMqydhgbWfGv7CwD35ME | 25046 |
lm_eval/api/__init__.py | sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU | 0 |
lm_eval/api/filter.py | sha256=B5W5aAVHxRnNgw4l9HiXpCzwmRj-hjThtbQ9T6nx6QA | 2046 |
lm_eval/api/instance.py | sha256=Y7JJt2i5w_C5J8_rFwUohWYmA6KYGANomRaQ6Ixmzsw | 970 |
lm_eval/api/metrics.py | sha256=5Poi2oc3vd3ra8lG6DtQlm7KkO7kbXxII4KYtU02ZAE | 11341 |
lm_eval/api/model.py | sha256=CtjKLJH2gjAku_6jDuqk9eknfDUEqo5vrgST_VdqX5U | 9181 |
lm_eval/api/registry.py | sha256=ly1fBWPG54TQox3WhmGlrygLQ4IQSPHJZS1BzbcmndY | 4580 |
lm_eval/api/samplers.py | sha256=lGwE6NcllaUSbhjuoD1CZyyJPdtZpcSpjpSjLTOlBe4 | 3946 |
lm_eval/api/task.py | sha256=MdJsXMh6Qrb6Ln4TlY_z9TH_gFQNbtpeFmq2d7KEgHA | 49786 |
lm_eval/decontamination/__init__.py | sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU | 0 |
lm_eval/decontamination/archiver.py | sha256=_JyIwE6K2wJRcNB_FW0cyEcVPz8i-LS9sBozoBa_uG8 | 5664 |
lm_eval/decontamination/decontaminate.py | sha256=gXPd4lDVy_chupLZm4gC6VWVn3PRmKkm-rrdbiVaqr4 | 6928 |
lm_eval/decontamination/janitor.py | sha256=vprTq2dYuQUlimblgHyuJXQAfoR0hpvxmlTib120MoI | 13175 |
lm_eval/filters/__init__.py | sha256=LH-vFT3y2ovvymZSNk2tI9e5gHx-bN7xSE4JOeg79lA | 1516 |
lm_eval/filters/decontamination.py | sha256=faJSuxPQVNdLIJOSUvN5z-yNyrdc3oADYS6m2xqTIEg | 630 |
lm_eval/filters/extraction.py | sha256=MBuxKgGJRkddNq7jirV4YkN12SavCV3Jxiw1Mx_9WxU | 1771 |
lm_eval/filters/selection.py | sha256=45oHOvsQZZQ0UepMaoKgSVUHXwJz71viOylkxkeNYkM | 1606 |
lm_eval/filters/transformation.py | sha256=IbrkthJKPDyYWX4oCFYNMt5-vp3jdbEqj-XEnssqRsg | 1532 |
lm_eval/models/__init__.py | sha256=1AY6oTEWf-rS6UkKfSeGu11H-toQ9oXa2CdvysZvEnc | 207 |
lm_eval/models/anthropic_llms.py | sha256=k3EGrWXjqfaGhOqs_9oJdEO_JSHM6tPqAEQfHYWoOqA | 6605 |
lm_eval/models/dummy.py | sha256=uazrWKCG7im191wG1tUu9MpKT1p1sM3-485Unn1un7g | 1111 |
lm_eval/models/gguf.py | sha256=JLa6E6zlTDOpc-l2HnO52SE4rXTF4e6_-sx_pJF-mLI | 4635 |
lm_eval/models/huggingface.py | sha256=lV0PxHqTrBeU-hbCoUESTWKqma-AAjk0pntd5EGFhHA | 42178 |
lm_eval/models/openai_completions.py | sha256=o-Lzy4gWiMk2tgajM9dMihjfk83-i4_4Ld9jlhjd13s | 18993 |
lm_eval/models/textsynth.py | sha256=Vi53mKG4Zvpp4OlCI9ZZjJyWkjKOOjdhopltxI9LeTw | 5543 |
lm_eval/models/vllm_causallms.py | sha256=IV683bLrImMAgI7FLnLsZHgDjtsDn5VK7Zm7OKsn2YY | 16060 |
lm_eval/prompts/__init__.py | sha256=16tuZ-0K2n951_BRSJoM920CnZPLPP_Kc1eg5XSpeOQ | 4437 |
lm_eval/tasks/README.md | sha256=y6MIxC_dZ87xW5jaSylKRRE7CEi12-V_W4mrT4ES5NU | 1909 |
lm_eval/tasks/__init__.py | sha256=OkU6Doku07dNW2wHuzwfK34ULhetq7qCWouIuKrOWEI | 9242 |
lm_eval/tasks/__pycache__/__init__.cpython-39.pyc | sha256=MSsngB30cuOph9eo_trxnwL4LvpcH-nby01OE_SpTz4 | 5844 |
lm_eval/tasks/__pycache__/anli.cpython-39.pyc | sha256=1N1W2l3Oml0KiU2-w46UCnPUv-HY6RLKMNQAgO-do7c | 5606 |
lm_eval/tasks/__pycache__/arc.cpython-39.pyc | sha256=Y0cecXCny9Oyy8IzTwEkT3Z1j8Zxpzyd_pnm6y0EwHs | 3476 |
lm_eval/tasks/__pycache__/arithmetic.cpython-39.pyc | sha256=4jfD6Az5rIL_9fEAOCJb1bd9RH7roNDuQuLzY3n1tv8 | 5485 |
lm_eval/tasks/__pycache__/asdiv.cpython-39.pyc | sha256=V5KcmdhB_IFPbzYHGyDFTre97K5kmzkVBwvkOx80wsY | 4276 |
lm_eval/tasks/__pycache__/babi.cpython-39.pyc | sha256=lbd9TCl8A_Cs08V7TSDluj8XDupn4djfq2bwNyQl27w | 4115 |
lm_eval/tasks/__pycache__/bigbench.cpython-39.pyc | sha256=V2jYfy1d4tBgxuPo7RVBZCDyPZFg4MvIfo8agmxL_ig | 17141 |
lm_eval/tasks/__pycache__/blimp.cpython-39.pyc | sha256=vzBpq5EX0PRI8asEuPetvCprUqpTCtSgPunWzAO-1rs | 16938 |
lm_eval/tasks/__pycache__/cbt.cpython-39.pyc | sha256=CLBSsr7eAlp1CzavnSXyo9ocGCCcU6kkg_rgmboq4hQ | 6145 |
lm_eval/tasks/__pycache__/ceval.cpython-39.pyc | sha256=zEywGuUrFWPU_t9BV9s_Di7nEgnkE_QdvB91P0r-478 | 7552 |
lm_eval/tasks/__pycache__/cmmlu.cpython-39.pyc | sha256=uK6p9wluVajxgZN8KG6dQzP1riynuEukIHAzF3cew5s | 10102 |
lm_eval/tasks/__pycache__/coqa.cpython-39.pyc | sha256=Uzw4kH6McC0UzAw3tQWu_JOiZCuC0d9auUFW9Kd9IJE | 6401 |
lm_eval/tasks/__pycache__/crowspairs.cpython-39.pyc | sha256=rHTgBX7hlcHOKyzs7PMA08sIVFKP5pfOspP-O8N5ycw | 11800 |
lm_eval/tasks/__pycache__/csatqa.cpython-39.pyc | sha256=DDDiVMpwr-jJ6lfVoy4aknaF5mDYXed-yAooE7cXQ9I | 2536 |
lm_eval/tasks/__pycache__/drop.cpython-39.pyc | sha256=ehZzWsfieZQw5pw1CSm68MyYqTRVbBrHW-FUnAmVKs0 | 10896 |
lm_eval/tasks/__pycache__/glue.cpython-39.pyc | sha256=TN1xQgqfRqaHKwNrNDlKc9kwe8WYfm0RxVlhd5D24Cc | 21543 |
lm_eval/tasks/__pycache__/gsm8k.cpython-39.pyc | sha256=dKv-RI9-IRO0SipOyI4oJGg4RVjI4Q0ylqv33GxQeIo | 5580 |
lm_eval/tasks/__pycache__/haerae.cpython-39.pyc | sha256=5UxQZOOrjc-v0bRAVUxwUdN57QpWzaNTPHZuTyVrDuE | 2186 |
lm_eval/tasks/__pycache__/headqa.cpython-39.pyc | sha256=-1yFty5XhkKCKqIbJp2gxfk4cLeWBR1z_V-SVuaqulg | 3929 |
lm_eval/tasks/__pycache__/hellaswag.cpython-39.pyc | sha256=D5M87IwAs1PVVyzo6GkE1LDG3uFxk6MUCme4LfWtOtI | 3548 |
lm_eval/tasks/__pycache__/hendrycks_ethics.cpython-39.pyc | sha256=k1slrMmiLgDocE7tZXMhrdKKgHB5Uxv6oPOodlTE_n8 | 16529 |
lm_eval/tasks/__pycache__/hendrycks_math.cpython-39.pyc | sha256=CEijCrcdR-tcadW39iIBpGlnfc9Xg6UMttkWjaalNiA | 8629 |
lm_eval/tasks/__pycache__/hendrycks_test.cpython-39.pyc | sha256=d2jLfhUqY8YG9SQEXtERUOiLZJBTmjE-bq9-X0fB25Q | 6672 |
lm_eval/tasks/__pycache__/json.cpython-39.pyc | sha256=oi7q-idRVM2TKfa1Qzv-DrJ1gFeCo6uKXVJZlgeuQ6U | 3169 |
lm_eval/tasks/__pycache__/lambada.cpython-39.pyc | sha256=3s3dh1Koaamys9AoA0Qy8kfX6d9VdOlTt8qdaMsHv7U | 4846 |
lm_eval/tasks/__pycache__/lambada_cloze.cpython-39.pyc | sha256=l-2jsLXT6AuzJUcXcwI3sIIfQ_26vr5g3eRWnSF68us | 3016 |
lm_eval/tasks/__pycache__/lambada_multilingual.cpython-39.pyc | sha256=l0tXonWiUqVI-nkO0Txzr0fdHQQU_hUe5C1sweCBtuo | 2563 |
lm_eval/tasks/__pycache__/logiqa.cpython-39.pyc | sha256=XPQdDQ2dE6alEl9-GQHdIbRFRQqk-guMEcI52uwPkw0 | 3613 |
lm_eval/tasks/__pycache__/mathqa.cpython-39.pyc | sha256=xYxV-o8UuY_JfEiNYORm8SnS1QEtrsmcWsLP4nIIZxY | 3130 |
lm_eval/tasks/__pycache__/mc_taco.cpython-39.pyc | sha256=c8XMj7Dit7XtMloNmTb6ayN0kiVNbBSXRYhIK2cqqCo | 6554 |
lm_eval/tasks/__pycache__/mgsm.cpython-39.pyc | sha256=93Y8tlICyh8_dB3zv0rJ5bvdr0_TGWKSTdULZkOwfAo | 8608 |
lm_eval/tasks/__pycache__/mutual.cpython-39.pyc | sha256=M0O859VpKBY3wmYc4T63VSCg2xaPgQetc8OGVRfcmn4 | 4446 |
lm_eval/tasks/__pycache__/naturalqs.cpython-39.pyc | sha256=lCJw62Xxz8VKld4zKUM86nLlYgxL8erMF6SsRrtyKS4 | 5949 |
lm_eval/tasks/__pycache__/nqopen.cpython-39.pyc | sha256=e_5DE9bGuLCVIQTbjyE8Hz2hUTW-bCGicCxwuW4mfFE | 6674 |
lm_eval/tasks/__pycache__/openbookqa.cpython-39.pyc | sha256=bLiDExwE5jL7_DFveJcpi3aPNGDIjtka0GQ7xy_DzDM | 3309 |
lm_eval/tasks/__pycache__/pawsx.cpython-39.pyc | sha256=lfPA_s78cbPzSUJTqVBYEOd68TEjmCEfWTplrqe0wQU | 9276 |
lm_eval/tasks/__pycache__/pile.cpython-39.pyc | sha256=UcXtfVolu5IFNDtysf2oJkqptNglsAaFXjJQYpd3kmc | 5455 |
lm_eval/tasks/__pycache__/piqa.cpython-39.pyc | sha256=WspBvQBG347-zbUHx4rZrFQIrzXr7j-9f8X9T3R4nK4 | 2683 |
lm_eval/tasks/__pycache__/prost.cpython-39.pyc | sha256=dp5N9Ss1cNnXEmxf_x26D_Fm1PLg89hasc3gclXxiGE | 3449 |
lm_eval/tasks/__pycache__/pubmedqa.cpython-39.pyc | sha256=WdnfiezVjT7mmTWg4O719_cPzSpW1eJA7xNRDkCE69E | 4575 |
lm_eval/tasks/__pycache__/qa4mre.cpython-39.pyc | sha256=r2_w2c9X0FQ_EEmjws3qyBE0I3ysKqqibSKLuP7pyDo | 3397 |
lm_eval/tasks/__pycache__/qasper.cpython-39.pyc | sha256=azwRSF0mMi-RkcxUJDylzzUT4jcrMgfkPw2_uhkWnV8 | 7494 |
lm_eval/tasks/__pycache__/quac.cpython-39.pyc | sha256=4i7jHy2jRwbUYPBQf5ApN8PUQ0IdKcmUFktalix1JnE | 5039 |
lm_eval/tasks/__pycache__/race.cpython-39.pyc | sha256=bRYau4sCRHyMfIJTlfRtNanUzY6Xlc_X0b0s0ohabg8 | 6768 |
lm_eval/tasks/__pycache__/sat.cpython-39.pyc | sha256=ka0o0ZOcYG2qWvugZ1bo1Q7Lxe-AZJymhGM7T21hU7Y | 3468 |
lm_eval/tasks/__pycache__/sciq.cpython-39.pyc | sha256=SrkcUb5g5h6OlwUffYnIssd9LrJCg3W3BD1LGIkxdYI | 2865 |
lm_eval/tasks/__pycache__/scrolls.cpython-39.pyc | sha256=4AOW9ahEczfFnk6CbdrLwTpVVu_lcvv6j1jMj009U0I | 17363 |
lm_eval/tasks/__pycache__/squad.cpython-39.pyc | sha256=6MTkJ9vc5qsUCtjjaklymk2oZo26dUbu6Co2Wd4S2_U | 6170 |
lm_eval/tasks/__pycache__/storycloze.cpython-39.pyc | sha256=j_e7oADlNEvYzcQ9gZWae6OKqbs8wZ2JFjQfUHsuxy0 | 7177 |
lm_eval/tasks/__pycache__/superglue.cpython-39.pyc | sha256=naOxaaHoLSDIa-JTGGTZM_kE6FWYhU7zGZ3FrfzmErc | 17890 |
lm_eval/tasks/__pycache__/swag.cpython-39.pyc | sha256=I-qN8BpYjnSl-NUeu2y_QGQ4yUtm2bYeZt7ncQD23Sg | 2621 |
lm_eval/tasks/__pycache__/toxigen.cpython-39.pyc | sha256=qqlzlKqcoJp8bFmlxdqcBJvE7uY1bAjZzKd_1X7FbVQ | 2989 |
lm_eval/tasks/__pycache__/translation.cpython-39.pyc | sha256=HjFnQBQcjLhm4-ANAjawDpTuGs-oyDyXxe44ev99Rw8 | 9039 |
lm_eval/tasks/__pycache__/triviaqa.cpython-39.pyc | sha256=nj5f3jvwnWhUDHQnpAJE8rDcnrWoVtpmJYACnfVE4Lo | 4567 |
lm_eval/tasks/__pycache__/truthfulqa.cpython-39.pyc | sha256=js93Q8b5imoK9juMRZt1v5MafWbN9piXV2OaPITnstU | 14269 |
lm_eval/tasks/__pycache__/unscramble.cpython-39.pyc | sha256=juHWtuO6ME_Y6_sDXnbL3d1iPIpvfSHrHy1ujKWsymo | 4830 |
lm_eval/tasks/__pycache__/webqs.cpython-39.pyc | sha256=EHUxwEoc96zmwXqMJrz6aCSTwLhCElAY7GF4lOeHmY4 | 3902 |
lm_eval/tasks/__pycache__/wikitext.cpython-39.pyc | sha256=0YwJay-rRcBtbh3OGcBt4A1AuRRUCw7odbDQ8eyR12o | 3431 |
lm_eval/tasks/__pycache__/winogrande.cpython-39.pyc | sha256=4dbf4CmDG3jpLlAIvpFNHDQK0pUFlLiJtq-v9SQYm_o | 5695 |
lm_eval/tasks/__pycache__/wsc273.cpython-39.pyc | sha256=aIFFkg4eRPKm0uOGL3psX1Muu47sPxquEXwBCXGH89Q | 7816 |
lm_eval/tasks/__pycache__/xcopa.cpython-39.pyc | sha256=FodWwumN43OS8HSnduyKAdPKVTqca0NxL8JOpohcyfY | 4771 |
lm_eval/tasks/__pycache__/xnli.cpython-39.pyc | sha256=tDnZC7-ICc8Me1J-SJI_QodOp2y6AhVfuzqXzwqBHPM | 10975 |
lm_eval/tasks/__pycache__/xstorycloze.cpython-39.pyc | sha256=gQzvE73bgP8cJG1Ie3XPwKeTuuGSPuy0xAgdK-UXLMA | 3771 |
lm_eval/tasks/__pycache__/xwinograd.cpython-39.pyc | sha256=x7vA0M4GlWNPlx8w8iHMB5zlPd_dPZfNT8PkW7Q8O-U | 3520 |
lm_eval/tasks/anli/README.md | sha256=QKLZp7Ox21Wn815nwzGczGu7Bce0fQVTRmlduKlckWU | 2042 |
lm_eval/tasks/anli/anli_r1.yaml | sha256=eoGw37l-NZcHyRGDUyJqeZ8uyr7QyzEcwgZw1498lUk | 597 |
lm_eval/tasks/anli/anli_r2.yaml | sha256=nHP-W_OHCZpr9VjX3AiRsrLVV4Cb25vSfuHRN5CmTlc | 106 |
lm_eval/tasks/anli/anli_r3.yaml | sha256=AgUdUSygTWd9giQsVVLEauQKz5NZQxjtGNBTKW3RKXo | 106 |
lm_eval/tasks/arc/README.md | sha256=2MQ1rllCO1JgRK1Sv2lYzE6OsVKYuA7HwQlNLEcJ4d8 | 1907 |
lm_eval/tasks/arc/arc_challenge.yaml | sha256=aCYhwmriSxBlotcyRgpVqO8rnyVEV0QxZmyTCanv170 | 71 |
lm_eval/tasks/arc/arc_easy.yaml | sha256=NLxwyWp9Z_wAcJmEfF4Py0W1cllo_CVI_kQW8VdF_7g | 575 |
lm_eval/tasks/arithmetic/README.md | sha256=3jHg0xARN3uYrFIhUuRfD6qv-rYAVy0ffKqzAXqklfw | 2336 |
lm_eval/tasks/arithmetic/arithmetic_1dc.yaml | sha256=vAk_ztJ-odbEj_mi6udITeVk0sxOwvEmEKRK_np4Mak | 345 |
lm_eval/tasks/arithmetic/arithmetic_2da.yaml | sha256=H6DgIxmGIV7NXQ9Vu8MDKCMU8wquqs8b7J9KoeA4oQs | 79 |
lm_eval/tasks/arithmetic/arithmetic_2dm.yaml | sha256=GFtNnpPGogepQEagyIvumrrIzGgodc5M7NlMGCUgiZc | 79 |
lm_eval/tasks/arithmetic/arithmetic_2ds.yaml | sha256=80udKkOsnZHAqgUcfh0tIdQ-CGJg1YbQTXqAZxsbP_Y | 79 |
lm_eval/tasks/arithmetic/arithmetic_3da.yaml | sha256=Hd1BHN8ymJpU4o3unjm6VeQfgmIz4lR5KK1ZinHxb-s | 79 |
lm_eval/tasks/arithmetic/arithmetic_3ds.yaml | sha256=Kj5_zxinzATv18jbv2nK2tXydu_mWXSIoSckgV9-Lvg | 79 |
lm_eval/tasks/arithmetic/arithmetic_4da.yaml | sha256=ZObI8PPmHdx62T2svuU4OYjVpdK9FHcIFIjN9KSPJlM | 79 |
lm_eval/tasks/arithmetic/arithmetic_4ds.yaml | sha256=fT3XQYlIczaRO2v1x0UnTVrqos1LItU0v82ShlWjfPI | 79 |
lm_eval/tasks/arithmetic/arithmetic_5da.yaml | sha256=_kwFCiDnyQshM-90V7fAXMBDQnzInug-9SPcM1puXAM | 79 |
lm_eval/tasks/arithmetic/arithmetic_5ds.yaml | sha256=Lj4eIB4NsS5lMFDpYM3vZv5Kk0eIaauqk7SkYqFoMVs | 79 |
lm_eval/tasks/asdiv/README.md | sha256=TQY5EyoG5evb9oZwMCZl_X_4qAX7B-nMKnOTcI_-0IQ | 1906 |
lm_eval/tasks/asdiv/default.yaml | sha256=QGn_AgOmM3ZD1v63gPDSFBe47f-Y3zLNin1XVC1hEgM | 384 |
lm_eval/tasks/babi/README.md | sha256=Y_b2kkNqyN1l3ONNomyPcZmNOI0wupDTQLAHyankfFY | 2263 |
lm_eval/tasks/babi/babi.yaml | sha256=04pXgw0UahXU8-qtDYJ6On8NuCYCeftgZxJwkQa8rpU | 438 |
lm_eval/tasks/bbh/README.md | sha256=onAqPm8i9ybbgt4mLn6CBWVRvLWg6z7DJWLeE8umSJQ | 1384 |
lm_eval/tasks/bbh/_generate_configs.py | sha256=Omg1Iqxdm5KMngtd1k50ai6KunD6dfx0PI1W8x-6MSg | 2730 |
lm_eval/tasks/bbh/cot_fewshot/_cot_fewshot_template_yaml | sha256=KnFLZMPVPniYOTv3lhovWoPUwpBmjM4-MO0zwWxYeUM | 575 |
lm_eval/tasks/bbh/cot_fewshot/boolean_expressions.yaml | sha256=SX80lLHbh-zixE0MoEdcrBfm9HI_2Rhn74c8KKrFK3A | 2032 |
lm_eval/tasks/bbh/cot_fewshot/causal_judgement.yaml | sha256=aiGhmrt_PlErBpJ71kEUlueod7qvP_cx8PBaUXn8SJM | 3873 |
lm_eval/tasks/bbh/cot_fewshot/date_understanding.yaml | sha256=LNfNG_dm177NKSGKOPNL4iVcEfKly4qlcJWaa14SD2Y | 1388 |
lm_eval/tasks/bbh/cot_fewshot/disambiguation_qa.yaml | sha256=--zOyKYRxK30XxIeohG1CBKI13-Wb5qKTHgg8oXitAM | 3829 |
lm_eval/tasks/bbh/cot_fewshot/dyck_languages.yaml | sha256=Nml5nbVVBz-XB36Qnu4zMsSgrzAWjsoW1lZCPhrbJP8 | 2699 |
lm_eval/tasks/bbh/cot_fewshot/formal_fallacies.yaml | sha256=gWhHSUucV3ZLrVOeX59wryTFkg7iwzFP-lgoCMEIN1k | 4711 |
lm_eval/tasks/bbh/cot_fewshot/geometric_shapes.yaml | sha256=7xyn1RFZL8qRgZcOzUiCl0l38uSB2yK-EKtxrNj6jCs | 5121 |
lm_eval/tasks/bbh/cot_fewshot/hyperbaton.yaml | sha256=ejBz50iniTwzljolduBcOntjBY0pwvVPQhx7WisOgdQ | 3351 |
lm_eval/tasks/bbh/cot_fewshot/logical_deduction_five_objects.yaml | sha256=pc0PspFOkx4f6bDGLvprxzAkYpqw4W2C4aVITsTJib0 | 2772 |
lm_eval/tasks/bbh/cot_fewshot/logical_deduction_seven_objects.yaml | sha256=eUOMm8IO0IOnczpZbAFHw3JL-HNgCeMRhNvGwf6HKz8 | 2774 |
lm_eval/tasks/bbh/cot_fewshot/logical_deduction_three_objects.yaml | sha256=sWp62gOC5EGrLDOPsyqC3iPE-cL3PgKc1rgBwrDnC1o | 2774 |
lm_eval/tasks/bbh/cot_fewshot/movie_recommendation.yaml | sha256=4--VJ9ezO2MAdfKqTBK2AdNgRCJZHkNI9me3YDERKPA | 2355 |
lm_eval/tasks/bbh/cot_fewshot/multistep_arithmetic_two.yaml | sha256=SCPcez8Q0wsr89cmDkO9gxFcRQdK1RDJ0d6RapArX4g | 2617 |
lm_eval/tasks/bbh/cot_fewshot/navigate.yaml | sha256=6vbI3FhHG-Y6C_6MBOa5OuBfnhBFE0oAn-Cjn5rCgog | 2358 |
lm_eval/tasks/bbh/cot_fewshot/object_counting.yaml | sha256=BcqvMVU3zTVJcnMF2cppkaLPEaZE-vLoF23_dKtZECo | 1637 |
lm_eval/tasks/bbh/cot_fewshot/penguins_in_a_table.yaml | sha256=T_AUHb_bDV2i-a0P1VcA-d-eDQJEICw8awa1YbgKvyo | 2617 |
lm_eval/tasks/bbh/cot_fewshot/reasoning_about_colored_objects.yaml | sha256=GBJ5KlCOYrg7YXge38glFGnN1K7s3lGoWShSrHKpJUk | 2572 |
lm_eval/tasks/bbh/cot_fewshot/ruin_names.yaml | sha256=LvnZQ2lh0YTl0g0uTs7cc3sT740f29hb3XZZjAFfoC0 | 3817 |
lm_eval/tasks/bbh/cot_fewshot/salient_translation_error_detection.yaml | sha256=XUDL9CRkr6zWhYcAcxI1rYTeleuYHgrmXEE6WrSg1go | 6421 |
lm_eval/tasks/bbh/cot_fewshot/snarks.yaml | sha256=D6LsaVZXbNG_KdEDLqjM2sZzRFtbIsIPh0KZZANG6XU | 3310 |
lm_eval/tasks/bbh/cot_fewshot/sports_understanding.yaml | sha256=n8lylHWU7Ncui60xqq2rm-KlhE7Iq-mIgue9szB6D8o | 1029 |
lm_eval/tasks/bbh/cot_fewshot/temporal_sequences.yaml | sha256=P-RhNRRAHL-KEF6tf_jdBhsTPnKM1aF-WGpUB0Pab1A | 3288 |
lm_eval/tasks/bbh/cot_fewshot/tracking_shuffled_objects_five_objects.yaml | sha256=LXOk7Cgh4ugEQOYpdhFPDbY5x7uh4y0pcLpteWfS1iU | 2872 |
lm_eval/tasks/bbh/cot_fewshot/tracking_shuffled_objects_seven_objects.yaml | sha256=ejl57zVi3a4jaPDgPVIHeopWZCCabqPc93NF1fhTFmY | 2874 |
lm_eval/tasks/bbh/cot_fewshot/tracking_shuffled_objects_three_objects.yaml | sha256=nZ7XmSNzkeJbi8gmPao0zaRkSo05ykp8GFkg7oxk0Ms | 2874 |
lm_eval/tasks/bbh/cot_fewshot/web_of_lies.yaml | sha256=ReCGKrRD_ZY6C1vmWA0t3dbsc3dNsxJMsNr1Y0YLGMA | 3147 |
lm_eval/tasks/bbh/cot_fewshot/word_sorting.yaml | sha256=lwoyGODKSl7OEhkDFBbr1kl7daBUW-jnvDi1gb4feWY | 2533 |
lm_eval/tasks/bbh/cot_zeroshot/_cot_zeroshot_template_yaml | sha256=YLnPhnc-bjfWXRcSv9_DT1qnoEksUBDe-un-8QjkDPw | 657 |
lm_eval/tasks/bbh/cot_zeroshot/boolean_expressions.yaml | sha256=WeYX1fBxXLi6X-UZGhjTa9qe1421xst4bNjKdkFeH3A | 261 |
lm_eval/tasks/bbh/cot_zeroshot/causal_judgement.yaml | sha256=l1lM4A-gq3787by_DxDRRGc7oREow3mmeQg-mt15TCg | 246 |
lm_eval/tasks/bbh/cot_zeroshot/date_understanding.yaml | sha256=TEftBhr7NNeFk-7JhjmR3c2lB7LE0P-i6ApOLBuzoso | 236 |
lm_eval/tasks/bbh/cot_zeroshot/disambiguation_qa.yaml | sha256=hdTGBg8_BXzL_pdev6ptU34sF81Bj9xbXXNZMor3EcU | 263 |
lm_eval/tasks/bbh/cot_zeroshot/dyck_languages.yaml | sha256=RnWkgB5NmCzsopam6oLMEUFKki8ZjMEhZ79WZZnm_FA | 230 |
lm_eval/tasks/bbh/cot_zeroshot/formal_fallacies.yaml | sha256=bx1n06rJOC64fzrbhxvdOnnzpm2QqbngEO8EsKoFLq4 | 266 |
lm_eval/tasks/bbh/cot_zeroshot/geometric_shapes.yaml | sha256=c2UFUy6b0NOvexJPq865bXE5qxd_XswbyiI0u0ICQRA | 247 |
lm_eval/tasks/bbh/cot_zeroshot/hyperbaton.yaml | sha256=dTdgx0e9hw7dJJ_AK_Uf28oXRAnDzBnVmIyXN4k1daI | 240 |
lm_eval/tasks/bbh/cot_zeroshot/logical_deduction_five_objects.yaml | sha256=1BE-GhGBwh1PIuwp3H5meT3TOHE6bNt_504GwG-K3Gw | 316 |
lm_eval/tasks/bbh/cot_zeroshot/logical_deduction_seven_objects.yaml | sha256=j3wiZvAibQcVhB3IkoFNhakDXaWRlfV3HzoM0jDP2z0 | 318 |
lm_eval/tasks/bbh/cot_zeroshot/logical_deduction_three_objects.yaml | sha256=LTphZr5bUez-pjXx6cvRSFqDdMWXcnL8cxUskXq5DP0 | 318 |
lm_eval/tasks/bbh/cot_zeroshot/movie_recommendation.yaml | sha256=Dusez1KwBng77R8y8o2QQOLV9y92QZ21TaUNKGf2rRo | 265 |
lm_eval/tasks/bbh/cot_zeroshot/multistep_arithmetic_two.yaml | sha256=LCznNQTpfhDND7CXxGJtbT92384MiMPZ187_43M957I | 257 |
lm_eval/tasks/bbh/cot_zeroshot/navigate.yaml | sha256=9akHyCJl4yRLYhMpDa9UIivP80t9uIB-G5hSnX9m-2s | 293 |
lm_eval/tasks/bbh/cot_zeroshot/object_counting.yaml | sha256=nzP6RcHXc3RMiwanmHDiEdMxlJuQGheCw8Ue8DTbQb8 | 280 |
lm_eval/tasks/bbh/cot_zeroshot/penguins_in_a_table.yaml | sha256=Bzb6UHMaz5Y6uaNhxknXn6rY3tI_86GZ0E3g9IMfDXk | 274 |
lm_eval/tasks/bbh/cot_zeroshot/reasoning_about_colored_objects.yaml | sha256=ZPz4sZ6lb7GZapzxKh1FOo2FH7ED_Q1eXnsCOhoA5dA | 309 |
lm_eval/tasks/bbh/cot_zeroshot/ruin_names.yaml | sha256=WyvQ15Uc-p0Wt0DRbbP_HmdNhPVkGhstZrgPLQKvu_c | 269 |
lm_eval/tasks/bbh/cot_zeroshot/salient_translation_error_detection.yaml | sha256=XCXXq_6fhIqSM7csNN50Y_q08234rR0eKTE--fxO1wU | 321 |
lm_eval/tasks/bbh/cot_zeroshot/snarks.yaml | sha256=fEkxQpR6a_oYneli2QU79NVQCv4JaS7kqXi1rezhk8s | 555 |
lm_eval/tasks/bbh/cot_zeroshot/sports_understanding.yaml | sha256=Jk10AIuNG3h5-qhG88LhlVauTqVjNK1an8eHL-fhGBA | 306 |
lm_eval/tasks/bbh/cot_zeroshot/temporal_sequences.yaml | sha256=f8ra_-gx2S0O8KCziN54IuWMIM8aVyUMTibzPP3-mLY | 296 |
lm_eval/tasks/bbh/cot_zeroshot/tracking_shuffled_objects_five_objects.yaml | sha256=sx0LliAkEEmcBpGZSaHRU5bpMP3rRcSIS79Yezaoq_Y | 388 |
lm_eval/tasks/bbh/cot_zeroshot/tracking_shuffled_objects_seven_objects.yaml | sha256=y8SPU1nJNU484fIl0tqy92W2CxGPq1au_3P32psIRHw | 390 |
lm_eval/tasks/bbh/cot_zeroshot/tracking_shuffled_objects_three_objects.yaml | sha256=BsRxiWkhMa5OePsWIjNQ008IIAeK6O6ZBA3YM8e-Ohc | 390 |
lm_eval/tasks/bbh/cot_zeroshot/web_of_lies.yaml | sha256=7J2pYYVyCjosJFiBX0DoszjN6dUbikQ8VogE4TwG5TY | 257 |
lm_eval/tasks/bbh/cot_zeroshot/word_sorting.yaml | sha256=UAkFoXF3iixjWDmExwWnrb1OWyjp1DJpWjbpUvA-m2s | 217 |
lm_eval/tasks/bbh/fewshot/_fewshot_template_yaml | sha256=PUcMVyfPH_ndAaafeV6ND7LLAHWlFs8nJgayD8fZYhg | 402 |
lm_eval/tasks/bbh/fewshot/boolean_expressions.yaml | sha256=1tIp6Y5eC9Dya8yBzxVjdYO4nUCbAlIaFzG-K8xv8Hw | 367 |
lm_eval/tasks/bbh/fewshot/causal_judgement.yaml | sha256=vantgzSIBZhR_qxJRO2uWbIgyA7AuKCIR7Sn8_GFqRY | 2338 |
lm_eval/tasks/bbh/fewshot/date_understanding.yaml | sha256=ySlQrnYJxmE3GSnL_cqT8jvDqQB5fvEVXMpjEfrhKcA | 815 |
lm_eval/tasks/bbh/fewshot/disambiguation_qa.yaml | sha256=6JRUEFVFBTqG17T-072M7uEyLjus--VaiaXsGFatUgs | 1164 |
lm_eval/tasks/bbh/fewshot/dyck_languages.yaml | sha256=a394IE2EtX-i8QOBgAu6olHe96syKt1AjxOt8N0bYSE | 622 |
lm_eval/tasks/bbh/fewshot/formal_fallacies.yaml | sha256=kqv_qxXfSoSwTViot4G_8yBKEx1uhG8XqOK46g3kqAA | 1839 |
lm_eval/tasks/bbh/fewshot/geometric_shapes.yaml | sha256=TZwKR7vJ2Z9x0l7GY1glQ_6_vPTcBQRU7jrzF0AK_aU | 1074 |
lm_eval/tasks/bbh/fewshot/hyperbaton.yaml | sha256=hvcnVDCbmUPxnMiI_P6qVVqlUfRtKT8yCvl4KWGAMjM | 634 |
lm_eval/tasks/bbh/fewshot/logical_deduction_five_objects.yaml | sha256=dSRQXf8szjv_yDPSHFFxphv022anRQOzPReBqY-s5Ik | 1539 |
lm_eval/tasks/bbh/fewshot/logical_deduction_seven_objects.yaml | sha256=ty843RXDantbT5JKldYf4ZtEJcsEIpn9xxBaLGT58Qg | 1541 |
lm_eval/tasks/bbh/fewshot/logical_deduction_three_objects.yaml | sha256=oU9T3xpAVcaFyMKhvdkUyPjtTvhrNlJHG8TK3EdcgMQ | 1541 |
lm_eval/tasks/bbh/fewshot/movie_recommendation.yaml | sha256=jS9ruvpQwcgiyaR3KVApBGDgf3QyX2wTWx61FFd9PFk | 906 |
lm_eval/tasks/bbh/fewshot/multistep_arithmetic_two.yaml | sha256=pwWjm5OLv_qjiu296ZtUrCC0glShTq8uk0H94yV6pWM | 389 |
lm_eval/tasks/bbh/fewshot/navigate.yaml | sha256=QOTReNyaIjZyn3F7THRwJuU6CCbuyRBanSC7Onunkb4 | 842 |
lm_eval/tasks/bbh/fewshot/object_counting.yaml | sha256=6yrD3p-nOVN9ymXekvX1H1YSxWVhSFse8CobjcWI4vE | 689 |
lm_eval/tasks/bbh/fewshot/penguins_in_a_table.yaml | sha256=0PM3HhN17hsmGB7TqSIbgveusa0LDW31CQDXZeqZX3k | 1542 |
lm_eval/tasks/bbh/fewshot/reasoning_about_colored_objects.yaml | sha256=TTtJaKleXVRX71doDMkk7mx3sw4kcL7axNpBjeiq-vE | 1509 |
lm_eval/tasks/bbh/fewshot/ruin_names.yaml | sha256=JMYb663T6w_MJkQGh8jaB1b9RrGFmVtntFnHjfQ_PXg | 882 |
lm_eval/tasks/bbh/fewshot/salient_translation_error_detection.yaml | sha256=APT876ojQHdbClvWMR2mUNh29aHRa3jVhi4cETOEivw | 3738 |
lm_eval/tasks/bbh/fewshot/snarks.yaml | sha256=FcUe10FIsqJVhKAbrCn6znCzGD0p0EV3I4kGjE9Da6s | 1226 |
lm_eval/tasks/bbh/fewshot/sports_understanding.yaml | sha256=06OeVP9JHyVB2-2YtVipiDhp4Q5OwoTEbYmbUDMZ5XU | 579 |
lm_eval/tasks/bbh/fewshot/temporal_sequences.yaml | sha256=D6yGSWcJ74UkOHqm6Lhs26h-10ejWb_hnT8jjmuUPG0 | 2117 |
lm_eval/tasks/bbh/fewshot/tracking_shuffled_objects_five_objects.yaml | sha256=LKa6X23i3JsbfDZejNcofoPl32Oib4q5E09z7eeDRmY | 1705 |
lm_eval/tasks/bbh/fewshot/tracking_shuffled_objects_seven_objects.yaml | sha256=Bn-uESnumu6mDPrsNMN8AEB6iwz7A3c_5BvwNDZNais | 1707 |
lm_eval/tasks/bbh/fewshot/tracking_shuffled_objects_three_objects.yaml | sha256=XhCmfLNUUK73TRLNMqnFnXrEdh9fgdykesi9weSaNGw | 1707 |
lm_eval/tasks/bbh/fewshot/web_of_lies.yaml | sha256=QQomeDW4QMJwaJIaGz9mBQ4wY1rzVHubyiiAhsixLZY | 813 |
lm_eval/tasks/bbh/fewshot/word_sorting.yaml | sha256=UhnU8RCtK0DE22qIoaRzo3VKpIUDuV5OjmXdazKHkbU | 582 |
lm_eval/tasks/bbh/zeroshot/_zeroshot_template_yaml | sha256=95ft6nOgFtFIM3Ko_BYEMas3cnQ2TEO9kS513hL9STc | 404 |
lm_eval/tasks/bbh/zeroshot/boolean_expressions.yaml | sha256=mrFX0fCvRrIxlwLLs28Ns3gJG5aPumHFLmFAowI1Jik | 225 |
lm_eval/tasks/bbh/zeroshot/causal_judgement.yaml | sha256=MSMdB_phIrAVEqmX6DW8a1476kZCYn71z2jk6k8FZ1I | 210 |
lm_eval/tasks/bbh/zeroshot/date_understanding.yaml | sha256=7kwAlkLAgiBoPqOEEu-J97VPq7aQcQBx6VZh13RGjuc | 200 |
lm_eval/tasks/bbh/zeroshot/disambiguation_qa.yaml | sha256=UdNJ064fiVGUgm68JDzV6HAgHVWToNLjNTtL4gDZpe0 | 227 |
lm_eval/tasks/bbh/zeroshot/dyck_languages.yaml | sha256=VvQuToGz8TV627yvaRr8dVsY1CQXSsNlrrA8qbl0I4Q | 194 |
lm_eval/tasks/bbh/zeroshot/formal_fallacies.yaml | sha256=rGXNxut9CyKYKwWKAhWC-DLDY6ESafaFK8PztRWCDmc | 230 |
lm_eval/tasks/bbh/zeroshot/geometric_shapes.yaml | sha256=BJKcGQLjFwWsTzl1e3BY5PKYOaqFuti_Plk_WQ6BEo8 | 211 |
lm_eval/tasks/bbh/zeroshot/hyperbaton.yaml | sha256=YpEgtomD4Z6oT3smKCSW9HtmK3ePXAN4QUWyfmDKGHQ | 204 |
lm_eval/tasks/bbh/zeroshot/logical_deduction_five_objects.yaml | sha256=RmRkQ6RQFCr27ubi41_h0TvD44jz7AB33opRCiqVw-k | 280 |
lm_eval/tasks/bbh/zeroshot/logical_deduction_seven_objects.yaml | sha256=PeJyYqRN9TQZF_MAL7Ww3-7Y6oUTv0v1ILb91nelgmk | 282 |
lm_eval/tasks/bbh/zeroshot/logical_deduction_three_objects.yaml | sha256=xfnx-wld_s3rBHTqLt9BGHW4xlt_PHauXiiIck3ebQk | 282 |
lm_eval/tasks/bbh/zeroshot/movie_recommendation.yaml | sha256=u-cfRZxSumjp_DA2fXP71r8-LkbzqRupyTKCrnGZXPY | 229 |
lm_eval/tasks/bbh/zeroshot/multistep_arithmetic_two.yaml | sha256=CHDNvy-3tK96KUTt2H-IlJug46DzmSJeUR6YWFYhEOE | 221 |
lm_eval/tasks/bbh/zeroshot/navigate.yaml | sha256=gwMXnG1MFLvG71AY5Zc-j1enPHAMSm68BEc3kFZzHjQ | 257 |
lm_eval/tasks/bbh/zeroshot/object_counting.yaml | sha256=-5j9PbSQLbsjMNNELPzIeGuUA4RKemWjtuODhMwQudg | 244 |
lm_eval/tasks/bbh/zeroshot/penguins_in_a_table.yaml | sha256=KT6B9IB549AYHSy8Rq91P9g6eoIVLQHDu-J0ufM8aSw | 238 |
lm_eval/tasks/bbh/zeroshot/reasoning_about_colored_objects.yaml | sha256=T7feR3GZUGNXQfcvqp9PQTUYnxSNxVorRNbslKaUeUY | 273 |
lm_eval/tasks/bbh/zeroshot/ruin_names.yaml | sha256=6Nnp8-A0ZAzZKdyGHlmuHqWSSI_Lh2t6ARySlZdW4vQ | 233 |
lm_eval/tasks/bbh/zeroshot/salient_translation_error_detection.yaml | sha256=Ekxj38CgDhGc3q0QOcX9cMMh0FCM7F5chwbuPDIY1SU | 285 |
lm_eval/tasks/bbh/zeroshot/snarks.yaml | sha256=ZRfRagNttGQOyg7YpsAFcHLlk1-TOkSOaKXygV3W0Gg | 519 |
lm_eval/tasks/bbh/zeroshot/sports_understanding.yaml | sha256=IznLZAtZQKHXMnxbIftDK48NrsmKPNB-DL5b7pCACgo | 270 |
lm_eval/tasks/bbh/zeroshot/temporal_sequences.yaml | sha256=WThhTOqmLdLsCCkFmOfLPTBf1dcJ3lWG2Vl92ZKyfu0 | 260 |
lm_eval/tasks/bbh/zeroshot/tracking_shuffled_objects_five_objects.yaml | sha256=Iakr6nbReBfcYGyRJvm5tr_21VUjjimzzPQFID_Kyww | 352 |
lm_eval/tasks/bbh/zeroshot/tracking_shuffled_objects_seven_objects.yaml | sha256=qP-RqLMupIrJwx01-KF_0DOE4moL_p2Lpi4Hj_5cj-w | 354 |
lm_eval/tasks/bbh/zeroshot/tracking_shuffled_objects_three_objects.yaml | sha256=Rh2c5OpcbotG5jXbzIH1S9MOLnRqTyWUjWAnYoxufGI | 354 |
lm_eval/tasks/bbh/zeroshot/web_of_lies.yaml | sha256=MUuHxBqmMEC0-nXX7xym-lENOVIrFZ4VYg1VBalWoIM | 221 |
lm_eval/tasks/bbh/zeroshot/word_sorting.yaml | sha256=1I5yXWvNk1-2wqauzDzcy1Jf44abpsbKQ4Lyc59y8xQ | 181 |
lm_eval/tasks/belebele/README.md | sha256=DePrXLzy0Wd8hP3XqMGXlXBRLZsczh1aEN4-MhTxMv4 | 2578 |
lm_eval/tasks/belebele/_default_template_yaml | sha256=AHjhB4rq9bU2cpUX_GrkIunCKBb7lp3OXMWxNxQJ7XI | 649 |
lm_eval/tasks/belebele/_generate_configs.py | sha256=FEE7dgUxK1bC3eX6NMdnC70EJ5v2FUj8ap_gxUPn_kU | 1838 |
lm_eval/tasks/belebele/belebele_acm_Arab.yaml | sha256=3qImw0i71UboOFSeQd2TmVioQiC0JfhMSP8iVxnDYXE | 91 |
lm_eval/tasks/belebele/belebele_afr_Latn.yaml | sha256=m9VbibTpvWsh2S4C3lSIva0pX0wNP3M5eL9et3Arjsg | 91 |
lm_eval/tasks/belebele/belebele_als_Latn.yaml | sha256=e1GA-9SBHfa9gf_I1yMB3By2EyEPKrZk2o6nBHJdoT8 | 91 |
lm_eval/tasks/belebele/belebele_amh_Ethi.yaml | sha256=csGr6kqh4mIfvLkpPKmahQm1VPCYa0exwMdUA9BIb1I | 91 |
lm_eval/tasks/belebele/belebele_apc_Arab.yaml | sha256=gOl6I5Puz8U_XVUiH8Rde3QMzhaICpfgdnhVIw-mPG4 | 91 |
lm_eval/tasks/belebele/belebele_arb_Arab.yaml | sha256=8quJ4Dg542i2TQAJGMUhTCTuNGnOK33yOkSbcuvH5HE | 91 |
lm_eval/tasks/belebele/belebele_arb_Latn.yaml | sha256=qOgXqifahfDEOZpcbSyx6m5fL4JONX_LDzNCrKOZxCE | 91 |
lm_eval/tasks/belebele/belebele_ars_Arab.yaml | sha256=wpO0b15mO0JV-9FfQurbM_o1bBf7Qp2la2HEwiX5m_I | 91 |
lm_eval/tasks/belebele/belebele_ary_Arab.yaml | sha256=2Od_iwAx0ssqDQRpL5ExCNKvz30y_IkCJdmBP2rKw0c | 91 |
lm_eval/tasks/belebele/belebele_arz_Arab.yaml | sha256=WZdVZxI-sAzrCohL0doLX207Yl3-0Pa2UPku23oplBc | 91 |
lm_eval/tasks/belebele/belebele_asm_Beng.yaml | sha256=EDrfMOkBRiRP50MXABZGGfl9SMz6XXNZdyTNUIlTlSU | 91 |
lm_eval/tasks/belebele/belebele_azj_Latn.yaml | sha256=kyJqxP5rlbLeJ8WzzHmAcAlyUuqP-xYZX1HsX13Vxzw | 91 |
lm_eval/tasks/belebele/belebele_bam_Latn.yaml | sha256=ER_d3opMDRffbMdsfhFqfLxkqRpD0m9OBGyPl5grXPM | 91 |
lm_eval/tasks/belebele/belebele_ben_Beng.yaml | sha256=coy8g09IvjBLlK4MjJQ8zy5y4h5PL6gWe_qYw-qIy8w | 91 |
lm_eval/tasks/belebele/belebele_ben_Latn.yaml | sha256=_71L4mUPJpJ_n-fX2jO82kD0yPXsxViO8n-FYFutjms | 91 |
lm_eval/tasks/belebele/belebele_bod_Tibt.yaml | sha256=SZTFC4JLEmXBYsBk0DhQ4gnDQ-pq-ufvoyDuxLDBR84 | 91 |
lm_eval/tasks/belebele/belebele_bul_Cyrl.yaml | sha256=ugTyfxZJuOLviFpvM4CVZZvuOgJsZoPuU5gUVsZV7zA | 91 |
lm_eval/tasks/belebele/belebele_cat_Latn.yaml | sha256=BbtFY_jEsFWKKmSMgnf-QKGZsoimaHrnoZsOPO2aAM4 | 91 |
lm_eval/tasks/belebele/belebele_ceb_Latn.yaml | sha256=T_5piS4b4qNDxhDNoHG5CDOLxQTdCGrE1cUJTFbe8Rk | 91 |
lm_eval/tasks/belebele/belebele_ces_Latn.yaml | sha256=h6I3PwveuUF-5EaTj6JJawB2DqNE6lE5AzcqIyh0JEw | 91 |
lm_eval/tasks/belebele/belebele_ckb_Arab.yaml | sha256=ygsJEXavNs9oXq3OgxNpuziKVZBkg34XOiZy1n8IXyA | 91 |
lm_eval/tasks/belebele/belebele_dan_Latn.yaml | sha256=hH0chUL7_uN90VchIF7trePjQmfLi-CszXaHbRGtXWQ | 91 |
lm_eval/tasks/belebele/belebele_deu_Latn.yaml | sha256=LOUWLhfhzYm11COhrBCwM_7UvNnt6sBmGeK9oWwaDpQ | 91 |
lm_eval/tasks/belebele/belebele_ell_Grek.yaml | sha256=_7AxqIKIENgXyfdLRh6z1BbBnl0FT9QBY4EpYUJwrRk | 91 |
lm_eval/tasks/belebele/belebele_eng_Latn.yaml | sha256=R9L--kN4APc8nwqI3f0KynOozZcyjlrOw3ZNW4dVXRs | 91 |
lm_eval/tasks/belebele/belebele_est_Latn.yaml | sha256=lEogDOCwVjgoGrxVpOHHLwBbXi4AcsKf1rVwYpJU38w | 91 |
lm_eval/tasks/belebele/belebele_eus_Latn.yaml | sha256=0LKGcWpKOVtdLx-gFNGDmqF3fRtboUu9Uz_81FfFwIg | 91 |
lm_eval/tasks/belebele/belebele_fin_Latn.yaml | sha256=JHVc8dlCrEB39C7N2Q_flrXpYYrhiBPMo8MkrNP6ISU | 91 |
lm_eval/tasks/belebele/belebele_fra_Latn.yaml | sha256=r-I9D60zBELCqXzU6lWYwf523JmQayYKJ5uYe7xPbx4 | 91 |
lm_eval/tasks/belebele/belebele_fuv_Latn.yaml | sha256=jzGN1XtByII6M7aJxVppPGiJMlI6SuRI1LQZpteJdPA | 91 |
lm_eval/tasks/belebele/belebele_gaz_Latn.yaml | sha256=Fa-lBKsnvp9yuqJfp86JNYyCRVmcmdFLFEHotw2gkD8 | 91 |
lm_eval/tasks/belebele/belebele_grn_Latn.yaml | sha256=_CVWkWmneyK7E_xuCwWDDJ6Ld873MMUoJkDg2VehG8U | 91 |
lm_eval/tasks/belebele/belebele_guj_Gujr.yaml | sha256=N1npKfH7bvMtRTur8VAXGwkK7Ukaz6sq7eG3LWXomFw | 91 |
lm_eval/tasks/belebele/belebele_hat_Latn.yaml | sha256=gmY4PH67T4OGN8hAjjxUF6MbeL7Z3P17apeoj8Xd-_4 | 91 |
lm_eval/tasks/belebele/belebele_hau_Latn.yaml | sha256=jH9GqFQBSZLyt6u02-iYSATHdCNViYotSGdE0xJn8o4 | 91 |
lm_eval/tasks/belebele/belebele_heb_Hebr.yaml | sha256=a5S94H9NWFF6FAHIiNVEfWI_6xztApTWTnw1o_5Ue1o | 91 |
lm_eval/tasks/belebele/belebele_hin_Deva.yaml | sha256=_2JJZHR6yzLCAt-S3w6Nu-twxe2yLwNxFA2xrSinftg | 91 |
lm_eval/tasks/belebele/belebele_hin_Latn.yaml | sha256=abUpXopa4MU6M1dJnElq6QXsgeOYD4JS30bJYnUUEOk | 91 |
lm_eval/tasks/belebele/belebele_hrv_Latn.yaml | sha256=93JpE33R0DlJs7PhqBY5LPmYunLKyB7waBGQbcw7XJ4 | 91 |
lm_eval/tasks/belebele/belebele_hun_Latn.yaml | sha256=SM-mXpTh_fZxwY6K4iwNCuf1d7A1fjvzd4MA34_mFoc | 91 |
lm_eval/tasks/belebele/belebele_hye_Armn.yaml | sha256=HqZKUvZvOH4c7Rp73vi_ZY3lHEyqbVmeE9ZMwVE1RUA | 91 |
lm_eval/tasks/belebele/belebele_ibo_Latn.yaml | sha256=ZhPEiau2oRF6o9-Ah9Q5G7TjtdtQ_f71KLwpMOx4qU4 | 91 |
lm_eval/tasks/belebele/belebele_ilo_Latn.yaml | sha256=2NKsKbkvqbWtifyrm2pCbDA-i4xqT6SBlqEI6RWyWrY | 91 |
lm_eval/tasks/belebele/belebele_ind_Latn.yaml | sha256=elVyRmhsurYpvvpS32J1nDB9MaKIun0u-wXaRnD0Itg | 91 |
lm_eval/tasks/belebele/belebele_isl_Latn.yaml | sha256=9AQRTj03LSsOlNEYbTHOFYizjqV-c3JRKxbUD95D6ic | 91 |
lm_eval/tasks/belebele/belebele_ita_Latn.yaml | sha256=hAlvHbe0lAiYSLk55u8wcu42Bvew-3tx_VRikWJet6w | 91 |
lm_eval/tasks/belebele/belebele_jav_Latn.yaml | sha256=Esb4rEenIWi1-5XjxkxtSFJpkhOeUo3I-kuFE4GimPc | 91 |
lm_eval/tasks/belebele/belebele_jpn_Jpan.yaml | sha256=QOsHmPRfOL4Dfa0CTCulVKwUqSk6fjsfwsALFyxlGhM | 91 |
lm_eval/tasks/belebele/belebele_kac_Latn.yaml | sha256=UKTr7xD-S36Hbreg3CThwM5zOf_nMamUqsox5cG0zIg | 91 |
lm_eval/tasks/belebele/belebele_kan_Knda.yaml | sha256=T3S3_u3K2oTf0aMr8S6HOE3u8tQYwCgNLPpq3jafyHU | 91 |
lm_eval/tasks/belebele/belebele_kat_Geor.yaml | sha256=w0jg1efNDA8qjHoRijv9IKYR7n2ol8RLbegB9qmNqC0 | 91 |
lm_eval/tasks/belebele/belebele_kaz_Cyrl.yaml | sha256=hn1gMsR4uFqyKgPYkLIaRyfApNPG8jRwoaR52GgDYs0 | 91 |
lm_eval/tasks/belebele/belebele_kea_Latn.yaml | sha256=nmwDctP-ynDRCoVY4OBusmz3djOak7MXFevVTIi0LNE | 91 |
lm_eval/tasks/belebele/belebele_khk_Cyrl.yaml | sha256=lRL6tZXq3W8jd8BJtqzMEgRLavow6aBqQ-YmT1yGBFU | 91 |
lm_eval/tasks/belebele/belebele_khm_Khmr.yaml | sha256=HGUdlMIWXQcUGMhfhJrNjgvuWZLHLv2RVAE3NuN3yrU | 91 |
lm_eval/tasks/belebele/belebele_kin_Latn.yaml | sha256=ULAoyU4HRxrqEH_EvuvO-CRoUPVSxd1M3AkYeAjoQqU | 91 |
lm_eval/tasks/belebele/belebele_kir_Cyrl.yaml | sha256=np0BzHCK5_MLK_7W703_9aSmAUQ-vQ1hhRwUtO-q0cM | 91 |
lm_eval/tasks/belebele/belebele_kor_Hang.yaml | sha256=Gt5b_xr-8xUFIby0HfpOiCrmoUIKYWRggMgZnBF1yZs | 91 |
lm_eval/tasks/belebele/belebele_lao_Laoo.yaml | sha256=Roo6K8H2i1-OUC4r1O4OfjDq7AT1iV5DlsvxtXAso2A | 91 |
lm_eval/tasks/belebele/belebele_lin_Latn.yaml | sha256=0Kh7w_vBnY67NsBGg5uM8esZE5U_aw7kKK8ewERyqVc | 91 |
lm_eval/tasks/belebele/belebele_lit_Latn.yaml | sha256=ssqiT2rCbWhpXr-QSTChWaszmAVHr2f9vyVEOa8GUew | 91 |
lm_eval/tasks/belebele/belebele_lug_Latn.yaml | sha256=MUuk0_l6lMMjBIWdaaQwNUpP_sCh52Zo6OjNNmHQE8I | 91 |
lm_eval/tasks/belebele/belebele_luo_Latn.yaml | sha256=frNv5QfgXY2aeveQpI39p6-_VtgRL2t1CQkz52xwFmQ | 91 |
lm_eval/tasks/belebele/belebele_lvs_Latn.yaml | sha256=vASDjUI9MRrxetYKI3LzkAo3Tzijwlsia3_C-t8F-KM | 91 |
lm_eval/tasks/belebele/belebele_mal_Mlym.yaml | sha256=7wSUVHj9h4YZPXrmy6yQ9iJIFvCCJj7Im4iFzKKkEqU | 91 |
lm_eval/tasks/belebele/belebele_mar_Deva.yaml | sha256=VLXB1q176NiW3z3JYnGzytfOm-W1ICMKanVLn4BxyOE | 91 |
lm_eval/tasks/belebele/belebele_mkd_Cyrl.yaml | sha256=4uaqgqFMpimzYaJcpMV1IRZPlMB_ZBm92K7HaHLCCBw | 91 |
lm_eval/tasks/belebele/belebele_mlt_Latn.yaml | sha256=MNy7mnYwW7CFUlBVPq9vK_aC9n8oTed9A8pD8o83Mqs | 91 |
lm_eval/tasks/belebele/belebele_mri_Latn.yaml | sha256=msQfpR5hhfnJuabeDqL0QI8xZZ6gX6w3ZzLe9-j4jL0 | 91 |
lm_eval/tasks/belebele/belebele_mya_Mymr.yaml | sha256=ZUssWoiB3X629KQOGbBvfW2QD00qZurGDcp73P3SrfA | 91 |
lm_eval/tasks/belebele/belebele_nld_Latn.yaml | sha256=vySt0ttcucmjOoyCiblXU1aEL40x0Qw3qxka4RnuHEo | 91 |
lm_eval/tasks/belebele/belebele_nob_Latn.yaml | sha256=2smEeqTVxaWtTB-cuYHJqcAaaW9BC24gjMAYZUWi4_0 | 91 |
lm_eval/tasks/belebele/belebele_npi_Deva.yaml | sha256=EAy-sUWJR7E8K4BKUDzseGcFm0f1MzqgLuwvk8Qd7NA | 91 |
lm_eval/tasks/belebele/belebele_npi_Latn.yaml | sha256=YxzICLHiY0C-BlkKOOtNb8oYE06aVFCOCqEuDB6aefU | 91 |
lm_eval/tasks/belebele/belebele_nso_Latn.yaml | sha256=DhVXJpncGAFXZo1hhYRrU69WoMZ3iERVIAVrsNBb0d8 | 91 |
lm_eval/tasks/belebele/belebele_nya_Latn.yaml | sha256=nu2p41Mjc3jclhyazDcvPWV2Nijh6-5B7wpCZhI2iq0 | 91 |
lm_eval/tasks/belebele/belebele_ory_Orya.yaml | sha256=jMgldlzR8VxGztyDlmAhiawaDvgcC2zhVEYAVhQ_d9E | 91 |
lm_eval/tasks/belebele/belebele_pan_Guru.yaml | sha256=vQgWIaTD5IRX6ok1qbFzYRB03ewHg59a89cMVdAVqgs | 91 |
lm_eval/tasks/belebele/belebele_pbt_Arab.yaml | sha256=GggP-ghr374RrMiOPXJS14vLeEjAoJ4tMLgUKT_Tu3U | 91 |
lm_eval/tasks/belebele/belebele_pes_Arab.yaml | sha256=FBhSUWQVtsvzTJMsvwHyAqauLVfnkp5ZUQdtUea1vTw | 91 |
lm_eval/tasks/belebele/belebele_plt_Latn.yaml | sha256=rafD0UNBsOROG58AHBE7g9w7NeiXVRgJxPXpuGZMvV4 | 91 |
lm_eval/tasks/belebele/belebele_pol_Latn.yaml | sha256=lwDvqICyyeDk8Cmw6PqqyDr8xkgepEMD3OreqhaDxU8 | 91 |
lm_eval/tasks/belebele/belebele_por_Latn.yaml | sha256=lbwymZJ9ehgalGGS0MfVY6ZYGAa7LFHzuAcFNN9fcBI | 91 |
lm_eval/tasks/belebele/belebele_ron_Latn.yaml | sha256=A_XHynzgIUv14VMFRc2vsbmI1aobv_1z7gBnSFNUC_s | 91 |
lm_eval/tasks/belebele/belebele_rus_Cyrl.yaml | sha256=HKwQ0iWaxH79PptSxPTj_fP5Tx1PoD0NQj5Yuh4wQqk | 91 |
lm_eval/tasks/belebele/belebele_shn_Mymr.yaml | sha256=QYO1Ru9r0kx5q6Le86eMXAIGHiH97WfYKctWC7LSSWc | 91 |
lm_eval/tasks/belebele/belebele_sin_Latn.yaml | sha256=Iee4J52z3qc1qUrnWLLaXWu4pWVbb78d_elBtwn8qVA | 91 |
lm_eval/tasks/belebele/belebele_sin_Sinh.yaml | sha256=A3WP32SjGZUvEqlW-jtUo_D01ndKdBAnaXf7Ch6xcCg | 91 |
lm_eval/tasks/belebele/belebele_slk_Latn.yaml | sha256=lnVUaRTEQbZc5N7nXFvcVq0rhxz3qlbtFMVJfwuhg8Q | 91 |
lm_eval/tasks/belebele/belebele_slv_Latn.yaml | sha256=Jgifx7F90TXd4gWCLFCMvTF4Oqq43Lt6v-26Q4v7NQU | 91 |
lm_eval/tasks/belebele/belebele_sna_Latn.yaml | sha256=TpVU1bN3hzP1NSfSOdRHPpcJmFIucz0BqBNStyX2WMI | 91 |
lm_eval/tasks/belebele/belebele_snd_Arab.yaml | sha256=utO8s7yEbiVqxgxFddCpiCxCX4DMJm_soW1WFT3XWyc | 91 |
lm_eval/tasks/belebele/belebele_som_Latn.yaml | sha256=LrTyXBAiSRrm6uypQGwBYIgkgeniOx2Qqw6BxHeYCl8 | 91 |
lm_eval/tasks/belebele/belebele_sot_Latn.yaml | sha256=EO2AtJA5W9RJNj7bIpnU-vG-Y2lETHClt0gfFXEe1Is | 91 |
lm_eval/tasks/belebele/belebele_spa_Latn.yaml | sha256=qBGiMl-10UdK0ysM1b7kwdaBqA7wgozgiZAPEuTBdyE | 91 |
lm_eval/tasks/belebele/belebele_srp_Cyrl.yaml | sha256=mRzdW_Jxs6LmSzFk6lrLaLeqBf9hUuxi4EQKwt0yEVo | 91 |
lm_eval/tasks/belebele/belebele_ssw_Latn.yaml | sha256=WoSk2-REWD-ZeO8CD8D6ZLI9gmw5ZWyMAiLfSgmSSII | 91 |
lm_eval/tasks/belebele/belebele_sun_Latn.yaml | sha256=J5Wo9tFM-rOM5sXGRTRgZmLlpJ5Wibo4-7FWO-j5cbk | 91 |
lm_eval/tasks/belebele/belebele_swe_Latn.yaml | sha256=FI4M0mhKPhlLn1JHUzoiOHosBL3cxljEMOYt_AvKVvM | 91 |
lm_eval/tasks/belebele/belebele_swh_Latn.yaml | sha256=GLkhU35MOb_lU7toxPltKDYNMqKTKdHHR1-uQAs4RT4 | 91 |
lm_eval/tasks/belebele/belebele_tam_Taml.yaml | sha256=v00AUECmZ6_2Z_zN5Th6NZ4qJL-kDoSV3vKccdLuA2k | 91 |
lm_eval/tasks/belebele/belebele_tel_Telu.yaml | sha256=wDyQeyCRHdRWxK0qOOFzmHfZRBzWe77fsNXm0ilkU0A | 91 |
lm_eval/tasks/belebele/belebele_tgk_Cyrl.yaml | sha256=skj1sVMEWLHqaVqZnZMcPREi9LVJGR1lnPOpjRQiCPI | 91 |
lm_eval/tasks/belebele/belebele_tgl_Latn.yaml | sha256=Jww_oK--iUun7y2HU2Y5c4KT5jWc1gL5LKiJrwSqPyc | 91 |
lm_eval/tasks/belebele/belebele_tha_Thai.yaml | sha256=tzzzd92lHGPwS7WQx7NYDPPOAM40AOXuJrrfdu_QM4Y | 91 |
lm_eval/tasks/belebele/belebele_tir_Ethi.yaml | sha256=fLNXVRsM-mqvGyPILDypxsRPo7pNqOe-NlmwlUP2gZU | 91 |
lm_eval/tasks/belebele/belebele_tsn_Latn.yaml | sha256=VVTQLv1w24rO3bxBa5M1Ar8oHWWSLHNPTZBMSQWAUig | 91 |
lm_eval/tasks/belebele/belebele_tso_Latn.yaml | sha256=Ee0NqJ5aLFxEO8VGbdmuXSxqAUG1zpM23UcoobKN4O0 | 91 |
lm_eval/tasks/belebele/belebele_tur_Latn.yaml | sha256=kxjLMNZ6S9Fu8gyE8T1ioZy0jU11s9LKUSMWP7msckk | 91 |
lm_eval/tasks/belebele/belebele_ukr_Cyrl.yaml | sha256=v3u0WSR-upMpqipSAcl1OaO1EjEjC8bLvqaidZn_S2w | 91 |
lm_eval/tasks/belebele/belebele_urd_Arab.yaml | sha256=gYS1_4TM55eqF61mS6wJ_P-BRrin1UUzdAyLh2EE8Gg | 91 |
lm_eval/tasks/belebele/belebele_urd_Latn.yaml | sha256=Zf-yWExiIHwdg3ZEptVt9UFdAPNrMQ4mT91z_Pxg7tU | 91 |
lm_eval/tasks/belebele/belebele_uzn_Latn.yaml | sha256=gyW5vIumvBxcQPU8nHHZdtEo15js2SxRHp7_8LRyJHM | 91 |
lm_eval/tasks/belebele/belebele_vie_Latn.yaml | sha256=QtJ6AY9rfZ-8tMpfE5SuViFLbT2Z2CJccols9MVtX9Y | 91 |
lm_eval/tasks/belebele/belebele_war_Latn.yaml | sha256=J_TCP5gGo-xO-pRb2OjTag6Bwqfn2AQzx1zahTPounk | 91 |
lm_eval/tasks/belebele/belebele_wol_Latn.yaml | sha256=HgwnqNvnJeJ5HDj3RXu2EN95KL2J79XvD10rQDXLf_w | 91 |
lm_eval/tasks/belebele/belebele_xho_Latn.yaml | sha256=6IlzDKrmH2L0_Vin9oeuECeemZw8HZqlGaAgGzWjUcA | 91 |
lm_eval/tasks/belebele/belebele_yor_Latn.yaml | sha256=jHNbrC5cSihutTMqZ30lRnUqUpS0a3GMlkWDm1sncVE | 91 |
lm_eval/tasks/belebele/belebele_zho_Hans.yaml | sha256=hPitpDdrgoeI92CpLgV6Xh_HDnyFMme7db3wVdPm5u8 | 91 |
lm_eval/tasks/belebele/belebele_zho_Hant.yaml | sha256=z4MihqyMapFQgZFwHEu7AzZcxwWHrkJl5-sVP3e9Ax0 | 91 |
lm_eval/tasks/belebele/belebele_zsm_Latn.yaml | sha256=6sB28pzcVRF_uchM-FTFg4e6_noikkGH6RBufu3UlvY | 91 |
lm_eval/tasks/belebele/belebele_zul_Latn.yaml | sha256=rdOR6JlGBq0O39DIkG24PTYn1ZLne3RHfwoB2N0_Imc | 91 |
lm_eval/tasks/benchmarks/minerva_math.yaml | sha256=lb2Yn4TfnswputGzd0vO4yX4YpfqZp-drdOfWViJA80 | 231 |
lm_eval/tasks/benchmarks/pythia.yaml | sha256=xb6ysr5Wkze05aUl0DS6aKWKN4d3-WBXHInrmE3Q4Uk | 135 |
lm_eval/tasks/benchmarks/t0_eval.yaml | sha256=NfW-WLp-pnT4hQrmNyO1Du6DHVscevER86MHVSf_zVE | 3491 |
lm_eval/tasks/benchmarks/flan/flan_anli.yaml | sha256=-Got1Sly1RkTQBiYLvMewadvXeGIaa8fiAs8D63xTx8 | 518 |
lm_eval/tasks/benchmarks/flan/flan_arc.yaml | sha256=NwSMhVR4K65vRetXuV-HJSNWFed6FiMVb1L2t6aJpVw | 430 |
lm_eval/tasks/benchmarks/flan/flan_boolq.yaml | sha256=ukZSIbaVpbo47USX7iHspLD6BG-WdVB4pUEQnA5vy9k | 206 |
lm_eval/tasks/benchmarks/flan/flan_cot.yaml | sha256=8Y42MCfUVBsA7ug5ZGHUr6t_QQZtGcQSUe6qz_AqHaE | 324 |
lm_eval/tasks/benchmarks/flan/flan_held_in.yaml | sha256=54UtxDpen7cyEhrYewAwDmMwk8z6ZV95K8oSV88Egis | 81 |
lm_eval/tasks/benchmarks/flan/flan_held_in_yaml | sha256=2fYqhneej_oDB7vZ1pXn6k9Cpb6-O_y0t_zwgFLpkRE | 1359 |
lm_eval/tasks/benchmarks/flan/flan_held_out.yaml | sha256=k7ZthUTsamEKMPqROcL3A4vLrEnwIDegrlQ61qHBjLo | 267 |
lm_eval/tasks/benchmarks/flan/flan_rte.yaml | sha256=0RMlDNSIDFu9W0roJIqx-8Tb33GQmxygQ6IstVzkKuA | 200 |
lm_eval/tasks/benchmarks/flan/prompt_templates/anli.yaml | sha256=Q6OzO9PZtNucARl_tJUWFmqOfKnnILM93RvzLkB5ehY | 2437 |
lm_eval/tasks/benchmarks/flan/prompt_templates/arc.yaml | sha256=B734F0fpAgAbdJ0aIGq6BrtYxViJ1tFZNonXQi2BkCs | 1407 |
lm_eval/tasks/benchmarks/flan/prompt_templates/boolq.yaml | sha256=RN2SfDJsnQC5nhJy4-KtQvZTx_v_uRG-04xQo3JY0CA | 1859 |
lm_eval/tasks/benchmarks/flan/prompt_templates/rte.yaml | sha256=_kDkSfOxo_8pmN4xrMJqEU8kfKQXNyhyRrFduiA8Ga0 | 1941 |
lm_eval/tasks/benchmarks/flan/yaml_templates/cot_template_yaml | sha256=rErr7w509-Kb2RodVJwltKPpS36FbpBiKdCFbf8HT_k | 429 |
lm_eval/tasks/benchmarks/flan/yaml_templates/held_in_template_yaml | sha256=w8KXee5JStS9AIDlb-fBEZ1Y2rj36xObBc6B2EfJj84 | 222 |
lm_eval/tasks/bigbench/README.md | sha256=-S-u9m2fxpIOoIvS4K1LS2Td3WfjFw4XFh6FnJXOGWM | 9772 |
lm_eval/tasks/bigbench/generate_tasks.py | sha256=bXI5oOO8j8HA6IHMuYAdJ8uU1sMkgOe2q2hcDAgtZgw | 5576 |
lm_eval/tasks/bigbench/generate_until_template_yaml | sha256=VqdG7BB_DKXLOzTaGLkj9pP1SHas0MR3Pz2tOuAOlLs | 509 |
lm_eval/tasks/bigbench/multiple_choice_template_yaml | sha256=ccOR0ox0VwbgBQOO69jZDyp56I0096dH0KdH9dC6Ltw | 504 |
lm_eval/tasks/bigbench/push_bigbench_dataset.py | sha256=z_8s7JS4L97fkdVyDVMnbyrb_f2OjlBgz2ke4s0foV0 | 1036 |
lm_eval/tasks/bigbench/generate_until/abstract_narrative_understanding.yaml | sha256=0QLUsd46oJza1RWtto1OHpdpxd8r79lLZJ-8eFNw5ZY | 185 |
lm_eval/tasks/bigbench/generate_until/anachronisms.yaml | sha256=T1Fc7bNpFatJyeTOAZ61FOA_vQkkMwPpgFLvEe3tMGE | 145 |
lm_eval/tasks/bigbench/generate_until/analogical_similarity.yaml | sha256=I-HNuu_mTxqRNiAGpiyEpoMbm4ViZJpd8tdPD-fkW5g | 163 |
lm_eval/tasks/bigbench/generate_until/analytic_entailment.yaml | sha256=4IpGceDe68otlD7i617DSBXqhw067Y4AjpYVWYnfURU | 159 |
lm_eval/tasks/bigbench/generate_until/arithmetic.yaml | sha256=--6zcCrvHwjcE1SSujrnoCHDXpTo4c2CT9sosctJ0qY | 141 |
lm_eval/tasks/bigbench/generate_until/ascii_word_recognition.yaml | sha256=QhBAm87LFXXIztQjATqtE1QG2s3JOkADRvbiASZcsOM | 165 |
lm_eval/tasks/bigbench/generate_until/authorship_verification.yaml | sha256=J7qQUerJLmxVwptNTbsFlZrDn3WWjxyA-i6aDY-iQ7I | 167 |
lm_eval/tasks/bigbench/generate_until/auto_categorization.yaml | sha256=ZSVByX3aUgSSa_dUYHfJvm6bX6ID5iFF9pZodjWzudI | 159 |
lm_eval/tasks/bigbench/generate_until/auto_debugging.yaml | sha256=EwWe_JEyKN8cQTnhvMFV2T40Td2Igaq0rWuvm9VFVaU | 149 |
lm_eval/tasks/bigbench/generate_until/bbq_lite_json.yaml | sha256=x7II4n0ImBk4HwpbXn6Dap0no5YBdrizIo3qqeoIstQ | 147 |
lm_eval/tasks/bigbench/generate_until/bridging_anaphora_resolution_barqa.yaml | sha256=QFdj_nZPzivXQ_99MACTqsq_hNqpOXwAv0JBvnKZQZU | 189 |
lm_eval/tasks/bigbench/generate_until/causal_judgment.yaml | sha256=f9fiw28Jp_YEeRgrbmUG8dwtt7l6Up22-1-r-uhDyuY | 151 |
lm_eval/tasks/bigbench/generate_until/cause_and_effect.yaml | sha256=5GlQQ-CAgOwXPypYnjRMpdyZ7fA4a-x6REDBEPpmFGo | 153 |
lm_eval/tasks/bigbench/generate_until/checkmate_in_one.yaml | sha256=eWi6zh5n4gwBcE3J7IMiyNttiy2EYvOTAcMMB3Q33lI | 153 |
lm_eval/tasks/bigbench/generate_until/chess_state_tracking.yaml | sha256=anlmDNc-UuKZhgvd4bGHfnloD0817tEiYWuoMBrstVI | 161 |
lm_eval/tasks/bigbench/generate_until/chinese_remainder_theorem.yaml | sha256=hUIYsvTxDFpXOBBR3rc5ByHjK-kCr0IJuYD4-uCEeqU | 171 |
lm_eval/tasks/bigbench/generate_until/cifar10_classification.yaml | sha256=E96IQAlynQhHjAYzJh3CIy3o1oF5Np0onr3Y0G0dS1Y | 165 |
lm_eval/tasks/bigbench/generate_until/code_line_description.yaml | sha256=EbyOJ6tcfb56fDC7jKERqViylqMzNZReN5N4tFrp054 | 163 |
lm_eval/tasks/bigbench/generate_until/codenames.yaml | sha256=RHFfLNH_PvBByvta_z2FSqC0MgA5V7lr6ORRJN5IjO0 | 139 |
lm_eval/tasks/bigbench/generate_until/color.yaml | sha256=V66z_3cDIsLWHt7cHqnPGfFFvgVBypj-jqW60l4WGy0 | 131 |
lm_eval/tasks/bigbench/generate_until/common_morpheme.yaml | sha256=DMnQE0PnPan9Z10yajvyM6AnDz2SNKrmID06eKfW-aU | 151 |
lm_eval/tasks/bigbench/generate_until/conceptual_combinations.yaml | sha256=wN2KQGaT9pun0hOWwe3jrAkjh2lZScYr2jJtiKfPiCA | 167 |
lm_eval/tasks/bigbench/generate_until/conlang_translation.yaml | sha256=-HU-3JkFMpn4vPatZMO3gA6vAJBfdc5XISmYzTDIuMc | 159 |
lm_eval/tasks/bigbench/generate_until/contextual_parametric_knowledge_conflicts.yaml | sha256=CgIDUv6CCJ07FK6H_ATyzqHq8uy_p4ktGWawP8Bmy64 | 203 |
lm_eval/tasks/bigbench/generate_until/crash_blossom.yaml | sha256=_kEHp_E3G1AXRC0UsLL6LLJN0o7OXpaobTZl9idnP9w | 147 |
lm_eval/tasks/bigbench/generate_until/crass_ai.yaml | sha256=Gjf50yyrvFYa2uCcpcu6IJEw4_GpvPtLaIt_dHSgKiw | 137 |
lm_eval/tasks/bigbench/generate_until/cryobiology_spanish.yaml | sha256=tIqxreR7fTTOmPbYthVH-SEuzjgJQhfAdm7wkQx_CPw | 159 |
lm_eval/tasks/bigbench/generate_until/cryptonite.yaml | sha256=5QWZppWvBkcS3wifv3cihe1fCKTZnwVvmtifEkPjgbE | 141 |
lm_eval/tasks/bigbench/generate_until/cs_algorithms.yaml | sha256=Bs4PE7GgZLTX3cPlHHaFqcDmmoEfUOc5V_Gmipya7ls | 147 |
lm_eval/tasks/bigbench/generate_until/dark_humor_detection.yaml | sha256=u98XLx00QqxUlZyScZSaDghGG2XNblgVvQMYLzWW-5I | 161 |
lm_eval/tasks/bigbench/generate_until/date_understanding.yaml | sha256=ikMqfOMsIQ5sMEu5F6jmiPZ1QIk55BMoWgPmlD2YZZc | 157 |
lm_eval/tasks/bigbench/generate_until/disambiguation_qa.yaml | sha256=3AfjnL9sxOL7-mS00bAMCer8ytGaceP-AEVKJ036qCg | 155 |
lm_eval/tasks/bigbench/generate_until/discourse_marker_prediction.yaml | sha256=IDsWjfdbnWGCmPZOPXF1cCqoae05UYLPwO2FJ2SqHVE | 175 |
lm_eval/tasks/bigbench/generate_until/disfl_qa.yaml | sha256=slBKpOw28f7O4FrQjm43gqzcHgOB9-2ysKGTlOXcIt0 | 137 |
lm_eval/tasks/bigbench/generate_until/dyck_languages.yaml | sha256=Nf4uiVjkZB78bKbFEbnXRE3-4eTd4oHhWOAQsg4zOsY | 149 |
lm_eval/tasks/bigbench/generate_until/elementary_math_qa.yaml | sha256=cvAGFFzJcYgDKDmdDfWoJxpPfGYcoH5YKM6hJv-504o | 157 |
lm_eval/tasks/bigbench/generate_until/emoji_movie.yaml | sha256=xE60hkJ3GUO1IzxA5kyWTgQGN8MdpsFL6U44ABSzpgQ | 143 |
lm_eval/tasks/bigbench/generate_until/emojis_emotion_prediction.yaml | sha256=XmwhQbFtBGHBvKcFeBNyaVvGZntHdIveeRV_6cdr7Wg | 171 |
lm_eval/tasks/bigbench/generate_until/empirical_judgments.yaml | sha256=kjuLT2A-PhCTmqnBMu0msAkVL09fHHoTpszp-2Rmvxs | 159 |
lm_eval/tasks/bigbench/generate_until/english_proverbs.yaml | sha256=C-ssB8SgXTSpWuxyjMBTQX9mBwKvHNNzO4nYcVauhjc | 153 |
lm_eval/tasks/bigbench/generate_until/english_russian_proverbs.yaml | sha256=jN-poiQ4U4UCdcHf7RMV6hcZBoKFEvuzdkxBUqD4uFY | 169 |
lm_eval/tasks/bigbench/generate_until/entailed_polarity.yaml | sha256=_gaT1mv0iFYNMbZTGfWeifF6TB8KxASgiyEeXY0vrH0 | 155 |
lm_eval/tasks/bigbench/generate_until/entailed_polarity_hindi.yaml | sha256=RE9kwhgved0dXeKgFCjeFtETtB9FuTgL94iiNSExJj0 | 167 |
lm_eval/tasks/bigbench/generate_until/epistemic_reasoning.yaml | sha256=J-n430fnOd4kw4zRySnYYUG-e7GnxadwVAtqU3S8NRc | 159 |
lm_eval/tasks/bigbench/generate_until/evaluating_information_essentiality.yaml | sha256=6fKxC324hKwqkpV_6MTNNsLicGevovD1iKDflOtOzhM | 191 |
lm_eval/tasks/bigbench/generate_until/fact_checker.yaml | sha256=QZ2tsTKpy93PWKXM-cPAdzSKXsYtspGFyQqQXM8QNSY | 145 |
lm_eval/tasks/bigbench/generate_until/fantasy_reasoning.yaml | sha256=JWzZtrvKJaXfBrC8-B2ClPUze2704DVXUpWioHKCo0M | 155 |
lm_eval/tasks/bigbench/generate_until/few_shot_nlg.yaml | sha256=jGqGMoegdMocHCIyV2HDHm6yrf-7h4N8JnzI028bWmY | 145 |
lm_eval/tasks/bigbench/generate_until/figure_of_speech_detection.yaml | sha256=l3ohFveEUwi8QceVaX1Ubpo0bgaJOJkmN20oFENc4GE | 173 |
lm_eval/tasks/bigbench/generate_until/formal_fallacies_syllogisms_negation.yaml | sha256=VW2iLQzYRtTXjvrCa2Xnz8wlpIyPhUvMfAf_3W_rHZg | 193 |
lm_eval/tasks/bigbench/generate_until/gem.yaml | sha256=ODcWuReD_irTxL7Om0YX1lwUPdgTvS4gfnq64_9RT9M | 127 |
lm_eval/tasks/bigbench/generate_until/gender_inclusive_sentences_german.yaml | sha256=N6yiMVWfYnYWXAku7GSw7PAw20_GJevKEF7Nln9s20o | 187 |
lm_eval/tasks/bigbench/generate_until/general_knowledge.yaml | sha256=0FoVsz9_Whmets9lZh3vpd7TxwclRTFMIT8tpn2iTqk | 155 |
lm_eval/tasks/bigbench/generate_until/geometric_shapes.yaml | sha256=tVKuLRsEGC6QEZINH_MJL9ouuGxYBuBcIoqf8Ry1CB0 | 153 |
lm_eval/tasks/bigbench/generate_until/goal_step_wikihow.yaml | sha256=HefVYueV7Ib4olhFiPSnN-4tKk-wm2-TTOJZq13zDiY | 155 |
lm_eval/tasks/bigbench/generate_until/gre_reading_comprehension.yaml | sha256=imJmoGVFj12Yw1LFVNvOwMqmcjvPC0SfBwptLaX_Rj0 | 171 |
lm_eval/tasks/bigbench/generate_until/hhh_alignment.yaml | sha256=u9i_BMm0zJiWEkU_IL36D1nf9TLqGXArxICZoMmyn6g | 147 |
lm_eval/tasks/bigbench/generate_until/hindi_question_answering.yaml | sha256=ed9fUg5xV9JFW_pI9slzBepyiTu-v1s5s3zu_M7JlCE | 169 |
lm_eval/tasks/bigbench/generate_until/hindu_knowledge.yaml | sha256=GyJkeBgssT8R04bTdYSQM4oa4v8JWpa2ILwVTvLjOyI | 151 |
lm_eval/tasks/bigbench/generate_until/hinglish_toxicity.yaml | sha256=F4y708uc0l1a5o1M6s_kSCpYNl3ivpwfWAgO7usZ8JQ | 155 |
lm_eval/tasks/bigbench/generate_until/human_organs_senses.yaml | sha256=AeQZPk72WRN9G2pj31CvgKiDEbEjSGMppYhni2Q_sVs | 159 |
lm_eval/tasks/bigbench/generate_until/hyperbaton.yaml | sha256=m_cFalqyG6dq_RoMUzTV9fiTFQQ2BssZfG071Zezlzo | 141 |
lm_eval/tasks/bigbench/generate_until/identify_math_theorems.yaml | sha256=buqbBDN-gZJY8mnG2IRHpUPbEFgz4e2amo_c1uQmIvE | 165 |
lm_eval/tasks/bigbench/generate_until/identify_odd_metaphor.yaml | sha256=EoTWJfETPJQIKFScOELfBno5wGMM0KSRUp5Ck8wDh_A | 163 |
lm_eval/tasks/bigbench/generate_until/implicatures.yaml | sha256=XDY-X3eUplOlnEY2WZis1uGjSU0GLg85c7krqgsGQg4 | 145 |
lm_eval/tasks/bigbench/generate_until/implicit_relations.yaml | sha256=AxXDlJDpf_YQKJpvifStiRPiehlDl3L8_bo8i4EtY-c | 157 |
lm_eval/tasks/bigbench/generate_until/intent_recognition.yaml | sha256=QSsKdp83MAfBu2LSLUx2dPt1mENEZ5s4O3to4ntZolM | 157 |
lm_eval/tasks/bigbench/generate_until/international_phonetic_alphabet_nli.yaml | sha256=bPAQzEm6obZvwbxqzZGCDDKYJhasb9Esv6w7FVS5knI | 191 |
lm_eval/tasks/bigbench/generate_until/international_phonetic_alphabet_transliterate.yaml | sha256=ERiqN2vbxFHM3lbUyvWvm46ydMwxU7y1xa4hur8V3B0 | 211 |
lm_eval/tasks/bigbench/generate_until/intersect_geometry.yaml | sha256=uq6hHt_p6HnyMFMN7XcS6Uhml-Ndv5a5l9TTaSzL-9Y | 157 |
lm_eval/tasks/bigbench/generate_until/irony_identification.yaml | sha256=3Lg0jMAk1-QXMo08j6T4weLkMU1xihyF94-61Y5cjCI | 161 |
lm_eval/tasks/bigbench/generate_until/kanji_ascii.yaml | sha256=ma-v7NMOLxNkdKYoRvL9OuEblQ7-l2O2O9bjPhIbyGQ | 143 |
lm_eval/tasks/bigbench/generate_until/kannada.yaml | sha256=y3M1MBUaQqV6b3cfumpigEoeq9m7j8qu2wqM8mjzeEE | 135 |
lm_eval/tasks/bigbench/generate_until/key_value_maps.yaml | sha256=YBdKpEXYUdrbg2YxcDpTheRCGtA8QQU_kMEyWfGaR7I | 149 |
lm_eval/tasks/bigbench/generate_until/known_unknowns.yaml | sha256=FSMjIyrW6Zq86r6PjPnC7GY7KnWQQukFsSkNRMXkIAI | 149 |
lm_eval/tasks/bigbench/generate_until/language_games.yaml | sha256=4vOMkyvPfKVTI-qWO_FfHnxH66nTN6qROPS5selFR-0 | 149 |
lm_eval/tasks/bigbench/generate_until/language_identification.yaml | sha256=siO1slzacE_Qem-FuA5vwlRqfo_gHZsMCGrIjnA-JlY | 167 |
lm_eval/tasks/bigbench/generate_until/linguistic_mappings.yaml | sha256=9BAFhXST3cS9ktxMTB-qVF7lqN8NNEUN4L4JjhqSH5M | 159 |
lm_eval/tasks/bigbench/generate_until/linguistics_puzzles.yaml | sha256=5KGRhLH_mhvoGwdh_CFQTM5r9dPowCxOHzzzcSAkdh0 | 159 |
lm_eval/tasks/bigbench/generate_until/list_functions.yaml | sha256=On2YeI3r2_s9bblbk-AoVp8jZsdmpH7JPTRxzLbLz9k | 149 |
lm_eval/tasks/bigbench/generate_until/logic_grid_puzzle.yaml | sha256=N7JKcaLTcZIxh6efPHG6grF_-Dia9TLDj6AINFyrgas | 155 |
lm_eval/tasks/bigbench/generate_until/logical_args.yaml | sha256=LeMAv4cqQynPdEgMjbX6DLUuHtE5be7VL3_TRgEBxcg | 145 |
lm_eval/tasks/bigbench/generate_until/logical_deduction.yaml | sha256=cMhraRNkbdmCn70YWUI3L5szUSZxF2BZ9dkb08x3otI | 155 |
lm_eval/tasks/bigbench/generate_until/logical_fallacy_detection.yaml | sha256=Plu8NPXtIwicj-ZOR-s-tUp8sQTRUSidXG13wkiybPU | 171 |
lm_eval/tasks/bigbench/generate_until/logical_sequence.yaml | sha256=oiqHok8TaV88QsPEmUtF8J_mx7XBBOO_kEi6MYFETcU | 153 |
lm_eval/tasks/bigbench/generate_until/mathematical_induction.yaml | sha256=AcUk2gvyYMBR2MXIxiswXjcbv4UITm2CU_RboxlfV34 | 165 |
lm_eval/tasks/bigbench/generate_until/matrixshapes.yaml | sha256=oPNV1qhlRa0CStZy9CCOEyYPM1Q88mk51aJ8EEY-yeY | 145 |
lm_eval/tasks/bigbench/generate_until/metaphor_boolean.yaml | sha256=4pm8zy5rvB_f8jXoTBBLe_0gimdFwt7zkINpHdMztA0 | 153 |
lm_eval/tasks/bigbench/generate_until/metaphor_understanding.yaml | sha256=eTWZ8H4boQ7GHOkRh8JiGNzpqMwV0-jy-pxs3ZEIE6k | 165 |
lm_eval/tasks/bigbench/generate_until/minute_mysteries_qa.yaml | sha256=-106CIqMUWgCr30EoCxvnjL3NnRwgqF4YzkXBjJKm7M | 159 |
lm_eval/tasks/bigbench/generate_until/misconceptions.yaml | sha256=GRaducmwu4DxLeIPTw6fcxOi5aEoNctq09pae_zlmIY | 149 |
lm_eval/tasks/bigbench/generate_until/misconceptions_russian.yaml | sha256=NXz_RMAGdhitHJUrOcyOs3lUJAR3BZczDkNh7wuRbrQ | 165 |
lm_eval/tasks/bigbench/generate_until/mnist_ascii.yaml | sha256=3ft522RKA2O6tkvjKFEUXR_ZeAHZyRmUYAVFacedIYs | 143 |
lm_eval/tasks/bigbench/generate_until/modified_arithmetic.yaml | sha256=tN48_TrYgL6NlmDnAFf4_ynOgjgf59tDjZaFMxiGXhs | 159 |
lm_eval/tasks/bigbench/generate_until/moral_permissibility.yaml | sha256=QWHphy2-qbjA6cVIBkv3jojENR-RtA6dxSFUtTaiMCE | 161 |
lm_eval/tasks/bigbench/generate_until/movie_dialog_same_or_different.yaml | sha256=izDgy0BjGi5gkJdKBFB6MT-vq2x97ktVkQHPYThzXpg | 181 |
lm_eval/tasks/bigbench/generate_until/movie_recommendation.yaml | sha256=Ls68uPStQfEA_cXXoHRltL_of6hPd4LCyz5z2FhAQfo | 161 |
lm_eval/tasks/bigbench/generate_until/mult_data_wrangling.yaml | sha256=tNqxoe0NI87WvxSOPS1JyUr1PCpU-UP-q19tmfeaU9Y | 159 |
lm_eval/tasks/bigbench/generate_until/multiemo.yaml | sha256=ntr6dACBtdAxlsVaCYxQ4ZYEEZ2Q1pf4jF00fiu7HFg | 137 |
lm_eval/tasks/bigbench/generate_until/natural_instructions.yaml | sha256=_W6euf1qNMYGfvy7VFPpSGTllBU3TnvQLEwnIzIjsKs | 161 |
lm_eval/tasks/bigbench/generate_until/navigate.yaml | sha256=SgxFNM3bs3Cbfcw2oE2uBj2vXsc0_NKW-R8n1IPbgMU | 137 |
lm_eval/tasks/bigbench/generate_until/nonsense_words_grammar.yaml | sha256=y7R8xHkK3Fg9Vwbs6MLI7nEk-v_lBkd3Qdpxw1TyKbg | 165 |
lm_eval/tasks/bigbench/generate_until/novel_concepts.yaml | sha256=Uw79SXkiEfDm0za-qLou47Vmp42R5necVDTOmIsNnwk | 149 |
lm_eval/tasks/bigbench/generate_until/object_counting.yaml | sha256=BPtUsBz3xxwrKC38WiDAP0Lz8Boh7rkMC0t4rWobGe0 | 151 |
lm_eval/tasks/bigbench/generate_until/odd_one_out.yaml | sha256=0MPa0ZWseDqQZWxIiUVHPLyHaC0CDqDYP5_VJqML9eI | 143 |
lm_eval/tasks/bigbench/generate_until/operators.yaml | sha256=Xq2pA8FZ1d84z69QD0oXGH7hqs4fMLs-lxZpjwACBgY | 139 |
lm_eval/tasks/bigbench/generate_until/paragraph_segmentation.yaml | sha256=UEraXnlx1L9yNh0qQwsz63wJ0AzYlMwJ-m2NjZEning | 165 |
lm_eval/tasks/bigbench/generate_until/parsinlu_qa.yaml | sha256=BzriiMDmkFzK17iZEYiQmsK_QBfuBewrMNg8Jpanuq8 | 143 |
lm_eval/tasks/bigbench/generate_until/parsinlu_reading_comprehension.yaml | sha256=HRPXjduxFQ66sJImYH00lc7JCNOYvu1Cp1OVpcHtC9Y | 181 |
lm_eval/tasks/bigbench/generate_until/penguins_in_a_table.yaml | sha256=AK27vKzGHc5dZmI_rUOaMb46gqArR93-qFAeWvc0LSM | 159 |
lm_eval/tasks/bigbench/generate_until/periodic_elements.yaml | sha256=W3ru5pbGYHFh3cXAWta5sqN6tPhrfZTr0hmXoftd0uk | 155 |
lm_eval/tasks/bigbench/generate_until/persian_idioms.yaml | sha256=4NV4ESKoI7a7EwwaMoP00HrhbF2n2fFcJDukwkrDjMc | 149 |
lm_eval/tasks/bigbench/generate_until/phrase_relatedness.yaml | sha256=hEoCjBW50vaQcu1EnVRxmHCglXGOJEQITX7ki8oQemY | 157 |
lm_eval/tasks/bigbench/generate_until/physical_intuition.yaml | sha256=4tnrOLP_uEpDciJaSe3bvAyw9V9BiEXIuNmy3CkGMRA | 157 |
lm_eval/tasks/bigbench/generate_until/physics.yaml | sha256=O1CzYMtf6bKfY8xCh8ozpMiGBeKJR2OoDiKnQvS3xro | 135 |
lm_eval/tasks/bigbench/generate_until/physics_questions.yaml | sha256=Y662E9Oe4bGLueoI3htoqKXQohzO5z1siHfkbkX_crk | 155 |
lm_eval/tasks/bigbench/generate_until/play_dialog_same_or_different.yaml | sha256=b2pdgfqb9rmc6zFhFh4OhofhuITnd-CagxP_62YP7_c | 179 |
lm_eval/tasks/bigbench/generate_until/polish_sequence_labeling.yaml | sha256=6syFTfP371tpGL08rlVUPSTGgRYOVs8H6qR-AWwNl9A | 169 |
lm_eval/tasks/bigbench/generate_until/presuppositions_as_nli.yaml | sha256=F8FjUkXb6KO7faXV_OA96c8C8mehFEGr75jng3A7QRE | 165 |
lm_eval/tasks/bigbench/generate_until/qa_wikidata.yaml | sha256=R9dHCcdvg2TzI2ZIyYMz9Va63qrW0XV-3pqDOzAVMMw | 143 |
lm_eval/tasks/bigbench/generate_until/question_selection.yaml | sha256=yy8sqV94vIr97h-srkXC0UXmrn_hCFwfXzuN24T2I84 | 157 |
lm_eval/tasks/bigbench/generate_until/real_or_fake_text.yaml | sha256=BzT3eGjusHCJEkFGUWGKPVHk-Ty-kejnTO09ePPS2-8 | 155 |
lm_eval/tasks/bigbench/generate_until/reasoning_about_colored_objects.yaml | sha256=rHAOlsYCbZi_7Q6CsDJfxHxW-cKMYM108TFrRV6ZtFc | 183 |
lm_eval/tasks/bigbench/generate_until/repeat_copy_logic.yaml | sha256=aMUsLN4oxqceJBjL42m22on1_4S6miTq4zNLWCKHJIE | 155 |
lm_eval/tasks/bigbench/generate_until/rephrase.yaml | sha256=o7I78PrOnUIxqFZ_lNt0twELTMrajUAvI1-HvTM0APM | 137 |
lm_eval/tasks/bigbench/generate_until/riddle_sense.yaml | sha256=eas5Zq3tq1xx03Qn8kB9mU1JbfV-KzY0SWnFTeomy8s | 145 |
lm_eval/tasks/bigbench/generate_until/ruin_names.yaml | sha256=CkUBCb63izgA8XIrA6Ipg_JEsTZUhTd2jvokluiT0ug | 141 |
lm_eval/tasks/bigbench/generate_until/salient_translation_error_detection.yaml | sha256=B4ODGvAsPK_yZhh6tdLwahQedWlrI8C747DnsEtMJ7Y | 191 |
lm_eval/tasks/bigbench/generate_until/scientific_press_release.yaml | sha256=nQqzGRcOY_34eihaI54wGGHxbZmjCiLIlhnTy5NDuRo | 169 |
lm_eval/tasks/bigbench/generate_until/semantic_parsing_in_context_sparc.yaml | sha256=IfY2K5ChSu7wJJocrAcFOqZZ6DJ2UbNQaVu1YmguN4k | 187 |
lm_eval/tasks/bigbench/generate_until/semantic_parsing_spider.yaml | sha256=9NQEKZEqKQIxzTB9yrVOL_n9gdzGCTEh_SM_8d54nxc | 167 |
lm_eval/tasks/bigbench/generate_until/sentence_ambiguity.yaml | sha256=UL89kpxCyDcc80GAvgeyrNSxb7up-Zg2r9vY-DIPOS8 | 157 |
lm_eval/tasks/bigbench/generate_until/similarities_abstraction.yaml | sha256=TJ56BdnL4GqshtCAGMFhnAyoJLakYJjHEg8IjpjUbE4 | 169 |
lm_eval/tasks/bigbench/generate_until/simp_turing_concept.yaml | sha256=VLUMGNwUn7UBmukWVTvm5FpnWwsgI05Sea-mycDxWeY | 159 |
lm_eval/tasks/bigbench/generate_until/simple_arithmetic_json.yaml | sha256=K-mgxW5WEvkTiuPSRLyrOYrQxNsNOKOCxy903yRsAHE | 165 |
lm_eval/tasks/bigbench/generate_until/simple_arithmetic_json_multiple_choice.yaml | sha256=E4ScDHW9xrHYoxX6tHpd9F5TelLTfF1FEkWKjiDrAow | 197 |
lm_eval/tasks/bigbench/generate_until/simple_arithmetic_json_subtasks.yaml | sha256=zrb7SPKYenklYrv5iYEJlhbmoj4hlTsO5LOYzEUaO9g | 183 |
lm_eval/tasks/bigbench/generate_until/simple_arithmetic_multiple_targets_json.yaml | sha256=hj5tcAejMWEqUpKb92vrxZdc3DmgQiV4wTGUxS0Ah_A | 199 |
lm_eval/tasks/bigbench/generate_until/simple_ethical_questions.yaml | sha256=W3Q1UG0OZafvdloI4_6KrKUqBWySFjB86ip0wzq1qCY | 169 |
lm_eval/tasks/bigbench/generate_until/simple_text_editing.yaml | sha256=9tauwNsCUcTjnjjmB7Ci1ffGJfT6kytRqruJQr9OsfI | 159 |
lm_eval/tasks/bigbench/generate_until/snarks.yaml | sha256=-xI33E-A5p91T-56El3AIwWq8BUaCMvea32zq0VzeS4 | 133 |
lm_eval/tasks/bigbench/generate_until/social_iqa.yaml | sha256=m5y4-e6B9_hsHpO4N1xORqWMGNW26zqG4amCwQViMxs | 141 |
lm_eval/tasks/bigbench/generate_until/social_support.yaml | sha256=Rw5LSAeaKSqM4P-Bw7TFuyrH2LQHr4eHJU7iF46_HAY | 149 |
lm_eval/tasks/bigbench/generate_until/sports_understanding.yaml | sha256=THgiCQZQ7uXebiKfUfxMeoRn-wHj9YlbEDzEbUYPFks | 161 |
lm_eval/tasks/bigbench/generate_until/strange_stories.yaml | sha256=jmSfVWMoIj3671y9thmnqV8CRip8gEzxon2NPQy6EVg | 151 |
lm_eval/tasks/bigbench/generate_until/strategyqa.yaml | sha256=pvrWXwq87EQTrLZFlvrZwaUvL5S5fGic7ygFJRXH5cM | 141 |
lm_eval/tasks/bigbench/generate_until/sufficient_information.yaml | sha256=y7jEwlu2P7qgTjNiTJZ9H0jJQjnirAIlZTWVB_n5umg | 165 |
lm_eval/tasks/bigbench/generate_until/suicide_risk.yaml | sha256=tVTkOx8x631h4azG5yEH6k_tx8PINMgp5gJEAJNnsyY | 145 |
lm_eval/tasks/bigbench/generate_until/swahili_english_proverbs.yaml | sha256=p2-DYr3WcFI8WSzoh_6ztyYXPZwK15f1d-XXld6xDsQ | 169 |
lm_eval/tasks/bigbench/generate_until/swedish_to_german_proverbs.yaml | sha256=wR1R1kRuLai6rrIkL_X2qnjFecZpiBqSpE2Sl6_D5wE | 173 |
lm_eval/tasks/bigbench/generate_until/symbol_interpretation.yaml | sha256=4Eg8-UYe6AvRZVvoyw4pWg3G8SLvotH6Y-fy7t-hI5A | 163 |
lm_eval/tasks/bigbench/generate_until/temporal_sequences.yaml | sha256=gJ5NyIda1KbTaZ4DsUKm_TwZDervdNq_rThpzo5lPbo | 157 |
lm_eval/tasks/bigbench/generate_until/tense.yaml | sha256=eorYGhfu6AXOFeGLs2iMWVpoPYm_dyV4slefRIdJ0Zc | 131 |
lm_eval/tasks/bigbench/generate_until/timedial.yaml | sha256=Sp9BMfBIs4Bob-XdxDhqKdL_QVcHDsdj05hyeGp3pBs | 137 |
lm_eval/tasks/bigbench/generate_until/topical_chat.yaml | sha256=rcjpxp2ukXzx8nTEcQr4oYEo7TjiFGnHeYZU5oM12ZQ | 145 |
lm_eval/tasks/bigbench/generate_until/tracking_shuffled_objects.yaml | sha256=SCfecVUi2EGMRzune6kpya491RDXoyct3cbtc7A3C-A | 171 |
lm_eval/tasks/bigbench/generate_until/understanding_fables.yaml | sha256=vH8I0hlKQ5P8cOGUeI91NClne9qMSUTv7vT0wHK0Z88 | 161 |
lm_eval/tasks/bigbench/generate_until/undo_permutation.yaml | sha256=9BHOlfV8xa5kjVW-uM635tkxDlTTuVFfwn5sw1XX8b4 | 153 |
lm_eval/tasks/bigbench/generate_until/unit_conversion.yaml | sha256=wtTHImrbhNRkSHyF-5hQUvBE0Pdn574G5TIdom-VmfA | 151 |
lm_eval/tasks/bigbench/generate_until/unit_interpretation.yaml | sha256=9AHsHkx1dwuL2gfbLq8mduuitpKJgpD38xyWNTpfxPQ | 159 |
lm_eval/tasks/bigbench/generate_until/unnatural_in_context_learning.yaml | sha256=QDLLkgEaTMOQ67huKiLaC1puqfxBcd-W-5U1iIg0aOw | 179 |
lm_eval/tasks/bigbench/generate_until/vitaminc_fact_verification.yaml | sha256=UdngQIP7djwfw3Yr1n8OTDv5c5wa9vLKuuJXm_62Q2c | 173 |
lm_eval/tasks/bigbench/generate_until/what_is_the_tao.yaml | sha256=X2ONz9UFxL975TIiCk-L7C5wDRI3TUxN3LCVzCIBswo | 151 |
lm_eval/tasks/bigbench/generate_until/which_wiki_edit.yaml | sha256=11AwFg-8uyzYs01JdsTlD-76YJTy8QQElnBYtWTxZb0 | 151 |
lm_eval/tasks/bigbench/generate_until/winowhy.yaml | sha256=339YOg_p3fq0a8-5mBkuruJintiUmhe4VzuC4JATV7Y | 135 |
lm_eval/tasks/bigbench/generate_until/word_sorting.yaml | sha256=sw0cqkQkb4K6yuQpa1HTDRPi36uQKfuJDnpTlHvTspM | 145 |
lm_eval/tasks/bigbench/generate_until/word_unscrambling.yaml | sha256=vLuTPnG1BzEJcMQwQF37FNPPcFgw9E73tY6i2Y5ABps | 155 |
lm_eval/tasks/bigbench/multiple_choice/abstract_narrative_understanding.yaml | sha256=wC1sP9TEDVeqNyIH22iaUsotWkGzOTKvbwgiqH968n0 | 187 |
lm_eval/tasks/bigbench/multiple_choice/anachronisms.yaml | sha256=C7Je1VX1Oer2QQZ5oTUDaRrvXNVk0hm1v0i9V5ZizBg | 147 |
lm_eval/tasks/bigbench/multiple_choice/analogical_similarity.yaml | sha256=t7OKYASkSANtBukdp0rCrrb9mRnv9AVymxrpbiOpROk | 165 |
lm_eval/tasks/bigbench/multiple_choice/analytic_entailment.yaml | sha256=INZHBFKntYor3Y5jKmQcpfVfWNzKJa9UnSVP9YwfIS0 | 161 |
lm_eval/tasks/bigbench/multiple_choice/arithmetic.yaml | sha256=2FBfcRxlIlMKiYcZpgbH1SJEdKysdCnqnqafTV4jdMw | 143 |
lm_eval/tasks/bigbench/multiple_choice/ascii_word_recognition.yaml | sha256=dWZZsykMhM60NfZVwuca4ZCsRMyIQm2y7xal9j5N0R8 | 167 |
lm_eval/tasks/bigbench/multiple_choice/authorship_verification.yaml | sha256=gjE-K4rye_zIaKDlh8dYy-VwPjofrEl3MQH34Bru_t0 | 169 |
lm_eval/tasks/bigbench/multiple_choice/auto_categorization.yaml | sha256=1Loa5kQ4sOzlqfcbUdrdTIL7uFkAwNdJRlW8ZHA0mrE | 161 |
lm_eval/tasks/bigbench/multiple_choice/auto_debugging.yaml | sha256=uvO9d4dm7ZSI9ExMlEVxHup4SEPMYsC9f-9pCjqhiak | 151 |
lm_eval/tasks/bigbench/multiple_choice/bbq_lite_json.yaml | sha256=PwESU5lyQ8jCt48M1CRu35zjrZe_1KJ0vRAkRsD344M | 149 |
lm_eval/tasks/bigbench/multiple_choice/bridging_anaphora_resolution_barqa.yaml | sha256=zRYUaV6tbiR4vzKE9WNfLuzVycUQgAC2wDrcQ46kQyA | 191 |
lm_eval/tasks/bigbench/multiple_choice/causal_judgment.yaml | sha256=cOoY9jmJRYkA1KGalJ7h8dBUpv9chuakALtfH08gw2w | 153 |
lm_eval/tasks/bigbench/multiple_choice/cause_and_effect.yaml | sha256=wCaVMnfOjvtrVugUuGtsFW6TS9rrJDY0sn3d6mgiz70 | 155 |
lm_eval/tasks/bigbench/multiple_choice/checkmate_in_one.yaml | sha256=gDzulVCGouLHriNLgPs40lx_70LyQQt48yzZoU9mwr4 | 155 |
lm_eval/tasks/bigbench/multiple_choice/chess_state_tracking.yaml | sha256=cpMuwLx4PM6LIZgLKxGFJ5bJbESrjJSwjtrYsi24hvo | 163 |
lm_eval/tasks/bigbench/multiple_choice/chinese_remainder_theorem.yaml | sha256=2kOE5oUeEIvF1T7QwbwbOs_YvWkz9LmRlD6oGAOG7aE | 173 |
lm_eval/tasks/bigbench/multiple_choice/cifar10_classification.yaml | sha256=aaF6C9Y0ShfklEKSBTV1Ge56N9hjGbUWoBhb-k0Q8BM | 167 |
lm_eval/tasks/bigbench/multiple_choice/code_line_description.yaml | sha256=S1035NWJpfsH422H5l0ODN5IYD--TmpCRQ2oYjxwKDM | 165 |
lm_eval/tasks/bigbench/multiple_choice/codenames.yaml | sha256=g9ZH3kojjsJIInfiG_8jQ59lRYE58Beo_vM9-u01tWo | 141 |
lm_eval/tasks/bigbench/multiple_choice/color.yaml | sha256=AQVs0lfVjCKmQVxD21lZ0wvt05IT5zj8hKTBJHIyo-M | 133 |
lm_eval/tasks/bigbench/multiple_choice/common_morpheme.yaml | sha256=1lMuopdW2sXoOl0seZam01J5QLoGQcin6dcak6aIUqY | 153 |
lm_eval/tasks/bigbench/multiple_choice/conceptual_combinations.yaml | sha256=AUk3ixDxwC2d2mmyy0vgBHlvdF8WrZ8CQEVYw_-IRKk | 169 |
lm_eval/tasks/bigbench/multiple_choice/conlang_translation.yaml | sha256=hMZ4TDw66UMt95YDTdzOd8xND9dMboYKRNmHlVZMtwk | 161 |
lm_eval/tasks/bigbench/multiple_choice/contextual_parametric_knowledge_conflicts.yaml | sha256=vtAoTqjUA-LA-6Ha2NTU4mp4sLj8tJ3Pnp6VSiojCjE | 205 |
lm_eval/tasks/bigbench/multiple_choice/crash_blossom.yaml | sha256=TrQV25mnyMHwd_ScNwn5mS8I5P-p3Eh7udUJkdUsWQE | 149 |
lm_eval/tasks/bigbench/multiple_choice/crass_ai.yaml | sha256=40zHsjc3Kwzx4pEHE3EHbmKse2OWlLvVpUio6s9TSME | 139 |
lm_eval/tasks/bigbench/multiple_choice/cryobiology_spanish.yaml | sha256=vQmzgs2Qc6HggqhLO6gnhSMZ9TQLia234w3l-3YM5yg | 161 |
lm_eval/tasks/bigbench/multiple_choice/cryptonite.yaml | sha256=B7W_fs7aBd3bdNrESbV_hN3FinjmtSkQJBIfpLJx-rM | 143 |
lm_eval/tasks/bigbench/multiple_choice/cs_algorithms.yaml | sha256=CBAuNg7LJg_ZkOcwToxUiyx9J9UYL_ZywFBF76RUOW8 | 149 |
lm_eval/tasks/bigbench/multiple_choice/dark_humor_detection.yaml | sha256=ZR7uOXffiox0IEVWYkXOT7SdIQnDcJagKX7VBi67ZIw | 163 |
lm_eval/tasks/bigbench/multiple_choice/date_understanding.yaml | sha256=MCTeid6Oka450ykNY7W3_R0A_PQJho22VFmCeHIfbYo | 159 |
lm_eval/tasks/bigbench/multiple_choice/disambiguation_qa.yaml | sha256=JcqPKhHYk16GrGPoayMtU3GfobU9q4_CJls75HEO2vU | 157 |
lm_eval/tasks/bigbench/multiple_choice/discourse_marker_prediction.yaml | sha256=xiBp0rF6bDNiK29LA_3e3F4z2XBpP4Q04ui8swgUdOM | 177 |
lm_eval/tasks/bigbench/multiple_choice/disfl_qa.yaml | sha256=FT-7_mTAmg2G8cnkBdC_WM7K48XGVOIYrNPyZU4yKgI | 139 |
lm_eval/tasks/bigbench/multiple_choice/dyck_languages.yaml | sha256=zoC2Wr7zftGCJ7Vxz9n-uKnsyC41MEa8qWFzCq0Iw-Q | 151 |
lm_eval/tasks/bigbench/multiple_choice/elementary_math_qa.yaml | sha256=bl0WofRVx69oiYan7-6E4GyIy9O06MbN-ufJQOwC4xw | 159 |
lm_eval/tasks/bigbench/multiple_choice/emoji_movie.yaml | sha256=5bb5pq4ODf2K0KvBKxuS8wzNyiTfCnacRGzlr_FL0ao | 145 |
lm_eval/tasks/bigbench/multiple_choice/emojis_emotion_prediction.yaml | sha256=m4nNGvxS2WQvxPnL8zraYKMT_G-Ech-YQpJPHNBOOx4 | 173 |
lm_eval/tasks/bigbench/multiple_choice/empirical_judgments.yaml | sha256=LW2ualE3N4kwkHVrI0d6EoyGMYW2w9zAHeZSblMoBY4 | 161 |
lm_eval/tasks/bigbench/multiple_choice/english_proverbs.yaml | sha256=pvklpKxfGJPON-55U-u_OpuX6TjeiFAwaZG9DoYWsL8 | 155 |
lm_eval/tasks/bigbench/multiple_choice/english_russian_proverbs.yaml | sha256=LaXw7JBMw9wYRSQ5Oc6UcVRWRObxK-YZZuET8RnImNE | 171 |
lm_eval/tasks/bigbench/multiple_choice/entailed_polarity.yaml | sha256=O4jpB-YazafZ2eMfAP_X5V6km3_SYrVM8TQr20kgsDM | 157 |
lm_eval/tasks/bigbench/multiple_choice/entailed_polarity_hindi.yaml | sha256=XMv0z940AAAPrLUOLbzx30hK1nto1eOHdHtFmpZjiHo | 169 |
lm_eval/tasks/bigbench/multiple_choice/epistemic_reasoning.yaml | sha256=V5TJetxQ2yrJ6-wKdocsee7IQ5RCDFEyCyAyxrJKCJg | 161 |
lm_eval/tasks/bigbench/multiple_choice/evaluating_information_essentiality.yaml | sha256=tvkY6sCaIJ8__vR6s-KwEd98-ratIPCoqRt3aDJGiqk | 193 |
lm_eval/tasks/bigbench/multiple_choice/fact_checker.yaml | sha256=PsjpCG1Lr4TyF0j4g3qafA9JilHA-gkOk4UFJBi26Jg | 147 |
lm_eval/tasks/bigbench/multiple_choice/fantasy_reasoning.yaml | sha256=WV-E_5iU6mzN6TuVx5tzxQHoj4eRECe1nGvBYchoKWM | 157 |
lm_eval/tasks/bigbench/multiple_choice/few_shot_nlg.yaml | sha256=jyhPKTSznBwm-Wc4qZL-oRNuW_bX0EHm_Ub5yPQNrkc | 147 |
lm_eval/tasks/bigbench/multiple_choice/figure_of_speech_detection.yaml | sha256=M_04O90Pe0ouz3C1hB9cr3OHCpDBg6uEwmov0WmpG1w | 175 |
lm_eval/tasks/bigbench/multiple_choice/formal_fallacies_syllogisms_negation.yaml | sha256=kYQBuhXwGX4rkfsH5-xl8a89clZ44J2yDRDXWaEWxlo | 195 |
lm_eval/tasks/bigbench/multiple_choice/gem.yaml | sha256=p5K2HUddtwio3c-BDgWgXA1IakG9WRxxWwlrkk6DhZE | 129 |
lm_eval/tasks/bigbench/multiple_choice/gender_inclusive_sentences_german.yaml | sha256=M8fGO2pAf24VVLe475dPNULbbfS8VKqo4kJavuCPiMc | 189 |
lm_eval/tasks/bigbench/multiple_choice/general_knowledge.yaml | sha256=c0wF8hScD69clivEqyHCrS-q54U3HXxkSdaTnF6Japs | 157 |
lm_eval/tasks/bigbench/multiple_choice/geometric_shapes.yaml | sha256=fC2JycgGzSw7Mv2Rtrm9LuzBMPOQ7GOsbvn6BTFPWYM | 155 |
lm_eval/tasks/bigbench/multiple_choice/goal_step_wikihow.yaml | sha256=YKxtalWZL4K1_ZsWc-LjcuoCcA4zZrJo9k2j6Gwf-H0 | 157 |
lm_eval/tasks/bigbench/multiple_choice/gre_reading_comprehension.yaml | sha256=fP4Je-tWun2_aVA9t5VdgVQhxr_XV6dFpOqN8gOmQHs | 173 |
lm_eval/tasks/bigbench/multiple_choice/hhh_alignment.yaml | sha256=_tUXB6FyCm4FhrzdvGCGToZ9Uel7iiT9bTYhcctmxcc | 149 |
lm_eval/tasks/bigbench/multiple_choice/hindi_question_answering.yaml | sha256=OoSurgrc790dPRWg_xpYhqCpqYwKgzCtc5UQNVhQC2Y | 171 |
lm_eval/tasks/bigbench/multiple_choice/hindu_knowledge.yaml | sha256=mR19KJvjc1Zfu1iTZ_XXJEHhGceewlaIor23i9NFT-4 | 153 |
lm_eval/tasks/bigbench/multiple_choice/hinglish_toxicity.yaml | sha256=yFWbJIcU7bixzLbEhGB8jTh_zfufQDN9pb9RHsjI3is | 157 |
lm_eval/tasks/bigbench/multiple_choice/human_organs_senses.yaml | sha256=AN-lVocUpTUEXbxlXETc9wvbtI4VlQRbam4yJ8DuAa8 | 161 |
lm_eval/tasks/bigbench/multiple_choice/hyperbaton.yaml | sha256=cD8xjAZ2PkPaNci9URLHuJp6ycFqBaFItFDx1CbMnIU | 143 |
lm_eval/tasks/bigbench/multiple_choice/identify_math_theorems.yaml | sha256=fuAPHAn6v_4nsTlMViKA--Oir38GoRFdRsjbgXajIYU | 167 |
lm_eval/tasks/bigbench/multiple_choice/identify_odd_metaphor.yaml | sha256=abV3gYfcE6CkeVu_VHw34PHOKB-lqxpIVUbpS5_KECg | 165 |
lm_eval/tasks/bigbench/multiple_choice/implicatures.yaml | sha256=wxZTAm9VbfCWoxE1jU9k3nzy4njiLbQf6syZJHoKT5A | 147 |
lm_eval/tasks/bigbench/multiple_choice/implicit_relations.yaml | sha256=qCOpepGcuNlXEkSXzQ8kWBhMd5SxMH21Qe4rOkQruzs | 159 |
lm_eval/tasks/bigbench/multiple_choice/intent_recognition.yaml | sha256=NgkXv5sA4F6tA7yW6NVdGolTURrf9_2hr4-qGzgl4RI | 159 |
lm_eval/tasks/bigbench/multiple_choice/international_phonetic_alphabet_nli.yaml | sha256=ikVnfnKZMzeuE2DxWfdyHxN2I78_o2WbOiQmyZdAmIY | 193 |
lm_eval/tasks/bigbench/multiple_choice/international_phonetic_alphabet_transliterate.yaml | sha256=Q9G0lf0IolZ6zI5Kql6WiTdIU1LXOhdvGgnFDMzSh2g | 213 |
lm_eval/tasks/bigbench/multiple_choice/intersect_geometry.yaml | sha256=AMQk-kMyhzMYRKXMPwVjRw81vz5SbzdJKv3n3DVhE-s | 159 |
lm_eval/tasks/bigbench/multiple_choice/irony_identification.yaml | sha256=9uJjn9cc_1FKV0B6Q_RApFQFLgOWg5epCthdFy4OxbQ | 163 |
lm_eval/tasks/bigbench/multiple_choice/kanji_ascii.yaml | sha256=OiDkSbsojWXhvuXd1hm-gg0FDAM1gIFi3ZgIqSCZ7Ak | 145 |
lm_eval/tasks/bigbench/multiple_choice/kannada.yaml | sha256=9r5l-ePBRwIct7oCLnbcAd1Go7YjdT4_49VFW9MZUFg | 137 |
lm_eval/tasks/bigbench/multiple_choice/key_value_maps.yaml | sha256=oDwDxjIHL_xoL59erf39h02ktA175lz3AwVmdQO4EBY | 151 |
lm_eval/tasks/bigbench/multiple_choice/known_unknowns.yaml | sha256=zqJ_y82QBR49vIjl-nXaMztSnmQHZyt89iYduvODAJI | 151 |
lm_eval/tasks/bigbench/multiple_choice/language_games.yaml | sha256=uNakbVpnDGUANSXyjC2Soq2AhojHJxdP8nUtZtoQCZ8 | 151 |
lm_eval/tasks/bigbench/multiple_choice/language_identification.yaml | sha256=H9R_FN6zSJ-r1PJuxzLj-Zokaz_h_SnFL5-TOqsXgrk | 169 |
lm_eval/tasks/bigbench/multiple_choice/linguistic_mappings.yaml | sha256=1Gg8iqLbb_Q1loJ3D6vrp1cG_RPMiJ_lidRaDmXmQjY | 161 |
lm_eval/tasks/bigbench/multiple_choice/linguistics_puzzles.yaml | sha256=IFwKu0pmpWcPPfw2mlB-vHJQdnc2UeGOnFpJW862ejQ | 161 |
lm_eval/tasks/bigbench/multiple_choice/list_functions.yaml | sha256=YnjOU3p7YZ6H-b-3pe7JpxqU7n38vDRUujHvFeGg9rg | 151 |
lm_eval/tasks/bigbench/multiple_choice/logic_grid_puzzle.yaml | sha256=tTzJVoptnvAXvHrSa_p8SQBitcqm33N7xj19c5-k958 | 157 |
lm_eval/tasks/bigbench/multiple_choice/logical_args.yaml | sha256=EXkFCjB2ZwgQbaFRueg0GAU0YeaShfIg7Hntr6qLl6c | 147 |
lm_eval/tasks/bigbench/multiple_choice/logical_deduction.yaml | sha256=CkQfV5G0ODHf2-jsn-kGQpWVn_XZxvCQMC51FLB_-2I | 157 |
lm_eval/tasks/bigbench/multiple_choice/logical_fallacy_detection.yaml | sha256=38FqX9n3B7vCiAipQOBy0h-U196BkXJbLYas9QQf_lU | 173 |
lm_eval/tasks/bigbench/multiple_choice/logical_sequence.yaml | sha256=svmGHJqVBczZFAJIlLEr1ZkXeww14sJmlSO0Q3mPSNo | 155 |
lm_eval/tasks/bigbench/multiple_choice/mathematical_induction.yaml | sha256=WlHISjFdS1bDDWcXaunC_YCxR8xiwDMywcK1V5oTjSs | 167 |
lm_eval/tasks/bigbench/multiple_choice/matrixshapes.yaml | sha256=dRaQ7CK36fOGIgxjQpqbL0G54sCruap1erCqwjKn8II | 147 |
lm_eval/tasks/bigbench/multiple_choice/metaphor_boolean.yaml | sha256=6zPIyGfa2_1F0izqys2BA_oPRqP6bkuG8mn1sr-SSO8 | 155 |
lm_eval/tasks/bigbench/multiple_choice/metaphor_understanding.yaml | sha256=gDPNGHax72oqSOG9FEZtb4o1RwnQFRnWxtpP21MtTGA | 167 |
lm_eval/tasks/bigbench/multiple_choice/minute_mysteries_qa.yaml | sha256=uxFxZS1VCrFTzlCNIZySELdJwBySfiy49d9sDl0PxIQ | 161 |
lm_eval/tasks/bigbench/multiple_choice/misconceptions.yaml | sha256=hD9u1UkaUMCrBOo4hQ3aqGaXn2OsYWx9BHehVbmR8SQ | 151 |
lm_eval/tasks/bigbench/multiple_choice/misconceptions_russian.yaml | sha256=RyOFlUECkBfgXVwINo6nb4LZGIGEHvEOf3QXRPuHqgo | 167 |
lm_eval/tasks/bigbench/multiple_choice/mnist_ascii.yaml | sha256=d82XP_zCc1BVX62ACAtwRFqTknRUiBdA8e_dfG8mDDU | 145 |
lm_eval/tasks/bigbench/multiple_choice/modified_arithmetic.yaml | sha256=k9XOUspUkQgwPr6zq8x_thAYCKCXWQnI42WObqza1cA | 161 |
lm_eval/tasks/bigbench/multiple_choice/moral_permissibility.yaml | sha256=gwWRvZfl3EB6KfqPgeYopWi0selkq6TUoOwT2yIu-N8 | 163 |
lm_eval/tasks/bigbench/multiple_choice/movie_dialog_same_or_different.yaml | sha256=rbRbTacFYTA4w0IiCDwu-BV3cXdoTyUHaiZBw_da3KM | 183 |
lm_eval/tasks/bigbench/multiple_choice/movie_recommendation.yaml | sha256=Q_m6rVIIAYrScV9rOL-whs2uQpI_SS_PfzlRvguOSEo | 163 |
lm_eval/tasks/bigbench/multiple_choice/mult_data_wrangling.yaml | sha256=qqn2a0LC4p3RZfCr0zPwK3RrH3ujzASfFzWZBouJMlc | 161 |
lm_eval/tasks/bigbench/multiple_choice/multiemo.yaml | sha256=mQiAx9YxXNa7KIiQOq5-xsw6H3orqeTKaTWUMVQ-eH4 | 139 |
lm_eval/tasks/bigbench/multiple_choice/natural_instructions.yaml | sha256=Xkz8HRANNey5ai4RDCKq74SKvjDiAgFCnOtc2cpW_KY | 163 |
lm_eval/tasks/bigbench/multiple_choice/navigate.yaml | sha256=4w-tghcD6TA82faIKLv7a788eeunV9xLpZuEgv-_fPQ | 139 |
lm_eval/tasks/bigbench/multiple_choice/nonsense_words_grammar.yaml | sha256=WcvwDGDH3ngMkubAv-OwJotfPospfM0g9sQvt28zcDI | 167 |
lm_eval/tasks/bigbench/multiple_choice/novel_concepts.yaml | sha256=70FLoqaSM9FuJcw3Inq0_lDlq9kOhZKA9LRP3pyMkTg | 151 |
lm_eval/tasks/bigbench/multiple_choice/object_counting.yaml | sha256=FgmaBFkmloF4vO_ggHuFZAZ0y63SP7jFcROGEQa5K4Q | 153 |
lm_eval/tasks/bigbench/multiple_choice/odd_one_out.yaml | sha256=pNe2yMix9NoxFR1uFGMvmGJ-XXaf-k91GqhVGqx8IIo | 145 |
lm_eval/tasks/bigbench/multiple_choice/operators.yaml | sha256=dynr_XiyX2B3YdNH0aYHumgStnqf1Xlc1tEqnaLNSwU | 141 |
lm_eval/tasks/bigbench/multiple_choice/paragraph_segmentation.yaml | sha256=pzkd799eOlhMSs1plT9VKX2va6QR8pGw-G3ZQ7fJdSY | 167 |
lm_eval/tasks/bigbench/multiple_choice/parsinlu_qa.yaml | sha256=AVBwt6tCfZ0laBosVW5MQ9ko8487szfZPWs3EvDIKEY | 145 |
lm_eval/tasks/bigbench/multiple_choice/parsinlu_reading_comprehension.yaml | sha256=5FOCYca9TArYrwVDhW-j8gVNDdh7gj2Xx5bNU05NrLE | 183 |
lm_eval/tasks/bigbench/multiple_choice/penguins_in_a_table.yaml | sha256=oL_-N96gKsrGBfBg2UD6ct3hU1gh51gvXpKoCGD0DuY | 161 |
lm_eval/tasks/bigbench/multiple_choice/periodic_elements.yaml | sha256=HypvcUcCkflKLvsZFP9_OmmWmNCpHN2oflxSs-0se4k | 157 |
lm_eval/tasks/bigbench/multiple_choice/persian_idioms.yaml | sha256=S_f8iqKOnKJ4lHG5egkLDgO3XqQhz8eluPDizWvvyhw | 151 |
lm_eval/tasks/bigbench/multiple_choice/phrase_relatedness.yaml | sha256=SbcRCbbvr50IkMhdJOYh6Ut2hvIv6tKAr-H6Ly0xVn4 | 159 |
lm_eval/tasks/bigbench/multiple_choice/physical_intuition.yaml | sha256=itDxp960hGYTGOecgg4_SIvnVUJWD2oGK0VS1bwfFvc | 159 |
lm_eval/tasks/bigbench/multiple_choice/physics.yaml | sha256=zp1ylYAHchQc_NZI_80znXr3x1Keaith7F7FZWixdZY | 137 |
lm_eval/tasks/bigbench/multiple_choice/physics_questions.yaml | sha256=KAOHwtZhxcs1OM9zHkTjLKih8qFPR6UTuY5xs0J1QM0 | 157 |
lm_eval/tasks/bigbench/multiple_choice/play_dialog_same_or_different.yaml | sha256=XARNBYPXja_b1ve7ivRgjY40Rs_sY0-Ypb4wR10HJos | 181 |
lm_eval/tasks/bigbench/multiple_choice/polish_sequence_labeling.yaml | sha256=6mgV-tUc9a9al1MqQuPMBRTHnADYjcmOb2wiZ2aKPTs | 171 |
lm_eval/tasks/bigbench/multiple_choice/presuppositions_as_nli.yaml | sha256=nxOBZPZEZiW3U3oehpw__LgpohBZqtw6C228vfWkpOI | 167 |
lm_eval/tasks/bigbench/multiple_choice/qa_wikidata.yaml | sha256=AQqA32tK3YV35djuf0xguKYGjUlYu7aF7nzYNVLv3zY | 145 |
lm_eval/tasks/bigbench/multiple_choice/question_selection.yaml | sha256=-We9wR4lHJ8Mt876ASjZ-BCqDgVJ3rxjetwkhDN6m44 | 159 |
lm_eval/tasks/bigbench/multiple_choice/real_or_fake_text.yaml | sha256=sXE9yUoZP_zLenXb3elDIqkbqWliUCGgbj-2zJaZ1j0 | 157 |
lm_eval/tasks/bigbench/multiple_choice/reasoning_about_colored_objects.yaml | sha256=GxUoDPDFc1X_A8t6Ry0U2ik4nFPCPD_rcRb2NzSazpQ | 185 |
lm_eval/tasks/bigbench/multiple_choice/repeat_copy_logic.yaml | sha256=zwE2sFi9wS_uSfJuk06Pp-iwMU9kKHZ-Hycdl0XzlmI | 157 |
lm_eval/tasks/bigbench/multiple_choice/rephrase.yaml | sha256=765_dob8s3IUxEIBnEjXROaraac0MXMJsIO6427AHlQ | 139 |
lm_eval/tasks/bigbench/multiple_choice/riddle_sense.yaml | sha256=3YmY87ChwiGd7QR4svwruN7uTbHc9SO2GrY5P27R6hY | 147 |
lm_eval/tasks/bigbench/multiple_choice/ruin_names.yaml | sha256=FftjCDl4NT38Y9OGqXK8DPpJMlpiuIrCgFmHf4dUPIc | 143 |
lm_eval/tasks/bigbench/multiple_choice/salient_translation_error_detection.yaml | sha256=cwqUPYs4ABD4Up3p5Zoc9o1eRWIDWJeF6LCqlzYbnsA | 193 |
lm_eval/tasks/bigbench/multiple_choice/scientific_press_release.yaml | sha256=K-hSiBHahbEHsTRZcRlrLiTgr40LpSz2XqxelmVpPkg | 171 |
lm_eval/tasks/bigbench/multiple_choice/semantic_parsing_in_context_sparc.yaml | sha256=e4rUYPAz9NKdHyJuVNm8aOCc5wvJfCufbkBgDOdcuxo | 189 |
lm_eval/tasks/bigbench/multiple_choice/semantic_parsing_spider.yaml | sha256=03wphaTbuRbJjPimKY46pZyR7xYXtinoazFm9y8W3UU | 169 |
lm_eval/tasks/bigbench/multiple_choice/sentence_ambiguity.yaml | sha256=JE1-08FYW-dxEOpx5bpZezg7bv7PGXxKrPJy6-YyBls | 159 |
lm_eval/tasks/bigbench/multiple_choice/similarities_abstraction.yaml | sha256=mSSvLTS_klQJnnJ5XyivY35lRjPBlnMaIRZm1qksNNE | 171 |
lm_eval/tasks/bigbench/multiple_choice/simp_turing_concept.yaml | sha256=PCjOzMdvflXFY80rT2mUEqrRSUSjpV2G4nBvJrg-7bY | 161 |
lm_eval/tasks/bigbench/multiple_choice/simple_arithmetic_json.yaml | sha256=Vn-qd71dMDRG_O8qW3RWNw18RfzRfh_WAbX8uIWdJ-4 | 167 |
lm_eval/tasks/bigbench/multiple_choice/simple_arithmetic_json_multiple_choice.yaml | sha256=z-7I7haN3gbj-ob7HpXEcc3BGHi54Rcpx4vUuklopXY | 199 |
lm_eval/tasks/bigbench/multiple_choice/simple_arithmetic_json_subtasks.yaml | sha256=scaWSib2RTInLTPq9QTjP9jqFuGrswRjoG1ldf7ZV40 | 185 |
lm_eval/tasks/bigbench/multiple_choice/simple_arithmetic_multiple_targets_json.yaml | sha256=c_5j1thsZWGPpN587L9wwTvGXJtn0bXHwsPkQti-Gtc | 201 |
lm_eval/tasks/bigbench/multiple_choice/simple_ethical_questions.yaml | sha256=AoEpxT-BJNoK14erRJF2KMRHhxYQknT8RlKyFfUo464 | 171 |
lm_eval/tasks/bigbench/multiple_choice/simple_text_editing.yaml | sha256=iQ2dhZDQmVjwI45MNA4tq6QSUteDHZhrAA26AUcolfM | 161 |
lm_eval/tasks/bigbench/multiple_choice/snarks.yaml | sha256=6fzQ534gJ258GBeQ_dAfY6XDWO_4iiFCqnk25UoLaw8 | 135 |
lm_eval/tasks/bigbench/multiple_choice/social_iqa.yaml | sha256=9YXML6u8TMjEXmgoiCCaxPuwWAkI3D_hZ7DSFHgXOBM | 143 |
lm_eval/tasks/bigbench/multiple_choice/social_support.yaml | sha256=0DtPajyURdrecK8iK_a1rHn0CGSVl0AV4P-ZHsdYX90 | 151 |
lm_eval/tasks/bigbench/multiple_choice/sports_understanding.yaml | sha256=tMqTvRUO8LkLwBlETT0gifsPuVhGPloBALx0RFUbiDg | 163 |
lm_eval/tasks/bigbench/multiple_choice/strange_stories.yaml | sha256=tg_ziIxDWhe-gKEZhXmPYBPjxEO5eLBIxZt0jNamWJs | 153 |
lm_eval/tasks/bigbench/multiple_choice/strategyqa.yaml | sha256=qpCs5rUpwnwaxM2-WwoD7d_dcGyRNj9udfj3YgPg0XA | 143 |
lm_eval/tasks/bigbench/multiple_choice/sufficient_information.yaml | sha256=6ELBpj2L4d328g-i3VBD4TdF-bbluyLMwvxbeEosXS4 | 167 |
lm_eval/tasks/bigbench/multiple_choice/suicide_risk.yaml | sha256=6gP5J1tuQZbJV0GzM1EF0d6_YvK9_oQ_Ql4R8AiPQEk | 147 |
lm_eval/tasks/bigbench/multiple_choice/swahili_english_proverbs.yaml | sha256=wMNK9p2Pj30r66cn1zvSShLSux0RfFuVfNqWwGB70UA | 171 |
lm_eval/tasks/bigbench/multiple_choice/swedish_to_german_proverbs.yaml | sha256=5XxtyZUUBNpHkfQnyuxGO8vkJFeOk4TC_UPy_CQCT8M | 175 |
lm_eval/tasks/bigbench/multiple_choice/symbol_interpretation.yaml | sha256=8VX_GFgr3i6Dc8tn0VOeIQ_wNzKbsLZsEXwNywbDSV0 | 165 |
lm_eval/tasks/bigbench/multiple_choice/temporal_sequences.yaml | sha256=H0WwLH2bVviU4DCJG84cdRj7S_O--KFo0ibF2Marr5g | 159 |
lm_eval/tasks/bigbench/multiple_choice/tense.yaml | sha256=Bruxfq7hLnGRQgBe3wP2dTuNi-lEEBLZkB0OtcOwDG0 | 133 |
lm_eval/tasks/bigbench/multiple_choice/timedial.yaml | sha256=AydfQAj3ZiDrUzOCHOnVRNrza3UbwsLgNvnEtboFK2E | 139 |
lm_eval/tasks/bigbench/multiple_choice/topical_chat.yaml | sha256=buvC9ck4McRAUL7hO2q-C3tbOZ4IRhtrvFoX5d98tRE | 147 |
lm_eval/tasks/bigbench/multiple_choice/tracking_shuffled_objects.yaml | sha256=q4HsGJ0s0z8nQ4igwGUukttJBuMkiJc926OPME6UE-Q | 173 |
lm_eval/tasks/bigbench/multiple_choice/understanding_fables.yaml | sha256=vrKXG8Y9kVogHrp0FnMYarytSJLGD2QcGldbhWbX98U | 163 |
lm_eval/tasks/bigbench/multiple_choice/undo_permutation.yaml | sha256=obnLt5OywuNhhELip5jNgotWCwAHzd6IrVgWkZzmMPY | 155 |
lm_eval/tasks/bigbench/multiple_choice/unit_conversion.yaml | sha256=0GFL35T0IRYgMNMss-LLQwmdANbdhFJ-NEUYspB9pHc | 153 |
lm_eval/tasks/bigbench/multiple_choice/unit_interpretation.yaml | sha256=vLqDPIdMj8FlMq5AQUXyz7o7k0lGC4_BLop9TRNALgM | 161 |
lm_eval/tasks/bigbench/multiple_choice/unnatural_in_context_learning.yaml | sha256=sF8nmC30vsXZR1Xn-a1m5mAXC-lrqs18_t20qJ1cw94 | 181 |
lm_eval/tasks/bigbench/multiple_choice/vitaminc_fact_verification.yaml | sha256=1sZ7XhrJGGbicdOJbJxl61yTzy0nez3wMNvr8DtoR10 | 175 |
lm_eval/tasks/bigbench/multiple_choice/what_is_the_tao.yaml | sha256=g4sj5BjHAlbLqt5KBrvXT3jAvofFobdIacNmfugmcAE | 153 |
lm_eval/tasks/bigbench/multiple_choice/which_wiki_edit.yaml | sha256=AHNB5MgzPP6hC79ktaPGcCrTNHnklYxiU25R1ACdEAc | 153 |
lm_eval/tasks/bigbench/multiple_choice/winowhy.yaml | sha256=jD95Obu3GrnKP_oZL26NrOAvznQJV0274KmLlg_wM1k | 137 |
lm_eval/tasks/bigbench/multiple_choice/word_sorting.yaml | sha256=WJctV0okW4jjU3HgprNUyNc9yeFan109eC77Bayq9tk | 147 |
lm_eval/tasks/bigbench/multiple_choice/word_unscrambling.yaml | sha256=560CY4-vhF5C97RpIDVjaht1RchocipGDvlmimZp_ZQ | 157 |
lm_eval/tasks/blimp/README.md | sha256=DWssG7sScoVaJep8XMGuh7q4ypM9m0evl9YzvnxgFeA | 2920 |
lm_eval/tasks/blimp/_template_yaml | sha256=rZkGUXEqrKs8arNiTCURkoWdcl-qe-3vzMMgj8D2LEY | 335 |
lm_eval/tasks/blimp/adjunct_island.yaml | sha256=-9lX4hPdterByJxKE5g0rKbduMM19WgtEMvblkzv68s | 104 |
lm_eval/tasks/blimp/anaphor_gender_agreement.yaml | sha256=YvC5NfoTfaIQ8YEYSXDsj3nUph38cVyV6V6j8zDmmrM | 124 |
lm_eval/tasks/blimp/anaphor_number_agreement.yaml | sha256=QZLYkO_7cmUYG0wJFBbXvoDAdgzEouIlWaw3WIlp85o | 124 |
lm_eval/tasks/blimp/animate_subject_passive.yaml | sha256=znBh6LPx2JsVMfGJro-hfKDSwKb6UEPuv0SJ7bxjAF0 | 122 |
lm_eval/tasks/blimp/animate_subject_trans.yaml | sha256=NA59OdcPs1vcNK37AObFpIRusV4bXJAZWwgptFKWlxs | 118 |
lm_eval/tasks/blimp/causative.yaml | sha256=iOyrzoGsOaU7L1mRctjhuFVgxFma_Z8FIDana6GRP-U | 94 |
lm_eval/tasks/blimp/complex_NP_island.yaml | sha256=IJZMuZgeeJhBdE5fRK9JLkHv4-EFjRGIdZzOMlh6acE | 110 |
lm_eval/tasks/blimp/coordinate_structure_constraint_complex_left_branch.yaml | sha256=3KHjSpHUgOlMknw6yyeuFcmq7Tr5Aj0BWhABRqBAXKI | 178 |
lm_eval/tasks/blimp/coordinate_structure_constraint_object_extraction.yaml | sha256=1utajR5vsWlwfMlxnAIh6g_ZWMerLWplnVa_91ZOOt8 | 174 |
lm_eval/tasks/blimp/determiner_noun_agreement_1.yaml | sha256=Xozzid4qpRC2c2Y0G2CzQA4MwtC6lmAxWYzolnV1vyg | 130 |
lm_eval/tasks/blimp/determiner_noun_agreement_2.yaml | sha256=h3l_Nur4ofxlOCEKG74Ped29pgKrKGJ2EU06CR-W_ko | 130 |
lm_eval/tasks/blimp/determiner_noun_agreement_irregular_1.yaml | sha256=SaT-zTh8rDVb0lpIxKqDsvBaKGGtR2UtyzqE0n-ixuE | 150 |
lm_eval/tasks/blimp/determiner_noun_agreement_irregular_2.yaml | sha256=mkorgBYuduNOB-gTdMlNFAxV6N7dC7mjdtL3jcpaWmE | 150 |
lm_eval/tasks/blimp/determiner_noun_agreement_with_adj_2.yaml | sha256=RyuzjODaFGx-tpB4qsFUCp6LKxq23TQVpePCW8Qffys | 148 |
lm_eval/tasks/blimp/determiner_noun_agreement_with_adj_irregular_1.yaml | sha256=yhSMa2TUnNbcDabHYtIPdgbU34sbFrEW2_WxDXzzrcc | 168 |
lm_eval/tasks/blimp/determiner_noun_agreement_with_adj_irregular_2.yaml | sha256=dmUQWIxZnSKEGJgBxBMancfBTAjhp-5Fn6IiL3w1ci4 | 168 |
lm_eval/tasks/blimp/determiner_noun_agreement_with_adjective_1.yaml | sha256=qO4si9QBuAvM1y0yGP9ZZo1YiQlBZljl2n8zKFh9VDE | 160 |
lm_eval/tasks/blimp/distractor_agreement_relational_noun.yaml | sha256=ZXy-qJ5fkMeqctJDqo2hJfsM-8usA9bneX7VWAvR1Ak | 148 |
lm_eval/tasks/blimp/distractor_agreement_relative_clause.yaml | sha256=aylJHRj3J50lqloD6TtbRWgTC8sMek7PlolhlQ2_wTs | 148 |
lm_eval/tasks/blimp/drop_argument.yaml | sha256=piUDj4gM9_dlopsxQB47CYpaFOV2Z6l3beZEScQqB38 | 102 |
lm_eval/tasks/blimp/ellipsis_n_bar_1.yaml | sha256=pawDpZP85htkOT_Db2TRFP19neJP1xio404cYcFhzv8 | 108 |
lm_eval/tasks/blimp/ellipsis_n_bar_2.yaml | sha256=OBAtmSx6TW2Rgo-zdqKNp6ZBhJPBOa8eODvTZb8Blmg | 108 |
lm_eval/tasks/blimp/existential_there_object_raising.yaml | sha256=f8wWYmAiqdEAKqIDcSCB2mj3CXRpz6Xx23tBw_YFmAk | 140 |
lm_eval/tasks/blimp/existential_there_quantifiers_1.yaml | sha256=0dCbp1jHm8zZrznnHDWb31ho8rDV4tnLR3Fm1uGUMFI | 138 |
lm_eval/tasks/blimp/existential_there_quantifiers_2.yaml | sha256=il9eevifcY7YXleFZtMPeT2aHM_0q_pmRrMX8Dnlvas | 138 |
lm_eval/tasks/blimp/existential_there_subject_raising.yaml | sha256=Pms6JBnODzdcBr0HkS9o7oMskk0Uxxl0Smz7y8iFnhg | 142 |
lm_eval/tasks/blimp/expletive_it_object_raising.yaml | sha256=DP15wYDN9C4ZZFBqz9TcnG89_GkmXm91YWFeueJGZ8g | 130 |
lm_eval/tasks/blimp/generate_configs.py | sha256=ViuxTjh-O4eOHVSxwbVzMmig00R9Fo3tJz7Gi95CNrk | 2883 |
lm_eval/tasks/blimp/inchoative.yaml | sha256=DsMpj_a2yrOchFTmTXat0LGocDai5yEhefMj4mw11ug | 96 |
lm_eval/tasks/blimp/intransitive.yaml | sha256=S4KtS7drV5J2iqoe3TNXbJIM56m85KCXSTBeCLJModg | 100 |
lm_eval/tasks/blimp/irregular_past_participle_adjectives.yaml | sha256=gZhQpDK95j2qJotGRqg1JY5aRxDKMvABwpwLEHBHDvg | 148 |
lm_eval/tasks/blimp/irregular_past_participle_verbs.yaml | sha256=J7i1uPI1XRkOJ5J9fVDqkma-DBIVpTP4CQaPF9zNc6A | 138 |
lm_eval/tasks/blimp/irregular_plural_subject_verb_agreement_1.yaml | sha256=vkRRN_PpLhliyDbdjyrWP-Exo0IPvqbBxbV-gB-6u-Q | 158 |
lm_eval/tasks/blimp/irregular_plural_subject_verb_agreement_2.yaml | sha256=Dhce_QyhiMuLq5nYtEsg9f2U14a2lPM5gNoa_k1BZqU | 158 |
lm_eval/tasks/blimp/left_branch_island_echo_question.yaml | sha256=tmYr6gGH_W_bsTxfD0o8E0gm0lpPX_RouukysmN8PmE | 140 |
lm_eval/tasks/blimp/left_branch_island_simple_question.yaml | sha256=6fQOQ1Khq4c4r2FKjccNOzQq2nPfSWGEfWAY5ui5YZk | 144 |
lm_eval/tasks/blimp/matrix_question_npi_licensor_present.yaml | sha256=zgviPtzlA4t_e1I0uJHQWSIXoVxGCCYCbE9Q6ZJ8H0g | 148 |
lm_eval/tasks/blimp/npi_present_1.yaml | sha256=1lFMhXRmF1N-ZCRA71OieXn9dcaNWM0h1_tr9nf3dr8 | 102 |
lm_eval/tasks/blimp/npi_present_2.yaml | sha256=hkelD4YT05hqNiBu6foSc8Ea6DBTVEZo6tA4_W6pn58 | 102 |
lm_eval/tasks/blimp/only_npi_licensor_present.yaml | sha256=8exp0yKRSCPcD5AXBbURBTDI1FaCcpWTDP_SQNckXgA | 126 |
lm_eval/tasks/blimp/only_npi_scope.yaml | sha256=ByExTctp9xZmTtKrHCGJg70UY6yD2Kqpt1i95zIl1Xo | 104 |
lm_eval/tasks/blimp/passive_1.yaml | sha256=aVZXNP2pI2DzSfGuNtNLmWElXxdNPTAMCABV8Yb9Kvk | 94 |
lm_eval/tasks/blimp/passive_2.yaml | sha256=RSkmNYrndnY5tweYPxL1rvb7_IYJdBfs-QXQXHvpSuk | 94 |
lm_eval/tasks/blimp/principle_A_c_command.yaml | sha256=HNR2XQIRJfJlOn63103PmDnnUG2NY2iMuWPAB_tKoGU | 118 |
lm_eval/tasks/blimp/principle_A_case_1.yaml | sha256=2q4Zrc27iGDVaT7XilWvcJCzL3il8UILyEW6BW3-RMs | 112 |
lm_eval/tasks/blimp/principle_A_case_2.yaml | sha256=VgfFmGJ5ODxbAyga-hvWrH4ALajZ0CqY8S1yMF5dN6c | 112 |
lm_eval/tasks/blimp/principle_A_domain_1.yaml | sha256=wjWNm-2SkxOJpUf6XplZuY_lm45qNsAhEqf8gkw42cE | 116 |
lm_eval/tasks/blimp/principle_A_domain_2.yaml | sha256=I7-vj_eHLXL92Q5YyQg0tNkn6XfDwZQmYAcdxZ5jDUk | 116 |
lm_eval/tasks/blimp/principle_A_domain_3.yaml | sha256=N4NOk4-FYUrZe_yEB3QVpK10l5YTbVvAR8T2ZdZJbIY | 116 |
lm_eval/tasks/blimp/principle_A_reconstruction.yaml | sha256=kbgPw8WRvQgEw4nOx6lIahrJfiwQgeldg-_ubuyduKQ | 128 |
lm_eval/tasks/blimp/regular_plural_subject_verb_agreement_1.yaml | sha256=TRl_ZSGOzmoKj8aaps-3UoUH-E2CQTvHkT7oY8tvnp0 | 154 |
lm_eval/tasks/blimp/regular_plural_subject_verb_agreement_2.yaml | sha256=El69s111tnlZ3PaVD8dJ_mnGyHkwfF1Lx1NRbegvyqc | 154 |
lm_eval/tasks/blimp/sentential_negation_npi_licensor_present.yaml | sha256=tlDP6oxHDRNT-DOlxqER7c16pMqjRiYtraonx0dhJSQ | 156 |
lm_eval/tasks/blimp/sentential_negation_npi_scope.yaml | sha256=ZA01-DgkD_XiH4_y4LEPTxID6yN6IB3ChXcVM3r-yeo | 134 |
lm_eval/tasks/blimp/sentential_subject_island.yaml | sha256=dWTwulV1S633yAhGuWGuyGttg3fkyYwMM2A_y8HxcKc | 126 |
lm_eval/tasks/blimp/superlative_quantifiers_1.yaml | sha256=faxiPYPbVCG3Jz-PRJoHlYl6EyhEEc-nprr29tV-3Cc | 126 |
lm_eval/tasks/blimp/superlative_quantifiers_2.yaml | sha256=WbMvowOM10KnngE6Nz5iS3f4A5hcEP01331m_m4JmGY | 126 |
lm_eval/tasks/blimp/tough_vs_raising_1.yaml | sha256=pK9Upq5umDCfVZWm8u0E2kxdYmEitsuAqO-5QD9tayc | 112 |
lm_eval/tasks/blimp/tough_vs_raising_2.yaml | sha256=7VeDbZkxEY8D9nwNymqOHotD8NkeTUibGkKJMSigWtQ | 112 |
lm_eval/tasks/blimp/transitive.yaml | sha256=cmejl92fLdcvqrpWR4oX-yLeWExMqtj1a-x0fKHtLwQ | 96 |
lm_eval/tasks/blimp/wh_island.yaml | sha256=jFAVoSJBhuKAfU8fs2kl4US-tFiZ03vnMXbNqYfdF0I | 94 |
lm_eval/tasks/blimp/wh_questions_object_gap.yaml | sha256=kOvup2GXc9GtfsI9i4wzF3_jbL043PeHWjSUWFi0hBE | 122 |
lm_eval/tasks/blimp/wh_questions_subject_gap.yaml | sha256=m3ybX6FgLO7SYEA-7iUyLOTRmXC3hpQpUmkvm620mrw | 124 |
lm_eval/tasks/blimp/wh_questions_subject_gap_long_distance.yaml | sha256=rFcVijVQW-IG_mpNmRNFo7QEEhRoQ5CNVfBGKuI8qnw | 152 |
lm_eval/tasks/blimp/wh_vs_that_no_gap.yaml | sha256=3Buk7jIKXy4e0c7JYjJ5Iknlobz-JjWQxuMFl-PjuqU | 110 |
lm_eval/tasks/blimp/wh_vs_that_no_gap_long_distance.yaml | sha256=RVfGHziEZb_v7um-wo72xZNeSt0VcN6FiODhSq9uxTI | 138 |
lm_eval/tasks/blimp/wh_vs_that_with_gap.yaml | sha256=MwnrjZ-CdZGyvAshYmken2hkNf97BhAXNY03rhu679A | 114 |
lm_eval/tasks/blimp/wh_vs_that_with_gap_long_distance.yaml | sha256=9gOjb25Zw6AtFaXwyyyo9xrapuN3PwBE-zcCZ4zdWbM | 142 |
lm_eval/tasks/ceval/README.md | sha256=UEX7W3AFO3-cM3UcL3yrLoO9C4ZsmiiD2cRzvCH6nys | 4967 |
lm_eval/tasks/ceval/_default_ceval_yaml | sha256=VHEzrG1XsHUwRR3VFM_zRFuFW9hzAZixNw6PigqTVAU | 509 |
lm_eval/tasks/ceval/_generate_configs.py | sha256=SmP2YNepa3FwZYBDFz8chodHfoPzJ-5Uy4m-59mqLxw | 4288 |
lm_eval/tasks/ceval/ceval-valid_accountant.yaml | sha256=r61lKl0DAH5ySKcDs7AwPvQl8JVUiHZfvzmJRmBiUX8 | 207 |
lm_eval/tasks/ceval/ceval-valid_advanced_mathematics.yaml | sha256=TowvVz5_ZfK6yBmcAuqQ1T1uv9_PfeQ8bJen8NkRHrg | 224 |
lm_eval/tasks/ceval/ceval-valid_art_studies.yaml | sha256=kI7p4mk8_5oF4IEb9hAgy9LASGQIXRzzVp5Xar39Kis | 203 |
lm_eval/tasks/ceval/ceval-valid_basic_medicine.yaml | sha256=m2PzLxFzKXbYd4_2Ln2z7sxS25fVlw1GiuKYjnZ1Nt4 | 212 |
lm_eval/tasks/ceval/ceval-valid_business_administration.yaml | sha256=tVyXVeOB5Mk_4WkGiY4FsVMb9GHWA0bXvK9VS22gTw8 | 230 |
lm_eval/tasks/ceval/ceval-valid_chinese_language_and_literature.yaml | sha256=SAhX_ST3R3hSDvyVRoZMvTIDTLzAOR6IA4QHRkUjwvM | 252 |
lm_eval/tasks/ceval/ceval-valid_civil_servant.yaml | sha256=G_8m9RcD_aV7jJXAubW_1oq84RIbrUfyLZxxTcic_vE | 207 |
lm_eval/tasks/ceval/ceval-valid_clinical_medicine.yaml | sha256=0QikXTEvr3amDcUGl8DcfynOZj0Ll5hZRa1AhhHTXQ8 | 218 |
lm_eval/tasks/ceval/ceval-valid_college_chemistry.yaml | sha256=0rhGE5axuBh5O4Z4aZRaOuQ0usiuTJd-CtAvKpxI9NE | 218 |
lm_eval/tasks/ceval/ceval-valid_college_economics.yaml | sha256=Y9xrtTT-BiinFOkkqI7nWi4GyB1bxiOHh6pRPff3-AQ | 221 |
lm_eval/tasks/ceval/ceval-valid_college_physics.yaml | sha256=JJfHph_isVStbsk2yIav4A5iqmLWNf1EAmCFOIUjk5Y | 214 |
lm_eval/tasks/ceval/ceval-valid_college_programming.yaml | sha256=FYNlc9mHqfoLCAdtjx3aiaPq-HuI0c2zNDQp8AaE6wo | 222 |
lm_eval/tasks/ceval/ceval-valid_computer_architecture.yaml | sha256=vGZ__iGOj0_nX7aVWX3qCDYrr2eEJ1mJj7k59NG3CTs | 229 |
lm_eval/tasks/ceval/ceval-valid_computer_network.yaml | sha256=gPMX8lN2YMGH9QYaKBEXProfP_MA9XV4Lx_udMr-ktQ | 219 |
lm_eval/tasks/ceval/ceval-valid_discrete_mathematics.yaml | sha256=a9wuabDadH9CgiyQc5uW1lld4vAeaJYv4mPTx5u-Ujg | 224 |
lm_eval/tasks/ceval/ceval-valid_education_science.yaml | sha256=KiFoKyLZHkaDYdWCAZ45k4K_GglR3MDJGheeHWDgSbM | 215 |
lm_eval/tasks/ceval/ceval-valid_electrical_engineer.yaml | sha256=DjZ62r5DtU_XIS1K-MUbQqbigXYd6YCQI7LBYdXhB8Y | 231 |
lm_eval/tasks/ceval/ceval-valid_environmental_impact_assessment_engineer.yaml | sha256=S-HPmH9da8gLu8lh_2YZ4XwV5Hog7JPJJEbxVkbd0Kk | 279 |
lm_eval/tasks/ceval/ceval-valid_fire_engineer.yaml | sha256=aTajwMc0EjalqD3Rx5O6BUX3slgolA8lxLSjF0NvDlE | 219 |
lm_eval/tasks/ceval/ceval-valid_high_school_biology.yaml | sha256=KMO3L-P6JFdCwkH5431YBOImX-oWGi6A9gmtvyCq-EU | 222 |
lm_eval/tasks/ceval/ceval-valid_high_school_chemistry.yaml | sha256=YdpYxhBFLDoKk9gz6UiZa6TBuqrdRH8FnZmG2NZiuL4 | 226 |
lm_eval/tasks/ceval/ceval-valid_high_school_chinese.yaml | sha256=6L4ePI81IW_ssklfqriFt83X8vMZ4b0gm_oAkpDXkqA | 222 |
lm_eval/tasks/ceval/ceval-valid_high_school_geography.yaml | sha256=rPDd_fm_nqM530JAWLG7PmYyCFux3wOZf50gdZBBRVY | 226 |
lm_eval/tasks/ceval/ceval-valid_high_school_history.yaml | sha256=SEMX0dqEXZjsvTn1JP_3ECBZ0M56I4WBKFbw0XWI8No | 222 |
lm_eval/tasks/ceval/ceval-valid_high_school_mathematics.yaml | sha256=j45jE6-jfXFcdkLZFY2jPwexDnqiBkqilwC9a5vsM04 | 230 |
lm_eval/tasks/ceval/ceval-valid_high_school_physics.yaml | sha256=lTuM6LCjO9SlruoHX3xepebj46l_0ZK_N5l5HZmys6A | 222 |
lm_eval/tasks/ceval/ceval-valid_high_school_politics.yaml | sha256=T6HS-hthajC2NJi5NFKkD0XDxmXmKHCNuhBbhntddpU | 224 |
lm_eval/tasks/ceval/ceval-valid_ideological_and_moral_cultivation.yaml | sha256=hmHJ5O9v3iXt-j8xHO7UeCMWE6A6FB-dciyljq9xSqM | 271 |
lm_eval/tasks/ceval/ceval-valid_law.yaml | sha256=QmrSRhjMC5K7OQDTz2_r52HJVZWWv4xjrptwmY5NKzA | 184 |
lm_eval/tasks/ceval/ceval-valid_legal_professional.yaml | sha256=rQMWxpcWt2Y1bhoSgaUP5US4OXVbPvTSxvU_J90dwHk | 226 |
lm_eval/tasks/ceval/ceval-valid_logic.yaml | sha256=mnuTRJO3tYKeySn2n3B-92InjPvz3t0mhf-UaKGcHgI | 191 |
lm_eval/tasks/ceval/ceval-valid_mao_zedong_thought.yaml | sha256=z4BrjRmSCh96ieu9MCmc9J-vy0PnBdxKYO7Q8lUjenc | 268 |
lm_eval/tasks/ceval/ceval-valid_marxism.yaml | sha256=3KjhPFk4w9kpVzl1WD9Va4EOAkux32iBqrfQ1UIP9s8 | 213 |
lm_eval/tasks/ceval/ceval-valid_metrology_engineer.yaml | sha256=YqiCDiJ4bphneVAIjweU5Qqc4uck_s_iuIzMT9HF_kQ | 223 |
lm_eval/tasks/ceval/ceval-valid_middle_school_biology.yaml | sha256=Ic-e39wEVx6NScOoCbkA7dciQ-Y2wt0QFmN0kWVTVEk | 226 |
lm_eval/tasks/ceval/ceval-valid_middle_school_chemistry.yaml | sha256=CJ6HyS-6Nlcp-wi0yb74zdqUPL_zQWdTf9oTYQcCGO4 | 230 |
lm_eval/tasks/ceval/ceval-valid_middle_school_geography.yaml | sha256=Yh1mxAbsNan6WY4sH8eN5EI-oLw8psQ5PmGO1ZX-ZrU | 230 |
lm_eval/tasks/ceval/ceval-valid_middle_school_history.yaml | sha256=ckDHEb5npvsq2mdt4ICfkbk0eTlcZxHWlGJXax-1aIY | 226 |
lm_eval/tasks/ceval/ceval-valid_middle_school_mathematics.yaml | sha256=Mtt8szOofgOabzBBVLIPV67b7sDEECndzOAz057qlJs | 234 |
lm_eval/tasks/ceval/ceval-valid_middle_school_physics.yaml | sha256=oue8rUCV8h0MP0gx5emFPTOreBh6FSNhqNi_HEJtvW8 | 226 |
lm_eval/tasks/ceval/ceval-valid_middle_school_politics.yaml | sha256=pKqoZ560D8p0sJ6sEBanLv_ybuppFpvd8f-IYRCVl50 | 228 |
lm_eval/tasks/ceval/ceval-valid_modern_chinese_history.yaml | sha256=ISjUEGRMxv2nQGf50IbxoQEMA4hLHUchXO5wWT_ams8 | 231 |
lm_eval/tasks/ceval/ceval-valid_operating_system.yaml | sha256=1r9lC8brpfqm4D1lX1_0avgSZXwAm3xq48WtLYxtCxE | 216 |
lm_eval/tasks/ceval/ceval-valid_physician.yaml | sha256=JV3vjt37Cmnv0fGCQzjpvCxGljASNTJQj3fO8Xt0WY4 | 202 |
lm_eval/tasks/ceval/ceval-valid_plant_protection.yaml | sha256=XxzSPV-7R2X6nOiqWM_PhKeMtIT9WOwVvkNCc71KZNM | 216 |
lm_eval/tasks/ceval/ceval-valid_probability_and_statistics.yaml | sha256=Dm-WFp5dusbxLucUCEqRkmcbgIGnNjYoMXsmYbYJ5UY | 236 |
lm_eval/tasks/ceval/ceval-valid_professional_tour_guide.yaml | sha256=LMS9fyh7Zmt8grr4CBQGccGHPAKuj0RZAj3XQGzmyl0 | 230 |
lm_eval/tasks/ceval/ceval-valid_sports_science.yaml | sha256=6rgkkmJCxopoPNedAkIhWVpGzhdcB4ztYO0EmUk_9rc | 209 |
lm_eval/tasks/ceval/ceval-valid_tax_accountant.yaml | sha256=dHhlfeqH_HUlTkKbWzOJNaYXzAE1c9FWejT_3XBiGhU | 209 |
lm_eval/tasks/ceval/ceval-valid_teacher_qualification.yaml | sha256=msYhw4RmvIXosDstJVb1l7wUs_-hokMOFY1UFSTteHc | 226 |
lm_eval/tasks/ceval/ceval-valid_urban_and_rural_planner.yaml | sha256=lqXQXjQI4jxIQ3_iNIaTQE1CJ3OGg5UzEcL0NIiQRgs | 239 |
lm_eval/tasks/ceval/ceval-valid_veterinary_medicine.yaml | sha256=g9Ui3hPL64eumBGsuKUE1xgiCKFMFzt8hqbJ14pbu90 | 219 |
lm_eval/tasks/cmmlu/README.md | sha256=gyA3hrGDwuWy4mtFMPgxWXleKApdjgbKmiiWi0t9CMk | 1748 |
lm_eval/tasks/cmmlu/_default_template_yaml | sha256=3r35-Pc74RZ3JDDS6PnRzO9EGVgNdgF9W_MzFga5I-Y | 497 |
lm_eval/tasks/cmmlu/_generate_configs.py | sha256=M1umn9sa6LYSd-F4RDjYnBM7rj7wXcK09NjROTyn-mA | 4687 |
lm_eval/tasks/cmmlu/cmmlu_default_agronomy.yaml | sha256=DqvlHZ1g4sDq5lFUjDzk8Xu7LdpfOajsqgD5COLsnio | 191 |
lm_eval/tasks/cmmlu/cmmlu_default_anatomy.yaml | sha256=SKazmZTenePltXz5i7wj33uM-zwAjWTmKcd0ngzEjOM | 192 |
lm_eval/tasks/cmmlu/cmmlu_default_ancient_chinese.yaml | sha256=zQ5j11KOJ60Q0n3IJ2SNGFkx01I0Qy6p6i-RQTQC8_8 | 208 |
lm_eval/tasks/cmmlu/cmmlu_default_arts.yaml | sha256=qNkb7UTvtgXF9JcHo8qSYW6O22tZgLSuPzvoklCL0zw | 186 |
lm_eval/tasks/cmmlu/cmmlu_default_astronomy.yaml | sha256=lgF3qfC_2bQc4NEklG6vnwmhy1GvfogpgRSYfoijulQ | 196 |
lm_eval/tasks/cmmlu/cmmlu_default_business_ethics.yaml | sha256=TdFBk1ool2z3ihnnk5LHraT6R_Feo_F_p5at9JT3HcY | 211 |
lm_eval/tasks/cmmlu/cmmlu_default_chinese_civil_service_exam.yaml | sha256=l7wFBEEn_BtahJVHQL6cI7azQeWSs3hX-2XdHX-CjhM | 242 |
lm_eval/tasks/cmmlu/cmmlu_default_chinese_driving_rule.yaml | sha256=0Uj-zYoT4yeQqOqBfIXi_IpYzyQPcHMCf1dS9ma2LKc | 227 |
lm_eval/tasks/cmmlu/cmmlu_default_chinese_food_culture.yaml | sha256=EMIfT1GJluls12hfxlmTgfNKevRuzV9XWkoGTzO0djI | 227 |
lm_eval/tasks/cmmlu/cmmlu_default_chinese_foreign_policy.yaml | sha256=1yuG2_1A9Oe4_o_Bl7uJKOv3Qfqv9r6JYAD1P6L3AHg | 231 |
lm_eval/tasks/cmmlu/cmmlu_default_chinese_history.yaml | sha256=vYox5jq9_vm04ClPytEiqluf8oiJ7Y2Yl8dwphd_ukY | 211 |
lm_eval/tasks/cmmlu/cmmlu_default_chinese_literature.yaml | sha256=6vFl0vmSFAeLBtcyn9utf7YGQMtiJEOjxR1XtmmeN7k | 217 |
lm_eval/tasks/cmmlu/cmmlu_default_chinese_teacher_qualification.yaml | sha256=Ofur5dABRspuog_bL39FTQcJ6cqSj3B1pjJTeparuPg | 245 |
lm_eval/tasks/cmmlu/cmmlu_default_clinical_knowledge.yaml | sha256=ReXbIW90A0BZ3NGOysUraRr1n4Ugto-Pl8z3CPPU4aA | 217 |
lm_eval/tasks/cmmlu/cmmlu_default_college_actuarial_science.yaml | sha256=vvVIOnXSEG-J9OcEFf4G3qGpGBRkfrKb8x1_oJrruK4 | 234 |
lm_eval/tasks/cmmlu/cmmlu_default_college_education.yaml | sha256=9AUMkRL72eBk2UnWaDBtmgdrh0EQZait775LloIZq7M | 218 |
lm_eval/tasks/cmmlu/cmmlu_default_college_engineering_hydrology.yaml | sha256=HBihPhmNhTPj7_LSB939YL_o8zOI8vsuTXuEK8F2yd4 | 248 |
lm_eval/tasks/cmmlu/cmmlu_default_college_law.yaml | sha256=FWe0m1K9JmnVTcfXW5Fbsv2tE3LGBfNhSxLXrVi4pSk | 203 |
lm_eval/tasks/cmmlu/cmmlu_default_college_mathematics.yaml | sha256=1os_um2HNCfbbRJYM6IKAG05I2_QsiSrmW9OaHLNGwo | 219 |
lm_eval/tasks/cmmlu/cmmlu_default_college_medical_statistics.yaml | sha256=z6LJZK45Tf9gj9LIx1TjjuaH8LACReSz43ObiNTvd0A | 239 |
lm_eval/tasks/cmmlu/cmmlu_default_college_medicine.yaml | sha256=iIQRLQfEx3ZCtcRqHE5Il1XDqjqaHaV8oAdM2ihWCC4 | 213 |
lm_eval/tasks/cmmlu/cmmlu_default_computer_science.yaml | sha256=64z6rFtry_E0LS5opBBaBcHXzmOW1lg9Y1wh1lNx1Cg | 216 |
lm_eval/tasks/cmmlu/cmmlu_default_computer_security.yaml | sha256=iCYXgKnc8GpnHAwHPZq1-XbXzwZ9AlBuANlQ66Wj1Sc | 218 |
lm_eval/tasks/cmmlu/cmmlu_default_conceptual_physics.yaml | sha256=L_DkqkfoMI1kBneIXn9W3r-zZ7rG0bp_dceUOlqaVWU | 220 |
lm_eval/tasks/cmmlu/cmmlu_default_construction_project_management.yaml | sha256=1tMoBrlqts3rgxwRgVUu8tRR9td8S8_54LPZyOKRgZQ | 249 |
lm_eval/tasks/cmmlu/cmmlu_default_economics.yaml | sha256=bai4ZwJBfG7OAN_uSS-uajVt-HOrUw9nNwK4f9R53RI | 196 |
lm_eval/tasks/cmmlu/cmmlu_default_education.yaml | sha256=JHFLezPEuR8vINuJ7fiq5vrMMaWieyW3HXoWsdpOWnw | 196 |
lm_eval/tasks/cmmlu/cmmlu_default_electrical_engineering.yaml | sha256=pVHvc_MRieXI3ff7WJpKkQV1uaap3II7-BuzkAwrHiY | 225 |
lm_eval/tasks/cmmlu/cmmlu_default_elementary_chinese.yaml | sha256=P4jiuRXU5OqjvlpDkjFJHl4RLu7b5LaTmbGrmvseYMI | 217 |
lm_eval/tasks/cmmlu/cmmlu_default_elementary_commonsense.yaml | sha256=OlTYX9qyhhu4u5VYFDtUGEFicu-VPNLmNU1Juq8uO0w | 225 |
lm_eval/tasks/cmmlu/cmmlu_default_elementary_information_and_technology.yaml | sha256=hAPmn31ac7hFTFl283vhK1jPjJm5tv6VchLKQgb3yPs | 261 |
lm_eval/tasks/cmmlu/cmmlu_default_elementary_mathematics.yaml | sha256=D8ne6N6tJCsPzWqlF4qxy6oBgkmjb6Jqy5DKw-xJMnU | 225 |
lm_eval/tasks/cmmlu/cmmlu_default_ethnology.yaml | sha256=OhNfsDxIuIA7ADIMc2SYiWjMtEw_DehtcQSIbXTbxc4 | 196 |
lm_eval/tasks/cmmlu/cmmlu_default_food_science.yaml | sha256=fItOTnSEaBqDxokXTmY62WJI8orHAo2EL6HHAA_6z8A | 205 |
lm_eval/tasks/cmmlu/cmmlu_default_genetics.yaml | sha256=TOWNyAd8uOc1NrZkjgDMuYBDKaW1Ft8xJRABwMZYenk | 194 |
lm_eval/tasks/cmmlu/cmmlu_default_global_facts.yaml | sha256=-jZNUBh1qBrRVz70BfV4WWjhDwS4jsH5G9yipyKDHfE | 205 |
lm_eval/tasks/cmmlu/cmmlu_default_high_school_biology.yaml | sha256=pX2-airA86ZU5pUjewxjdlcLs-9FWHUUUiAnzBubrwQ | 219 |
lm_eval/tasks/cmmlu/cmmlu_default_high_school_chemistry.yaml | sha256=Q1ZBG8Wp9ab96l19PRwod9Dll5skvlB96x2A1Jmnfc0 | 223 |
lm_eval/tasks/cmmlu/cmmlu_default_high_school_geography.yaml | sha256=G0VrkoUMzKtEm1kzOuEwPdq2vtlkc0KMDMsEGF6t1ds | 223 |
lm_eval/tasks/cmmlu/cmmlu_default_high_school_mathematics.yaml | sha256=wB7tBE5a9SWghbkP6dRakza_3PpSt-wkmTrd0bQpUEc | 227 |
lm_eval/tasks/cmmlu/cmmlu_default_high_school_physics.yaml | sha256=-QcmeommiYmIqCYaLVsaars-u6VKnqzbIoaf7Uz3Tmg | 222 |
lm_eval/tasks/cmmlu/cmmlu_default_high_school_politics.yaml | sha256=kKjyp_zDx4tsAJkWmzBCqp6Ubx2hhriEl-PiI6GHRys | 221 |
lm_eval/tasks/cmmlu/cmmlu_default_human_sexuality.yaml | sha256=IB0QxIhbKjAmhT77CJqheViIVw-2sZ3_kWpeyDcFAOw | 214 |
lm_eval/tasks/cmmlu/cmmlu_default_international_law.yaml | sha256=9luncjc_o4MvJjIYSznbT4ljfGEkrQdiaxYRajAnREA | 215 |
lm_eval/tasks/cmmlu/cmmlu_default_journalism.yaml | sha256=Tzhv5LmPa9-RTrok-GBgGc3mag4AmPIUVJKYqhzA_-c | 198 |
lm_eval/tasks/cmmlu/cmmlu_default_jurisprudence.yaml | sha256=OVAiNRVJBAUmw7ON2CX1cP44BUv7TktZW0ufOC6Zgco | 204 |
lm_eval/tasks/cmmlu/cmmlu_default_legal_and_moral_basis.yaml | sha256=YbQTOpGYrKJr5TOKzEWrUl3FO6zQtu1pAwjGCnmPRik | 232 |
lm_eval/tasks/cmmlu/cmmlu_default_logical.yaml | sha256=4lpQg10BWCqLyepRgXn4fcazO9J6YKiZvoWhgRJTytw | 192 |
lm_eval/tasks/cmmlu/cmmlu_default_machine_learning.yaml | sha256=yTSdJ2qB6hVZ-I1M3V8IQshSThOugOI_2H3ECNdeoig | 213 |
lm_eval/tasks/cmmlu/cmmlu_default_management.yaml | sha256=xj0wH_La-bf_Ezx9mjmsbY07M4UdTXbkzCqGdnzJkRk | 198 |
lm_eval/tasks/cmmlu/cmmlu_default_marketing.yaml | sha256=l7ulx3Nr47Ai4-MwPSvr64j1cKF8hG0wpkUHNKVkuTU | 199 |
lm_eval/tasks/cmmlu/cmmlu_default_marxist_theory.yaml | sha256=d7XeZBoxxtzm9rf4WrjcChH5-RDT00XgITU9QJXKkBA | 218 |
lm_eval/tasks/cmmlu/cmmlu_default_modern_chinese.yaml | sha256=M2gRRZy54c8e6CeJu69yNAoP6c9NpDfSMlVyD_0pMvk | 209 |
lm_eval/tasks/cmmlu/cmmlu_default_nutrition.yaml | sha256=yLQYVLdRY1MUc4NaCidmrFlsDAWaBmI4tp9r3DLzjqY | 196 |
lm_eval/tasks/cmmlu/cmmlu_default_philosophy.yaml | sha256=IlGz2CINUIAzbvlLbnAbXOdNsxCyO2rmwSnwB9iqF_8 | 195 |
lm_eval/tasks/cmmlu/cmmlu_default_professional_accounting.yaml | sha256=TgYE1xSlF2MBJW7fnisY7-dwcJlxTU-lKJDmf3nS5HA | 227 |
lm_eval/tasks/cmmlu/cmmlu_default_professional_law.yaml | sha256=S86GwVZZw3ilxfFvxpvZg5Rsl1sn-nUllYx5VFktinE | 213 |
lm_eval/tasks/cmmlu/cmmlu_default_professional_medicine.yaml | sha256=o9w1kA9-L1J72EuQ7V2kq1YhlUIS4ovXVhoQ44GLcbY | 223 |
lm_eval/tasks/cmmlu/cmmlu_default_professional_psychology.yaml | sha256=w5wE-YswhIPdQp1NWW2U09hYs3Rd64bvb6ZGupYucTk | 230 |
lm_eval/tasks/cmmlu/cmmlu_default_public_relations.yaml | sha256=jblBswd7hMbPfweUa-5hVEp43oNF24v4MeWRuea8Q3U | 213 |
lm_eval/tasks/cmmlu/cmmlu_default_security_study.yaml | sha256=CFKa_RoDtHDkHrXyyS9FNp_HI6vGCV7XaogP2cjVHyk | 209 |
lm_eval/tasks/cmmlu/cmmlu_default_sociology.yaml | sha256=Qzr4AiRoyPHtIISXvBN8_XAXltIO9GdMYr7xYXk9Atc | 196 |
lm_eval/tasks/cmmlu/cmmlu_default_sports_science.yaml | sha256=wD1eTg1JgFg-rnglXDDM--owRRq94g6st7GA3zZiXkA | 206 |
lm_eval/tasks/cmmlu/cmmlu_default_traditional_chinese_medicine.yaml | sha256=fs7VxHpIsAqdW52e-ffc6ClIdomsVPGzQKyiuGTTNs8 | 237 |
lm_eval/tasks/cmmlu/cmmlu_default_virology.yaml | sha256=aB_oTbDjh76nGH9rIkNhcbygJJkmckEBj7ehe_BVSd4 | 194 |
lm_eval/tasks/cmmlu/cmmlu_default_world_history.yaml | sha256=AWCZJjmwhJobrzPCUpNRKh5F_ieCDWuhQv4H6uq0mZA | 207 |
lm_eval/tasks/cmmlu/cmmlu_default_world_religions.yaml | sha256=v39HzwxSXp2xo5Ap_Ig1sGcdT0XkiDKRBsiPnI7J05I | 211 |
lm_eval/tasks/code_x_glue/code-text/bleu.py | sha256=YRP1MQN3XiS7ZfHMYS1fWXlwIJTwr0J8qDDGdpx7xfM | 7862 |
lm_eval/tasks/code_x_glue/code-text/go.yaml | sha256=w5oNioGJZyk5gbxdFmT-CSbGCdeigFA2CrvX92pZCYU | 479 |
lm_eval/tasks/code_x_glue/code-text/java.yaml | sha256=69hm7ydw5N7dhYz3LWzQGdTDtqROMYfFxXZHObILw4Q | 483 |
lm_eval/tasks/code_x_glue/code-text/javascript.yaml | sha256=pITf4Jr8fItJRcx0CQX0cb7P_4-DDFuIr0eSB3Tkyfo | 495 |
lm_eval/tasks/code_x_glue/code-text/php.yaml | sha256=OrDwislORoyzMwc_yLScurrSiet35X_tBQw5DflXMo8 | 481 |
lm_eval/tasks/code_x_glue/code-text/python.yaml | sha256=xeEVYgLVJdOG9gZcNgi2sbRB_XYsLNqB6HrXjiq3_aA | 487 |
lm_eval/tasks/code_x_glue/code-text/ruby.yaml | sha256=g8aSCIHTdJ1QXL_0zui4riIQzTuEiGIOSjr4zQmYkEI | 483 |
lm_eval/tasks/code_x_glue/code-text/utils.py | sha256=MhYi4IyBmZC4PuwDwNUwljLxa9nQKcCaCtoNgAuiecU | 310 |
lm_eval/tasks/code_x_glue/code-text/__pycache__/bleu.cpython-39.pyc | sha256=KgmtlozdjO7jrHE38caYNvVp-QwNPsQwb2UkNCSubtQ | 6137 |
lm_eval/tasks/code_x_glue/code-text/__pycache__/utils.cpython-39.pyc | sha256=XStqkfI5Mbx1JFOsKlg5sp0nYl38fCYWn3SmBcJs-tA | 563 |
lm_eval/tasks/coqa/README.md | sha256=LF6N0XSwsg6DLYACWr5FJca7bRlUYib00tGPHNiSzg0 | 1262 |
lm_eval/tasks/coqa/default.yaml | sha256=w3avxjGht-8SDSXeTecV3LtgbmHbT7gOY34YOnPUoHY | 568 |
lm_eval/tasks/coqa/utils.py | sha256=rQUwtHsatPLBmkdf5QlqCvi4WPTRhWFh76JcjSW_vig | 2839 |
lm_eval/tasks/coqa/__pycache__/utils.cpython-39.pyc | sha256=TQNkpjx35Igjz14Gcdc3JU49WGLYLSJhGhPc18hNsEY | 2634 |
lm_eval/tasks/crows_pairs/README.md | sha256=HesNVCLZST9DTRBTjxbAOIwzKG9UGaR9CuPVIrQUz3I | 6562 |
lm_eval/tasks/crows_pairs/crows_pairs_english.yaml | sha256=M2673tkeoGmXCxPzpZeO6zETHAgCsbC3Nn6wpBg7B4s | 552 |
lm_eval/tasks/crows_pairs/crows_pairs_english_age.yaml | sha256=g15ncf9B-uj8jpnGspHMF_tkTgytHxTFDEQheq-r5jE | 127 |
lm_eval/tasks/crows_pairs/crows_pairs_english_autre.yaml | sha256=-ZVZSt0RkemIKAHx-qM_Zf6WYphWFbtpKFTZqN4zer8 | 131 |
lm_eval/tasks/crows_pairs/crows_pairs_english_disability.yaml | sha256=FDuoBS89Bt4XnXT1qO4G3AKaLzRtjUr9ty_essY5ms4 | 141 |
lm_eval/tasks/crows_pairs/crows_pairs_english_gender.yaml | sha256=Jp_bpHin0LDl4Oh_5dw7DsnPIdw27_L7IvCSlt5-soc | 133 |
lm_eval/tasks/crows_pairs/crows_pairs_english_nationality.yaml | sha256=Xq_gMqx84YOsPB85t-mg-WowqOC9wGZAjti5s1vxZEE | 143 |
lm_eval/tasks/crows_pairs/crows_pairs_english_physical_appearance.yaml | sha256=rHxnfaefCxo-yW1nSA6odWsGWM1nuZ4qO7mY0_U3akY | 150 |
lm_eval/tasks/crows_pairs/crows_pairs_english_race_color.yaml | sha256=1TcaZQ2Vq0XQPalvOSvlpKZ43gzWOJ2_cwokusrppt0 | 141 |
lm_eval/tasks/crows_pairs/crows_pairs_english_religion.yaml | sha256=TL4EheFGZbH1g13jyDFTx83tcLFoGijbuxv34HuCp8s | 137 |
lm_eval/tasks/crows_pairs/crows_pairs_english_sexual_orientation.yaml | sha256=fkwnSl7AJI3zbmuWD2lWGOE7tiuRumRN1uINS0QI-d4 | 150 |
lm_eval/tasks/crows_pairs/crows_pairs_english_socioeconomic.yaml | sha256=uDwc7LsQC_Ws-4PsFQ8tc5vDkU98PxGzg4xz012Zi7w | 139 |
lm_eval/tasks/crows_pairs/crows_pairs_french.yaml | sha256=fz9gbMutyCHqm_OKj0xqqkr0Z3b3DLbQa54fAPAZ-dE | 80 |
lm_eval/tasks/crows_pairs/crows_pairs_french_age.yaml | sha256=p5WCzdbPIkilp8qG0fZGWG3dHjKr7ynX6PUP5GAWsN4 | 125 |
lm_eval/tasks/crows_pairs/crows_pairs_french_autre.yaml | sha256=nWk1CtmS4rPNxHuhp4fq4_r8MXmjO0PZUes6Cl5kW7E | 129 |
lm_eval/tasks/crows_pairs/crows_pairs_french_disability.yaml | sha256=JHuqbu8Z8VflYRzJF2KnYGdIshBae9AmYptl84dW_wU | 139 |
lm_eval/tasks/crows_pairs/crows_pairs_french_gender.yaml | sha256=I9YDvpOnQXTMWOH1smjEs1nDiDeQP3Emq-XN2SUfWQ0 | 131 |
lm_eval/tasks/crows_pairs/crows_pairs_french_nationality.yaml | sha256=ViElfWF8v9_JzWlhqosZtkA1WEuYCqwl__1eM0bByAg | 141 |
lm_eval/tasks/crows_pairs/crows_pairs_french_physical_appearance.yaml | sha256=Hv8VGBgSbJRy7ituauUmgxxFc3aPMJiwPLEDuk1W4L4 | 148 |
lm_eval/tasks/crows_pairs/crows_pairs_french_race_color.yaml | sha256=WIbsZhtI3CTC1tYI0QuVtHRatNinqWWVbEhCFqadzLg | 139 |
lm_eval/tasks/crows_pairs/crows_pairs_french_religion.yaml | sha256=n19G-AGyzTMp8dPGUcS-1TuCs90O9vR1np7oxn9RzhM | 135 |
lm_eval/tasks/crows_pairs/crows_pairs_french_sexual_orientation.yaml | sha256=zg4UOJEM1CnKu933_I8NXpyM3pADeihBpMFOjrsWKpA | 148 |
lm_eval/tasks/crows_pairs/crows_pairs_french_socioeconomic.yaml | sha256=N5rktYPTmeZkQDPZw6mGZL5GhBdmyE9hkxtd__lh8GA | 137 |
lm_eval/tasks/crows_pairs/utils.py | sha256=Wx48MYgKgqn-kHLhTtsV_-FD0Ik53l0X_qF8LcL-DBY | 1892 |
lm_eval/tasks/crows_pairs/__pycache__/utils.cpython-39.pyc | sha256=JGsGcR9EYtQlu9SWjIbyTt6TteeJvVjeQUynLcbPrCA | 2370 |
lm_eval/tasks/csatqa/_default_csatqa_yaml | sha256=nxl_fXyNo-ktSqXL7NEZVyEaltJpM71e1lndcGOqE9Y | 393 |
lm_eval/tasks/csatqa/_generate_configs.py | sha256=AGNXvD78TBDsFv0u9OP8PB3zcqPftSjpx6MaVfRi9a0 | 1438 |
lm_eval/tasks/csatqa/csatqa_gr.yaml | sha256=WfwUoa2uX8gOjaQfcVDUvVSVkWCmbJBjiv7KBpjHZ5w | 75 |
lm_eval/tasks/csatqa/csatqa_li.yaml | sha256=ZRwynLR8BVgxgFcSDTLi_WoHpkYAtmG6iJhLhr8KUFQ | 75 |
lm_eval/tasks/csatqa/csatqa_rch.yaml | sha256=hciObdoI5LBjMc0eM3fFX3fc-uKpuIIt-02-0-5K5Q8 | 77 |
lm_eval/tasks/csatqa/csatqa_rcs.yaml | sha256=8bSnj6bbts-sRbYrXpzM7OITuxED7VuIMiUzzo9xMPY | 77 |
lm_eval/tasks/csatqa/csatqa_rcss.yaml | sha256=-GoC4clrkSwJLOFkxa6TOEwin1PeTaKfy-Qw6BpHogc | 79 |
lm_eval/tasks/csatqa/csatqa_wr.yaml | sha256=ovjDaNGHTq38vQ3RROv4ppR09nQyVN6RMEsGimHfiL8 | 75 |
lm_eval/tasks/csatqa/utils.py | sha256=thFD-3JzYceDfR055-F6NhjxFLaEoAxF3b6E4ehwea4 | 662 |
lm_eval/tasks/csatqa/__pycache__/utils.cpython-39.pyc | sha256=zFW2IxYFLg5Aar_dlxWq6ML620q9lbKu_yDt0CVcXoY | 957 |
lm_eval/tasks/drop/README.md | sha256=_fto2NjX5LFKc6jv6Ip5dM7V-viFzt8sGlqcxBM7OJI | 1857 |
lm_eval/tasks/drop/default.yaml | sha256=ge9lSWsbRgWni0my5vUIf9Ox1w3lJEFfVYNVs4JiZSM | 602 |
lm_eval/tasks/drop/utils.py | sha256=79pxK4m_9kudfFmFOGCALYu64n0E3cMVAK6Gv-AYRAk | 5987 |
lm_eval/tasks/drop/__pycache__/utils.cpython-39.pyc | sha256=JMuijRFJ4_j10J5F1rGBCoYK72LhkcdvhLDV0bwTFso | 5949 |
lm_eval/tasks/glue/README.md | sha256=qdUL658CcnzXewbDaGiiZozAeCg_W-Pm2iD--sE5B10 | 3879 |
lm_eval/tasks/glue/cola/default.yaml | sha256=FudXMiTevWXPcxorqQC5PJHBFKjx_r1ROpD3U0z9E4w | 392 |
lm_eval/tasks/glue/mnli/default.yaml | sha256=hSmd3Jd1ox4Ks5kW_8rqvZ7KvB4UMoFU2VxLq-yVUqk | 311 |
lm_eval/tasks/glue/mnli/mismatch.yaml | sha256=hL3bcKRBMnyGsLBIOHfu1j8WsYTe8TGLrkSW6SIrvNQ | 110 |
lm_eval/tasks/glue/mnli/utils.py | sha256=2zCZu6crR6KQGCIbvKmp1E8EO1v0-8nfk7gIFoe6iV4 | 232 |
lm_eval/tasks/glue/mnli/__pycache__/utils.cpython-39.pyc | sha256=DKnp5FeQaX0SKL5om-nyOm2NhKqHas0VJ4CgPYT-UDQ | 435 |
lm_eval/tasks/glue/mrpc/default.yaml | sha256=LfUNoQsfzbVSQJmsYV96xUGq_-ROy8UwpyYCvHmhVhU | 389 |
lm_eval/tasks/glue/qnli/default.yaml | sha256=74SSOsDUfbLXh2colA7AXQ8Nt-ZvrCVp3GhBCY8Q2nY | 349 |
lm_eval/tasks/glue/qqp/default.yaml | sha256=9rMGaRfLIqWUJELYOZQ21c8z_Ant13GbvMBPh7pAxlc | 356 |
lm_eval/tasks/glue/rte/default.yaml | sha256=MS6ENzmO48t1Gh0YFABIJKx9IvRtH1igjlGgVqcoVdg | 327 |
lm_eval/tasks/glue/sst2/default.yaml | sha256=a_Pe2cSPXxH08_Gwufm0Taoy1ApgvcLN0EpELcXRzho | 345 |
lm_eval/tasks/glue/wnli/default.yaml | sha256=jn0pgCoQZUms-4bP3VaSptLke9a_JoimPq6UoD2i2U8 | 329 |
lm_eval/tasks/gsm8k/README.md | sha256=UDYib3sADm37wgpYMNQkRXfmaqJJDVqn4ioy9F4GxP4 | 1950 |
lm_eval/tasks/gsm8k/gsm8k-cot-self-consistency.yaml | sha256=bp-Qplbh2v69aqJhkrHX40bic-hxIfdzhh3ahie6Fnc | 974 |
lm_eval/tasks/gsm8k/gsm8k-cot.yaml | sha256=P87OrlJivWMfjv4bqCPbDL2ZDKHHiFh5lbhgAYIqWvw | 2949 |
lm_eval/tasks/gsm8k/gsm8k.yaml | sha256=NZNmw-HDypgvZ2sjfWcFtwNZG9EFP7f3YZsf6vsg6fs | 799 |
lm_eval/tasks/headqa/README.md | sha256=HGBlwCx5skNA9GKsXv59G3s-08i577g4QSgv2sQrK5s | 2582 |
lm_eval/tasks/headqa/headqa_en.yaml | sha256=cYLcqHtz4NKZ8snLIUGdfH5m8EI7E6fcNVCciGD8B-U | 578 |
lm_eval/tasks/headqa/headqa_es.yaml | sha256=SKIFepRQ_qX9euHAWhk0g8sm3OYDfaei2uQUpGfPWu8 | 57 |
lm_eval/tasks/hellaswag/README.md | sha256=0Sxbs3jgiuWJFMB0onpY-vhTxCZMWbDke8ElRFsiLfY | 2710 |
lm_eval/tasks/hellaswag/hellaswag.yaml | sha256=q_-PUH9svpAv658tsuklVLl64_rr3vt2Vs9gRxty6l4 | 482 |
lm_eval/tasks/hellaswag/utils.py | sha256=XRWYcDxab-AIjdEOQFKfGrMN8aHPtQjA8cKtVRkOuvw | 716 |
lm_eval/tasks/hellaswag/__pycache__/utils.cpython-39.pyc | sha256=wpBx-mC8BDH55zvCnQjX9DGzfFrF85Z-u7Vh-PvBsks | 1070 |
lm_eval/tasks/hendrycks_ethics/README.md | sha256=CHqVUCYMuODB2-sKYJWL_DHBAkMww7dEkVA4WXHDWVo | 1768 |
lm_eval/tasks/hendrycks_ethics/commonsense.yaml | sha256=sRtQV-KmrjuWmg0TYhFOUzSF8wmDKOUnQYwUaUP-PtA | 346 |
lm_eval/tasks/hendrycks_ethics/deontology.yaml | sha256=6VgrIemEILPa6yHeiAorYinA1ouDg2bfqmtC1JbHIHU | 359 |
lm_eval/tasks/hendrycks_ethics/justice.yaml | sha256=EHtKx2Ouw53LDHNGvhYmpQ0RVDOGl6jADRPtZGB7_OI | 290 |
lm_eval/tasks/hendrycks_ethics/utilitarianism.yaml | sha256=QEGqou_1154gCvJ7jNva8Kd072j8HK-MDVfuY5wk96M | 282 |
lm_eval/tasks/hendrycks_ethics/utilitarianism_original_yaml | sha256=D51G14NW3zCKcGjqeU_Z4gD22Vmu4Kt9rqKh4DYoOA8 | 589 |
lm_eval/tasks/hendrycks_ethics/utils.py | sha256=TYz5SgyhBjHVOjCMJCCBMVKexOHJwi-NBDvHE4qAoB4 | 691 |
lm_eval/tasks/hendrycks_ethics/virtue.yaml | sha256=_KlyeW331tOqZoDlC2qS5ahPowAQ9-HU9FciNX9YXkA | 299 |
lm_eval/tasks/hendrycks_ethics/__pycache__/utils.cpython-39.pyc | sha256=jqOq9zbvm71IzS_W6f0AhgyyUV6jsdXr6BhEQFCsnSI | 887 |
lm_eval/tasks/kmmlu/README.md | sha256=vKCq-CucNighrCOEXbwyW6uiBCeGaocnQ3my0iVVkhU | 2151 |
lm_eval/tasks/kmmlu/_default_kmmlu_yaml | sha256=s99xGAyoSJRqZPy3_6zUioWZejA_lPDBWZlZbwvVo5Q | 492 |
lm_eval/tasks/kmmlu/kmmlu_accounting.yaml | sha256=PnoIjRkInnWfb6wBaa89NAJBoHE8cttpIoSrPPYcC7s | 89 |
lm_eval/tasks/kmmlu/kmmlu_agricultural_sciences.yaml | sha256=DSAC6CstIVpHeLi_LY1ajRkh2RkIbIBqJCazJcihtGM | 111 |
lm_eval/tasks/kmmlu/kmmlu_aviation_engineering_and_maintenance.yaml | sha256=Ikr1qp-e73QffMDYCtuzVe_KoCpW9DyDwN74ldKEXs4 | 141 |
lm_eval/tasks/kmmlu/kmmlu_biology.yaml | sha256=Y3ZUD-CmlwvCn3c6CWPwkiRNIeSQ0CJu0pkuZkJ7hHs | 83 |
lm_eval/tasks/kmmlu/kmmlu_chemical_engineering.yaml | sha256=WqbfhDxdph4P_dkZhl7nu0Qrq6MRs_2sMpFnT-BHHl4 | 109 |
lm_eval/tasks/kmmlu/kmmlu_chemistry.yaml | sha256=N_ZJJvV7nrJ0Y6FYGeyIOkSfdOiHr_rhwaIzc_-c5Zs | 87 |
lm_eval/tasks/kmmlu/kmmlu_civil_engineering.yaml | sha256=MF7E3t9a-E8QDUD1D8bB-LmCemPUVQghGOMq4w2EeAU | 103 |
lm_eval/tasks/kmmlu/kmmlu_computer_science.yaml | sha256=lkbCtY54F_udXBougn_WbqlLNsNtIhxdFHvpF1q1lxs | 101 |
lm_eval/tasks/kmmlu/kmmlu_construction.yaml | sha256=MMfDCk53RXnUaSjkmxxjkEOL1l2MycUNxm-rWxxd8-A | 93 |
lm_eval/tasks/kmmlu/kmmlu_criminal_law.yaml | sha256=kjstmGkdkdelpegLAMsw4l5j-zDxdyHNA-9-fjOxmpg | 93 |
lm_eval/tasks/kmmlu/kmmlu_ecology.yaml | sha256=EK8qft9iXmSR2GQDVu-hs5WEBAZmc7j8vLQCW7A0byk | 83 |
lm_eval/tasks/kmmlu/kmmlu_economics.yaml | sha256=zL4d218PNW2jpL9jn7Oa6oRC7JDblGVFj3yuBo8Fyos | 87 |
lm_eval/tasks/kmmlu/kmmlu_education.yaml | sha256=NWOTVh1bqopcFlA7nN7UzjDN1k1ItxuJqs1pQs8AeeE | 87 |
lm_eval/tasks/kmmlu/kmmlu_electrical_engineering.yaml | sha256=KXYCI3H1aZhUgZg17-LBmZTW1iIjr9dog-2Y-vQrDqQ | 113 |
lm_eval/tasks/kmmlu/kmmlu_electronics_engineering.yaml | sha256=2GANVlbjK7-fDLBoqU9_eLyfQnzv4poBt-HG9uPmaHs | 115 |
lm_eval/tasks/kmmlu/kmmlu_energy_management.yaml | sha256=hg7hN9i0lQ6yY8AacXiJeaC-W1mQQxITxC-a82q36ZA | 103 |
lm_eval/tasks/kmmlu/kmmlu_environmental_science.yaml | sha256=fu8Uy7gWPWTIEN0J-sOGABjG2Ke_t-aIkx6N-En-1SY | 111 |
lm_eval/tasks/kmmlu/kmmlu_fashion.yaml | sha256=oNJS3i331vcOT08Cawdsj3sEzggcKys935hrxHuqPMg | 83 |
lm_eval/tasks/kmmlu/kmmlu_food_processing.yaml | sha256=_3aauAgjXMWaG52HTouA1QAgh3iyZypsvPyEyINsfV0 | 99 |
lm_eval/tasks/kmmlu/kmmlu_gas_technology_and_engineering.yaml | sha256=l1uElIgoDO1tCCgyF_uRJnGJxzSBHGwBMqD1ba30M8U | 129 |
lm_eval/tasks/kmmlu/kmmlu_general_physics.yaml | sha256=sdlZ41WUkRGE5cyImidyIiZUqjcKmS7a_sLlhBq3eL0 | 99 |
lm_eval/tasks/kmmlu/kmmlu_geomatics.yaml | sha256=iVO6SI7IqxlAAyc2w6_IOPwEoKhr0-4792vsAC1XdRQ | 87 |
lm_eval/tasks/kmmlu/kmmlu_health.yaml | sha256=fHQO5do6oQJWHiXp7J6LyKBHPfF-6oAOI91fYVSfxy8 | 81 |
lm_eval/tasks/kmmlu/kmmlu_industrial_engineer.yaml | sha256=GruQ5rA9FUJ8lrhrXrnjKd6ymDRT8hqfvjj5XrX4j3E | 107 |
lm_eval/tasks/kmmlu/kmmlu_information_technology.yaml | sha256=KZWp8Nt5GaEBiy09KewsJUNhdWBkE4u000Lae6oesoc | 113 |
lm_eval/tasks/kmmlu/kmmlu_interior_architecture_and_design.yaml | sha256=hidNhZXxiWOVb3BBPyrXgmMcV2lxRDOGyc6mvQs9O4A | 133 |
lm_eval/tasks/kmmlu/kmmlu_korean_language.yaml | sha256=JhGzy0in86fBO1_yOjAEg7MafJTad7-bEQ6VPJQfRaQ | 99 |
lm_eval/tasks/kmmlu/kmmlu_law.yaml | sha256=xhZw-OC7g22fd_tu1yQG_GDfZIpfP-yv_a1QMhhEidk | 75 |
lm_eval/tasks/kmmlu/kmmlu_machine_design_and_manufacturing.yaml | sha256=PRp1OMFEcjIMFv6IRwIgCsX2ujrVXQE69xcZ1EBSL_w | 133 |
lm_eval/tasks/kmmlu/kmmlu_management.yaml | sha256=eaQeFCuIdF8X75AExCnsQK7rcdyU99nTr1_IUT7xt50 | 89 |
lm_eval/tasks/kmmlu/kmmlu_maritime_engineering.yaml | sha256=ummh-dy6xBpYo0j1iCodyujBMu7t2o2iQzSjCsOCnbU | 109 |
lm_eval/tasks/kmmlu/kmmlu_marketing.yaml | sha256=SUxeOTwgzQ_svotNitwLZ0280Alv40ATLJCX6Fz_1Oc | 87 |
lm_eval/tasks/kmmlu/kmmlu_materials_engineering.yaml | sha256=Azd2RqZFuu1F56E2twcbAaKDpRbnhs6jNQcjvDDGZ4s | 111 |
lm_eval/tasks/kmmlu/kmmlu_mechanical_engineering.yaml | sha256=k3xNZavowNsG1halWZtEXguL9DhUTu97ydbyzueTEDk | 113 |
lm_eval/tasks/kmmlu/kmmlu_nondestructive_testing.yaml | sha256=7ZFU2fmhtExLOVJutKvRbK_6gZll78CfXq2WZ_6uoIw | 113 |
lm_eval/tasks/kmmlu/kmmlu_patent.yaml | sha256=03bCwJqW5rJqXDz1NJY5rJQTGgHwRxObFEbxfMpS2oQ | 81 |
lm_eval/tasks/kmmlu/kmmlu_political_science_and_sociology.yaml | sha256=-mvbD9Jjomi98TrTTRGGZIFo5HvDreuRw9QruKPhV8E | 131 |
lm_eval/tasks/kmmlu/kmmlu_psychology.yaml | sha256=v2bORzCSEZ4YNTxhHBLHYAwEnPvgeRTDuIcTloDOBmM | 89 |
lm_eval/tasks/kmmlu/kmmlu_public_safety.yaml | sha256=8IikRq3MWkxTAy_hOWMfMxV3UVsVDlvCOB3m0F8CKxM | 95 |
lm_eval/tasks/kmmlu/kmmlu_railway_and_automotive_engineering.yaml | sha256=farl59tLnWiodezJgf2EWjY8LUxWUNkMtsvtvZtygA0 | 137 |
lm_eval/tasks/kmmlu/kmmlu_real_estate.yaml | sha256=z0nTnFNOBOD5Kv_dkDwVAMkyc5CAdkdOzTziG-R2BO0 | 91 |
lm_eval/tasks/kmmlu/kmmlu_refrigerating_machinery.yaml | sha256=yDjEJc3Qwi02DSoJvaJySpdbF47vlXnlXb08xOZ7Dw8 | 115 |
lm_eval/tasks/kmmlu/kmmlu_social_welfare.yaml | sha256=qOysalmYQTHdkq1cGYrGnwTqJqqAO3sliUrG97te24c | 97 |
lm_eval/tasks/kmmlu/kmmlu_taxation.yaml | sha256=ndTnXwCkd0SrRDnt71GSavTbQjVicbaiU14hLBY4AEQ | 85 |
lm_eval/tasks/kmmlu/kmmlu_telecommunications_and_wireless_technology.yaml | sha256=xxuseW9A0EMzp7TLDSK18kwdi2-PJN8khyB8Jas3FbY | 153 |
lm_eval/tasks/kmmlu/utils.py | sha256=aDPnQ1oybssGOsSdLfyizuAcY0D9WuvODjP3u54ezpU | 691 |
lm_eval/tasks/kmmlu/__pycache__/utils.cpython-39.pyc | sha256=s_Y_ZQdIR3U-Uzdm9EdHvgLk69f1jFvoO8AMKghqeI0 | 886 |
lm_eval/tasks/lambada/README.md | sha256=AO7XlGGY1Dch3ZC6km8CkfwpLiOvAdYbHH_YlEi2xEg | 1186 |
lm_eval/tasks/lambada/lambada_openai.yaml | sha256=B39ynIgymIXdYLYiMVVc-yHuCYGj5FFSoDR0H5GHrXQ | 493 |
lm_eval/tasks/lambada/lambada_standard.yaml | sha256=uWLIOWKhj8LXBzw-uRjPqJ-mv2N0AAjDYgGInTsa0cQ | 503 |
lm_eval/tasks/lambada_cloze/README.md | sha256=j0ewRfQFxUQ6JsD-JGYp4oK1URb-uF1UGiQ-4cwYvs4 | 1934 |
lm_eval/tasks/lambada_cloze/lambada_openai_cloze.yaml | sha256=qUkXBa3bnaZ3SVXRuuvzvF9NGV7FCOmut9tr8bLwWrI | 519 |
lm_eval/tasks/lambada_cloze/lambada_standard_cloze.yaml | sha256=_z-Ofgpf6JxtEoJ7uuCJKQ1v3INMhswUxqSlzngENZc | 529 |
lm_eval/tasks/lambada_multilingual/README.md | sha256=ggwX8LEo_cr1oT29CyoLptVbcTxCVZSr9qhOr3UY7RY | 1995 |
lm_eval/tasks/lambada_multilingual/lambada_mt_de.yaml | sha256=A3dzij8qTX7W-XZ1uXkMf7l7lPbe8Irr_fem4zQ34oA | 72 |
lm_eval/tasks/lambada_multilingual/lambada_mt_en.yaml | sha256=pVMRNFjJ3vrnZcaF55RI8_34_raqG1N4oFWS8ngfFFI | 507 |
lm_eval/tasks/lambada_multilingual/lambada_mt_es.yaml | sha256=3cWtUCRNZWeGp9bIUU-uJcxCeD7iyHwUkAkdAFMFIxg | 72 |
lm_eval/tasks/lambada_multilingual/lambada_mt_fr.yaml | sha256=Okxnj-cxPcEsEIX0vc89Uih-szW7wqHY2SAcdi675Gc | 72 |
lm_eval/tasks/lambada_multilingual/lambada_mt_it.yaml | sha256=DtT68Pbs0fCY8oJlKQwQdO0pgcqNPEshYFQppA9RDD4 | 72 |
lm_eval/tasks/logiqa/README.md | sha256=Iyrf8c8F53A1eYqaDCb6hAm3_Sg_t47gZbOI0BjDKAw | 1657 |
lm_eval/tasks/logiqa/logiqa.yaml | sha256=9oDF6SFMo6Q3qctJF7a5Qb7m0GkxuvTIIkyWxt7jkqc | 538 |
lm_eval/tasks/logiqa/utils_logiqa.py | sha256=RjmfQAZUadI0wMnh7z3ptn5Q1f4cLEEwYH7aLdomgmA | 616 |
lm_eval/tasks/logiqa/__pycache__/utils_logiqa.cpython-39.pyc | sha256=oiFR-Ekown6euFnk4c7D5-SAlsDNx2f9nCAPYdBvIHA | 853 |
lm_eval/tasks/logiqa2/README.md | sha256=BJA7HgfRCSPs51iYrFl9rQzMKjoVDqaIDtCDAh5yk4g | 2244 |
lm_eval/tasks/logiqa2/logieval.yaml | sha256=GNW9rzJKiGpL6hboC53dZdKzQ1IJbVGG3Qp7_lGyrtE | 1342 |
lm_eval/tasks/logiqa2/logiqa2.yaml | sha256=m2rhssx_uSlfpuVhYbyUB5GslOs0h3vgR1Cqj_TGkVw | 514 |
lm_eval/tasks/logiqa2/utils_logiqa2.py | sha256=CtI75WahPZvORkIad_srFGSZ6bUnGlZf_6sYHkAP90M | 875 |
lm_eval/tasks/logiqa2/__pycache__/utils_logiqa2.cpython-39.pyc | sha256=ugd_dEpiuCnzgO_YaZp7x-0Q1aELUONIde2l6RCwiL0 | 654 |
lm_eval/tasks/mathqa/README.md | sha256=VmhPmoYwpKTfeUVDnkdHbj0zx2OtY7y7AI-cJrXEOhQ | 1907 |
lm_eval/tasks/mathqa/mathqa.yaml | sha256=7RLaY_6xKz4_JS_vQkOUkArWrGltkoRZZ1g3QOj8Dy8 | 580 |
lm_eval/tasks/mathqa/utils.py | sha256=NFqieHDv0UX5cEVmMmIu_GF7KZpNAKvJRZJC0saW00I | 178 |
lm_eval/tasks/mathqa/__pycache__/utils.cpython-39.pyc | sha256=kPQ33RY3_ltPl3ouoKzS-c4-StxWIAuBXUsUqTbm0Eo | 533 |
lm_eval/tasks/mc_taco/README.md | sha256=OEUcQofUlqsm-3CLKht9u-V0wXAldd7uPWBjmQjFTSg | 2052 |
lm_eval/tasks/mc_taco/default.yaml | sha256=C8thumjVOmNaAhww3tqWSCVHB8bJI3NUuKCZCTvebD0 | 401 |
lm_eval/tasks/mgsm/README.md | sha256=zSmVOkdo78p4Oj4Ui4skfwzYyLqPnE3H4DiS7qMF4Ac | 3504 |
lm_eval/tasks/mgsm/utils.py | sha256=4GYLxgzJKkXEsftBhSagaFJyTqwQmjMDBsDpCLXBDLI | 7585 |
lm_eval/tasks/mgsm/direct/direct_yaml | sha256=d6LnHB3ARygh--c5R3cXkJH_LoD29D10a5u5GSTd1w4 | 749 |
lm_eval/tasks/mgsm/direct/mgsm_direct_bn.yaml | sha256=Wo0KyiyXRkiW4gAKwUB6v1PF-ZGIz_GqUDNnGS-pdA8 | 325 |
lm_eval/tasks/mgsm/direct/mgsm_direct_de.yaml | sha256=hSwol6D6QLua-R7yob40tJ51i1sBxIvjxE20gEM5FSI | 314 |
lm_eval/tasks/mgsm/direct/mgsm_direct_en.yaml | sha256=WCmhQI9JZGMBNsRfSKuIn4S0uxEZXR6LNMCd0xwPC68 | 315 |
lm_eval/tasks/mgsm/direct/mgsm_direct_es.yaml | sha256=f4mX7Zfct3n9Gd_ATcbY-ENwwuk0mCDczKW3YWaEjs4 | 315 |
lm_eval/tasks/mgsm/direct/mgsm_direct_fr.yaml | sha256=lJuvmTIoeoPFLI6uZhmqulNesukgpS0Ar5K4qbb9eEI | 316 |
lm_eval/tasks/mgsm/direct/mgsm_direct_ja.yaml | sha256=U-W3snSDUMI8-He11Lz53N8REXyllt5ImaPylzhKuIU | 313 |
lm_eval/tasks/mgsm/direct/mgsm_direct_ru.yaml | sha256=vUi_FabdoEmLSd6QhLIQ7NaUjZl9llmu1nE3J4kwmbI | 319 |
lm_eval/tasks/mgsm/direct/mgsm_direct_sw.yaml | sha256=VmcZwhC4b_1obGshSaMcoQO8D6_Fq9acxkh8TNgfIJw | 312 |
lm_eval/tasks/mgsm/direct/mgsm_direct_te.yaml | sha256=h97DZja9lyJyq4OmNSDPJoHYE9EWjYNdKtgBdxBuj7M | 325 |
lm_eval/tasks/mgsm/direct/mgsm_direct_th.yaml | sha256=H8gVD-98jGIyEIuQpdWcHrsLQz2IV32hlA2ghqQb4WY | 322 |
lm_eval/tasks/mgsm/direct/mgsm_direct_zh.yaml | sha256=aQq4vo6LMXR0S1MQf3qU873P0l0wxHns7NOda2faaqo | 313 |
lm_eval/tasks/mgsm/en_cot/cot_yaml | sha256=6ywo0Qw4xCh7ZOsN-uB-BDIbohbc3njkdVBKrfjamHU | 820 |
lm_eval/tasks/mgsm/en_cot/mgsm_bn_en-cot.yaml | sha256=ltDIM95SEYy5QJCUSwmZ7DW7ouFOcK2M8cNF1-F9vHw | 347 |
lm_eval/tasks/mgsm/en_cot/mgsm_de_en-cot.yaml | sha256=y1-qoiCS3N3za7iLOHZUg5woXgc8S4LIeVTyfPKVQgM | 334 |
lm_eval/tasks/mgsm/en_cot/mgsm_en_en-cot.yaml | sha256=rN9Ik5umlVYUL_5OIKHJrK5TaufZHA_M9OvcMwjcubE | 337 |
lm_eval/tasks/mgsm/en_cot/mgsm_es_en-cot.yaml | sha256=M536HmZdPBrgYh_4aM4VyrnoFheYsOg0iFoVbjF2TrU | 337 |
lm_eval/tasks/mgsm/en_cot/mgsm_fr_en-cot.yaml | sha256=5C8TgGtH3ZsmXr7mtQutUf_CZy1WgQ_xIlWCes3bvek | 338 |
lm_eval/tasks/mgsm/en_cot/mgsm_ja_en-cot.yaml | sha256=vzZM-b4mthBpLndFe9X2EkWWvys90qxlvswVhgf2Eso | 335 |
lm_eval/tasks/mgsm/en_cot/mgsm_ru_en-cot.yaml | sha256=KeK9jt38Pnl_P794nlpkJCgQcyCqrUDf1loW2VEmYr8 | 341 |
lm_eval/tasks/mgsm/en_cot/mgsm_sw_en-cot.yaml | sha256=al9W5asPb-nNmuF8o_vlGlvxSHoKsURx8QfSBXtvI60 | 334 |
lm_eval/tasks/mgsm/en_cot/mgsm_te_en-cot.yaml | sha256=WAA9bhDnasu2bOXcyIjnvpLHmHHfTTRgnBBNqafoVFg | 347 |
lm_eval/tasks/mgsm/en_cot/mgsm_th_en-cot.yaml | sha256=hZLlfaee_uiVkXjwFv31pJK860Z3yf6Kv_hN-TsosGk | 344 |
lm_eval/tasks/mgsm/en_cot/mgsm_zh_en-cot.yaml | sha256=1xolbTeF5V-4DXxKckL0HBx-zMrvM1RN0yBgIRgieac | 335 |
lm_eval/tasks/mgsm/native_cot/cot_yaml | sha256=qrLx_BfFPdljwVVM1wgvU2zqODPEBSLqFh65IO186WY | 820 |
lm_eval/tasks/mgsm/native_cot/mgsm_cot_native_bn.yaml | sha256=VQZoHMieDSHsEDeOW6EhgEfFBmIVIkIbmFFr8eL-GcM | 399 |
lm_eval/tasks/mgsm/native_cot/mgsm_cot_native_de.yaml | sha256=krT2q5CTHOF8N7ivuwl6om_HfcwWC_4T62E9QgXr3W4 | 360 |
lm_eval/tasks/mgsm/native_cot/mgsm_cot_native_en.yaml | sha256=PmMEs_bo61cgTcSDnrQu2wVupyym_ocYTj_4elAfRRw | 345 |
lm_eval/tasks/mgsm/native_cot/mgsm_cot_native_es.yaml | sha256=AwjRIZ1LxEjSDfEd9cjjm6P84YsZT8YKOENQrXTto58 | 349 |
lm_eval/tasks/mgsm/native_cot/mgsm_cot_native_fr.yaml | sha256=MC6pF5nS6lV48ZRW5GkIbRx_lxRU2eODakHkkAQlNL8 | 362 |
lm_eval/tasks/mgsm/native_cot/mgsm_cot_native_ja.yaml | sha256=uafHGDgPXMrvUf3u7f6Uj-0BMnEb2UWLNgswgQD932o | 359 |
lm_eval/tasks/mgsm/native_cot/mgsm_cot_native_ru.yaml | sha256=yQSOfG2HJRw0Bqa54ukrgKLTPw2HNUzyJT5afbWYyVw | 375 |
lm_eval/tasks/mgsm/native_cot/mgsm_cot_native_sw.yaml | sha256=KSlRaFENZmvsaMtzlkMEZ26m0OeXTKi7RVdtWAfKDxU | 350 |
lm_eval/tasks/mgsm/native_cot/mgsm_cot_native_te.yaml | sha256=Qp87BiEsizKoNcnGsVWqqjmPzT9qYOtgZeRZ_wTKa3g | 415 |
lm_eval/tasks/mgsm/native_cot/mgsm_cot_native_th.yaml | sha256=5Ofd0LCKYARLaZAQTb-K4pqHUHOhIL6-Ia4QVyMxzGs | 410 |
lm_eval/tasks/mgsm/native_cot/mgsm_cot_native_zh.yaml | sha256=8GLACTQBYz4zQi7PPDrmWNW7mUY958kkApf1V6okBEI | 328 |
lm_eval/tasks/minerva_math/README.md | sha256=PW0HYE2EYL424FRKQSGB28pBoYPs3o2S-f11QsAwx4s | 3043 |
lm_eval/tasks/minerva_math/minerva_math_algebra.yaml | sha256=20_02tOwr6o8CdFQRTkPQ4_hxy6vADabIo43ScMBgok | 557 |
lm_eval/tasks/minerva_math/minerva_math_counting_and_prob.yaml | sha256=jjxGjPVtnUiudvSkOVlfA_A6oCSUBM2USRJAgQW0HH8 | 111 |
lm_eval/tasks/minerva_math/minerva_math_geometry.yaml | sha256=XiPoBuvqoAc_1FtATee1GyYcMAC8ClYOKWa04nrcrHQ | 86 |
lm_eval/tasks/minerva_math/minerva_math_intermediate_algebra.yaml | sha256=Irfq2-W-AiImEH0PoT2ZdoVg_y-sQOWqNfOimVovvkE | 110 |
lm_eval/tasks/minerva_math/minerva_math_num_theory.yaml | sha256=IYI_lzbIQ2BbcPWXrS24nulnlg93CJjlwUfV8M7IkTE | 93 |
lm_eval/tasks/minerva_math/minerva_math_prealgebra.yaml | sha256=va30pN9E3JV6nmLY6lUXxhH_nkm6ijSDnAiw6wdrDnk | 90 |
lm_eval/tasks/minerva_math/minerva_math_precalc.yaml | sha256=6PZ7DSqtq_gn2rPKIo10hw6JMJOanIxuiWu5uZCc0JM | 88 |
lm_eval/tasks/minerva_math/utils.py | sha256=m5n8H-mL_bVgqwB5XOel4tUCgRT0eaqRyEH08g4pouM | 8698 |
lm_eval/tasks/minerva_math/__pycache__/utils.cpython-39.pyc | sha256=9qi6ehpAoSiH_es69droWtrCW-rL7aAfFp9cEdHEDe8 | 7792 |
lm_eval/tasks/mmlu/_generate_configs.py | sha256=aPweKROp8qIP2nNZhBI0g8EgWgu_Myq_m3lnVuqhN-A | 5277 |
lm_eval/tasks/mmlu/default/_default_template_yaml | sha256=cq1lgwbccGk64eIwmXK3GVMgLrcOb4_Brno8Tvr-mLs | 472 |
lm_eval/tasks/mmlu/default/_mmlu.yaml | sha256=opYhS9c-LnKCQ0Uh8sMa7Z4gmoifQ3vlCeygR4ftGG0 | 92 |
lm_eval/tasks/mmlu/default/mmlu_abstract_algebra.yaml | sha256=gXc19CgltUo07syBqIE32CnTjvsYCeVeWRG-KX1Fsz4 | 288 |
lm_eval/tasks/mmlu/default/mmlu_anatomy.yaml | sha256=6GsRm5WgJy3WtuGZpR-rsTdpfO3uWaBjg2jqg3peTjA | 251 |
lm_eval/tasks/mmlu/default/mmlu_astronomy.yaml | sha256=BKfcrmOQeIcmo9WfGbvm79C3W3rpmYlH2WXfCwMd41c | 259 |
lm_eval/tasks/mmlu/default/mmlu_business_ethics.yaml | sha256=adoNOrbflZ-pgvnL4k4_2SeQwSDoGVEpR6sD3wOAabE | 286 |
lm_eval/tasks/mmlu/default/mmlu_clinical_knowledge.yaml | sha256=rtKNL_LHXj5ImTUYMuFTPsKbJvGaPHbxSh_EQRkn6TQ | 298 |
lm_eval/tasks/mmlu/default/mmlu_college_biology.yaml | sha256=tgJqKwkOinOadHJGIvA3fowTImsm5CesuHqNqfyuLL8 | 284 |
lm_eval/tasks/mmlu/default/mmlu_college_chemistry.yaml | sha256=6-5alIH2bG-I5A1ToEEMPjNz8-uxq-WmOkHWVO84TFI | 292 |
lm_eval/tasks/mmlu/default/mmlu_college_computer_science.yaml | sha256=JdXWQW9JAOtR97ctqNpKM2yX2rl-_eoK1ozYBSqtlpo | 320 |
lm_eval/tasks/mmlu/default/mmlu_college_mathematics.yaml | sha256=p5Siknwp9HiAOfl2gazwbn65I5n82yj116ISRB6PFN8 | 300 |
lm_eval/tasks/mmlu/default/mmlu_college_medicine.yaml | sha256=jhM79qmFR020H4fzazq5mEfxRsThQyMbEr9iEC7AiUc | 290 |
lm_eval/tasks/mmlu/default/mmlu_college_physics.yaml | sha256=Nm8Bjy5g3sh6PGJpOHj13ReRwGRra6zbTDR9Mw-T2BQ | 284 |
lm_eval/tasks/mmlu/default/mmlu_computer_security.yaml | sha256=WmKRHbFMgdTCeGFNdrIHfbTQO-OoUrFRR41jbeCMoFY | 292 |
lm_eval/tasks/mmlu/default/mmlu_conceptual_physics.yaml | sha256=nVXaOJWl0Jv0FFAxzDghiiGncQ9if4AdBdoeZ8vX4n8 | 296 |
lm_eval/tasks/mmlu/default/mmlu_econometrics.yaml | sha256=kll9ZFihynXeCHB-IRvsB3jLGJZ7c7-H5fxBiGRx9Q0 | 293 |
lm_eval/tasks/mmlu/default/mmlu_electrical_engineering.yaml | sha256=0-7WBd2UWT0wuK8FRdzFNb8Yk6519Ul2mHfho6Wc2sQ | 312 |
lm_eval/tasks/mmlu/default/mmlu_elementary_mathematics.yaml | sha256=c2lWRYGVEmrQO1_JbGUa9eau3SKh-7q59IqDkAd3GGo | 312 |
lm_eval/tasks/mmlu/default/mmlu_formal_logic.yaml | sha256=t13drARz0b49xLGotrVSkDR_GH3kHzqPT2jJ-kG_D4A | 284 |
lm_eval/tasks/mmlu/default/mmlu_global_facts.yaml | sha256=kK1l52luxT-Ib56eZddHw_9EubcuAEJU9zR239fvBOE | 274 |
lm_eval/tasks/mmlu/default/mmlu_high_school_biology.yaml | sha256=adPbtPDslRd6AuVjadFeKstNg4ngLYCj7uq7s3xvph0 | 300 |
lm_eval/tasks/mmlu/default/mmlu_high_school_chemistry.yaml | sha256=FjJZ2bcdxHpwozh7nEW4bW1KZgwDg7sqG9lhi0Abd1U | 308 |
lm_eval/tasks/mmlu/default/mmlu_high_school_computer_science.yaml | sha256=FvmaIXBRroEyw8WU1vSA4BDWat9toiJmHvvXaqwUus8 | 336 |
lm_eval/tasks/mmlu/default/mmlu_high_school_european_history.yaml | sha256=vgNEM9KbKZyE0HZiy7cWskYtU5Ox6D7WRNxAJNgiGy0 | 348 |
lm_eval/tasks/mmlu/default/mmlu_high_school_geography.yaml | sha256=aPXicSifSye9Ut2wnerc-zboiSzOjYkm4gVhhiLocVI | 330 |
lm_eval/tasks/mmlu/default/mmlu_high_school_government_and_politics.yaml | sha256=iKZO88iRCTaEnOb1J4uuE2BICx9TyhRuBWXhttl_0nM | 386 |
lm_eval/tasks/mmlu/default/mmlu_high_school_macroeconomics.yaml | sha256=1LRd0Lb_U-ublgdMBoOo4mhC8srAdY-NBHW9nH68boM | 350 |
lm_eval/tasks/mmlu/default/mmlu_high_school_mathematics.yaml | sha256=ATgCLKhZn7UoNl2nDaxdBgD1y8k50b0I21WEmlB-cps | 316 |
lm_eval/tasks/mmlu/default/mmlu_high_school_microeconomics.yaml | sha256=cv2UrjcQpQe2rvtsMIDge-Ms59PjgPWGlznXJGlHwAc | 350 |
lm_eval/tasks/mmlu/default/mmlu_high_school_physics.yaml | sha256=sWPVelphJpPM9RWCoVTKiVNWuhdWPegLZZbGa80LDIE | 300 |
lm_eval/tasks/mmlu/default/mmlu_high_school_psychology.yaml | sha256=Q1BJGN6k_9bGk51FNgbMWfymVrcS9s0caTU7N3T5lMs | 334 |
lm_eval/tasks/mmlu/default/mmlu_high_school_statistics.yaml | sha256=FiVyJuipuzYEECJSWcm6HbCc2PJ3HS6sXO4bnO05bi8 | 312 |
lm_eval/tasks/mmlu/default/mmlu_high_school_us_history.yaml | sha256=DFJcWsmxtV9HeDyFvPYCSxCAWywNSfXM5-vc1j6OOAs | 324 |
lm_eval/tasks/mmlu/default/mmlu_high_school_world_history.yaml | sha256=B4axVHntppczWuGGL6gQBhGgdukhqTX2Ga0kwH7wEs4 | 336 |
lm_eval/tasks/mmlu/default/mmlu_human_aging.yaml | sha256=it0LUShyuG1o-jr-kdyhtOOWYFx20MuuVOCe9lhf2Hc | 270 |
lm_eval/tasks/mmlu/default/mmlu_human_sexuality.yaml | sha256=X-THNfrS2YzRDlv-2Ud7Zf8CowaIEmu3OxouK37DmkA | 306 |
lm_eval/tasks/mmlu/default/mmlu_international_law.yaml | sha256=_FSWdGN6SvDlaT88kQsGtj_7kuqzvvkGVLlTiPBW_lA | 304 |
lm_eval/tasks/mmlu/default/mmlu_jurisprudence.yaml | sha256=jFnFoZLKI6ANTvvH9cOCcM4DGJFtw3Xp2Cmd-wcMdxI | 287 |
lm_eval/tasks/mmlu/default/mmlu_logical_fallacies.yaml | sha256=t9cxs8hSQD7hLx8n_62Wsn44VCEasO83xzFF4MpJDOQ | 304 |
lm_eval/tasks/mmlu/default/mmlu_machine_learning.yaml | sha256=YzBbWm_EF49uRk_BjL-9DzgCeY7kvXWsPQRjwVAyDes | 288 |
lm_eval/tasks/mmlu/default/mmlu_management.yaml | sha256=43IDk6OZypE0VFm-2ZwkuVv3Arf6NzGgjdQNIeT0X3g | 265 |
lm_eval/tasks/mmlu/default/mmlu_marketing.yaml | sha256=32eH-SwcdzdbZMoiAI9GoUx_fRChoakuUrMvXZJ5haY | 261 |
lm_eval/tasks/mmlu/default/mmlu_medical_genetics.yaml | sha256=cBYQrC5cGxR8wtUhB7rfahBNpoZJ_xcIwvQrijxNQNY | 290 |
lm_eval/tasks/mmlu/default/mmlu_miscellaneous.yaml | sha256=Oo5UxK1to8hY2jdB83n9wTJnVJrAHNkIp2_n9wblioI | 277 |
lm_eval/tasks/mmlu/default/mmlu_moral_disputes.yaml | sha256=59Zv6o6ZAvIWM_NCdq6KTFo9-VNa9KocwHs-hPUNTOI | 292 |
lm_eval/tasks/mmlu/default/mmlu_moral_scenarios.yaml | sha256=JT2l_KMkk5g9tacrCPk2U67TSFU7bwxH72vtO94ELKA | 296 |
lm_eval/tasks/mmlu/default/mmlu_nutrition.yaml | sha256=gqbILA55_fbtqBzcjU9gCqPCdIAh6h-ztArvHRA5NtM | 261 |
lm_eval/tasks/mmlu/default/mmlu_philosophy.yaml | sha256=NWMWKylcBfEkIumwg6eRaJgKVqBpQ6blOMbyIvgn77w | 275 |
lm_eval/tasks/mmlu/default/mmlu_prehistory.yaml | sha256=g9KiT4SwWrzRlHSMMIEYSsTarhFNsuGyTFhNjd3BMrU | 275 |
lm_eval/tasks/mmlu/default/mmlu_professional_accounting.yaml | sha256=9lcnaGxlY3IgmAPAhvvXjrMEHmYUROCVPI8jsrpOP0o | 318 |
lm_eval/tasks/mmlu/default/mmlu_professional_law.yaml | sha256=fHnaxASjlkxSWtAuKVfr0sI-6AEm83vN2aEZ2-HShT0 | 300 |
lm_eval/tasks/mmlu/default/mmlu_professional_medicine.yaml | sha256=e-JGsjNQ7vcJxMeW1IgYSE1midCUGhD87cs1FVT7dMs | 310 |
lm_eval/tasks/mmlu/default/mmlu_professional_psychology.yaml | sha256=VrF-mtFHcGOUBOUseGjvUoKgB6uXRi8y3g98xG5SrBA | 338 |
lm_eval/tasks/mmlu/default/mmlu_public_relations.yaml | sha256=LPamTE3llnQCW25KM8TDzHrkOTIFBQzoOzO5E1I22qA | 310 |
lm_eval/tasks/mmlu/default/mmlu_security_studies.yaml | sha256=zW3wJTXMpc9WoQpOy6WLZc7uVoq7MUkAN6CDQqg505s | 310 |
lm_eval/tasks/mmlu/default/mmlu_sociology.yaml | sha256=E8v0YKlGUe-gLWjmxgKRAZqrjKQ2NKFENw25wpdIQdE | 281 |
lm_eval/tasks/mmlu/default/mmlu_us_foreign_policy.yaml | sha256=jOXbTYPJayVwvMeIqJdRWxvH3DnwwyBKsUoUzgcOKC4 | 314 |
lm_eval/tasks/mmlu/default/mmlu_virology.yaml | sha256=dQW5H1xYslCMlYJ2im-8x5nRs7zudCRW1QxaoCts1xc | 257 |
lm_eval/tasks/mmlu/default/mmlu_world_religions.yaml | sha256=sozIm5GYbF1z6K3M-DZZuYeIuXoGlfCLdU1dG-g0mi4 | 296 |
lm_eval/tasks/mmlu/flan_cot_fewshot/_cot_prompts.json | sha256=CBR4SFsdT1HgEwXhkRPw46Ro8tx4dZY4aZjiKal7CWw | 218396 |
lm_eval/tasks/mmlu/flan_cot_fewshot/_mmlu.yaml | sha256=AmkVICAMmJEIwTs0ULG6QxkUQBTEwYvcCVkzXsNeCmI | 177 |
lm_eval/tasks/mmlu/flan_cot_fewshot/_mmlu_flan_cot_fewshot_template_yaml | sha256=CL0fetD-umRxakae359sCiw6GJesX26RY_1zdmY7G9w | 785 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_abstract_algebra.yaml | sha256=i9OND-3ugS3Y-V4tnmPf7-ncWotcKjsHYGP7ioRSJ6c | 3283 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_anatomy.yaml | sha256=Qo9gChWbJVrTxj3AfGs2hyblIzq2elL-dHEqwAi8eEg | 4704 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_astronomy.yaml | sha256=eANA6hJA4OXmz41-VRnmVMvLtykjTyARmOj-D7c27po | 4526 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_business_ethics.yaml | sha256=UV3kWpjIZDuDDspPxS10FkpU3yX1j7hnTs7pSx8KG3g | 4650 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_clinical_knowledge.yaml | sha256=sJOKZucur5KXLVV9K7yyR_BV17UMREjJSr8NnpoGhdA | 2790 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_college_biology.yaml | sha256=d51ullMuaVek_b-t1bjYGC47-eZOhdiMH49VyYUgN1s | 5018 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_college_chemistry.yaml | sha256=27rIMLE23N_oDWBYj9RirFTRTMUTi5fsZymf9jQAlW8 | 3079 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_college_computer_science.yaml | sha256=p_n0hfEo3ejxWONc75v4e7TW6uWSj8GdmjFKrU1MA7U | 6656 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_college_mathematics.yaml | sha256=L1Vny2jzbIUrPwSKtu7aoWblT3TdEpQMNGc95t11pAY | 4094 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_college_medicine.yaml | sha256=j7JDm6S1iGSdJm23VKm-E2w3QCLKGQALHJAelKP0mLs | 4342 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_college_physics.yaml | sha256=9h396DDHB5_EzyszrDALEONNDM_0ZE3-ia8VVwiLJtk | 3572 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_computer_security.yaml | sha256=XkeIKlEyhMc5uMoZD6EAt-cTychzTWhUxaWuhPAwCzI | 2893 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_conceptual_physics.yaml | sha256=cl8R6amav2M2j-4CWqgt268r-8HFeLSKqrX_rRQGLdE | 2661 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_econometrics.yaml | sha256=j-1GWZUEmojmUmm9X4G2EBhTlsAkNsPEOTnJrZVTGsI | 5253 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_electrical_engineering.yaml | sha256=E7cseWfTbQLkMtPTB7AQ_WvCXQDnHC44zm87VSE7w9k | 2742 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_elementary_mathematics.yaml | sha256=tnaF2xDuokHYuHbq-Itr7LZfHWTWwcWyUaxVs4R45mk | 3306 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_formal_logic.yaml | sha256=4gcR3KuFVDtbPIP1uoZlj1eSo2zB4m_3yyVxUBoQOYA | 4520 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_global_facts.yaml | sha256=UDEgUdufjlweJbpAKrtWga6YTUTwhyFWVpssSzx-WLc | 2700 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_biology.yaml | sha256=n1tjopDx2rKy6fc1mk7o8M6GIUKQxvh5cNs-ymhKpZs | 4496 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_chemistry.yaml | sha256=w5DTrVYG5H3uw_aSly_QF71DuKEP31NSJ1Bgkp1Sdbo | 4148 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_computer_science.yaml | sha256=QHhgSa1jU2lFzeuIByKS0zY2zwYnSJr09SOdedEQFcE | 5867 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_european_history.yaml | sha256=JCOiZZ8A3R81eSO8wOu1Xa9dqAZ2xLUc8zX_o74qRKE | 14453 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_geography.yaml | sha256=mNwpohT8ysledOx5nQWztnm7fnd7EuwqzSn9IYbKeXw | 3074 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_government_and_politics.yaml | sha256=KmQClLUPJiiuJ0REPgVrykpdngyCUhq094-7AMQreSY | 3557 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_macroeconomics.yaml | sha256=ddlRI10f3lV80g6ZlxMZb5puwML1lJ87ja0nTjhlyBs | 3045 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_mathematics.yaml | sha256=PWJv_mapsiyyE40cK32Ky0B4_mTEIbZL_UiybJS5ArE | 3007 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_microeconomics.yaml | sha256=MeRkFGxYyNsxo0bKb3liJApfl0yxWntiy7A1u61LSnQ | 3238 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_physics.yaml | sha256=U0Dq4ByrLSK09Mrv1QPDseQgufQuBDXKCTb0xVoV1UI | 3154 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_psychology.yaml | sha256=jQsUp94o1WYgwcx4I_g_DadIutm-LkhiPpZtt-rS4iE | 3988 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_statistics.yaml | sha256=QsZh-YF0NYPmBkl7K5UiASr-oGA8vcxwojigffPo4-k | 4777 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_us_history.yaml | sha256=71jIaBPgUWbEwQTWTIVZGSdqV2s7i-dcuysorCCaNkY | 11372 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_world_history.yaml | sha256=VS64z2RHKW3FCOMEMdKEt9AfHvInOAlqoKqSVeiN0Pc | 6933 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_human_aging.yaml | sha256=2FbGMnhDfiEcY1DGU3YdiEZJhUzkCCE1Ss2G3xr5z-I | 2181 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_human_sexuality.yaml | sha256=k44qoXctF1kx3tnQIVIglwrh8FXGx3ea9fh55M83-ho | 2713 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_international_law.yaml | sha256=VtXMlXDrcwba0qpiBcYfeGDAnl0ke3Q6CyLeg4b-7SY | 4508 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_jurisprudence.yaml | sha256=W8VmpIzbq26j-LpqLW3_5nf2-yMqZuUKawuFYvrpPQc | 3668 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_logical_fallacies.yaml | sha256=E5rNbNatNV3YdLgFlEsO-0K8713vDJdj3iUjpExBa-o | 3644 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_machine_learning.yaml | sha256=w0Pem7z84NEyh749-vS0TWbClitKpQE9U3LHll7eFA4 | 4929 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_management.yaml | sha256=FAs2Ey3p6MSZWYmdXl162kBz4051aXKMpXnGnz4FUyM | 2639 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_marketing.yaml | sha256=VGC_C3MYeQ4rhS177ax0Az3R2RB6wGojKk7N-5HIhO0 | 3271 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_medical_genetics.yaml | sha256=hqrgrLaXp7ycrI6MnmkyLrBWdqKFFNC18v9NJBg7f7U | 2972 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_miscellaneous.yaml | sha256=0qY0ZYGHsBhS3wxX1rWYfgavSmJVhzdRfESKt6MaqPs | 2169 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_moral_disputes.yaml | sha256=eEA8AeWOVqM1sX_mQFbm_m7U6WwxFkRbUA-IR4y1YhQ | 4018 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_moral_scenarios.yaml | sha256=Jd8TfRoge9XJM6lstObDTYasbtqW1qsG9_HaMAW7plM | 3601 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_nutrition.yaml | sha256=bh0rJv8UK_I0WNvBUutB80OC9VxI4V1a3TWcRsCzn_o | 3897 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_philosophy.yaml | sha256=jLJUfPBEc8JWX0kODtlUogZ_p2L7yDywraMzxCjGcHo | 2410 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_prehistory.yaml | sha256=D9M14jFNL0n5R7pV5AmnZQlf_kcOg0wqtvPqTXCttN8 | 3441 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_professional_accounting.yaml | sha256=MMHhBZeQ4q9rZqjSSJhxhYlyO4iAJm25e0rS2RQsizQ | 3922 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_professional_law.yaml | sha256=xPAbeM4zgXpAUmCaTmNpkUpOmBxAWEzltXH-nO_v_ks | 8947 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_professional_medicine.yaml | sha256=U0jY2h2BzfNffVJU0WDOb95vz9ZtKAi6X9ciqnMUTHk | 5853 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_professional_psychology.yaml | sha256=-p6H2y6oRwX0R3Xvyot8ZO1ehiEcDNsBNW5NMW_FHyI | 3990 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_public_relations.yaml | sha256=cHsTH5yEFAg5mqZ40Wvf9-4CIfM7jO_xTKCmB1qrw1k | 3143 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_security_studies.yaml | sha256=iyiKxGAc-Kl4EnOEPWf2Dof0_ZiVYkXglcYFLFgIQKc | 7270 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_sociology.yaml | sha256=Kpyov2cWFfbxkApiTrixJbNwq9MzmbtOHyfqyZy7R4c | 3460 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_us_foreign_policy.yaml | sha256=0_Qvn6wr7CQYdsKdl-xmtuwNl8It6FTRsV_HWMf3Bas | 3277 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_virology.yaml | sha256=ddbifOmbeKlYQ4--WEFDSGcQQyvLwzI5T3AfYj9dQm0 | 2450 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_world_religions.yaml | sha256=V-7NOjqQMEmf273O4_Pi1ktOsXCExEVzi9Ma1kwpfmE | 2130 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/_mmlu.yaml | sha256=_hjjoCQTWOlz_f-ldxYlK9RWpKnbHjOn8KlwNjLhatg | 182 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/_mmlu_flan_cot_zeroshot_template_yaml | sha256=D-ShExeWMRtpgac4LitUSKpsqqek_wXtXigQVv0xPk0 | 876 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_abstract_algebra.yaml | sha256=LvRnHFrHw_6n24MAe5BOixVezyZ0ME581aHG7yDSn7E | 284 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_anatomy.yaml | sha256=no8v8ThFcdjNjCqBkFZIR1--Nd4ZiCZoa-L825u2rLM | 256 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_astronomy.yaml | sha256=hN2iIJ1PmHloJCm9C2dAQRAc6XqBwxUGivaiUaq6-kY | 262 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_business_ethics.yaml | sha256=XWfFMMiwK8hhSNKkuZs_JSBeIHkw4evEM02LIKhAuTo | 282 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_clinical_knowledge.yaml | sha256=e5KerpASf1oRCJLvWqvGHJf5ZW04jrqmA8yzpY4RMt8 | 291 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_college_biology.yaml | sha256=v2ZXXWAltVye0sdYDsi6vE70kuW_3b9wsyZ75UuuZsc | 281 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_college_chemistry.yaml | sha256=8X67aXlo-viUOq4ZVbWrgEo9ntqi0lNWHqtMpDr-0AA | 287 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_college_computer_science.yaml | sha256=5h-Qt7ndBtlJG5ZfSbY6caGMCbQrsyWc-MVPxncDzuU | 308 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_college_mathematics.yaml | sha256=Rf_ZzZUxQ0oOct1pg1TXi_dsRUZpU7WkcmQviWHoXi0 | 293 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_college_medicine.yaml | sha256=fJ--DO7NIxkwa2ica1QbsdlIn12616p8PqE8EauaUlA | 285 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_college_physics.yaml | sha256=9bbIfyxuil3UIY-jG9-Fvf3ywmwdMo0titOe-M-Dt6c | 281 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_computer_security.yaml | sha256=nXPVQH1xVJtZt6_2FPiC626QoXGaRY01f2AymmhzQ2Y | 287 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_conceptual_physics.yaml | sha256=WrfEys3YyQF6s8otgNvTjD16LDKZk9BhvyW525ZIj84 | 290 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_econometrics.yaml | sha256=ygr0_Jh5OWxyixszzr35NEie0PudCTADqRpjpMDThrA | 282 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_electrical_engineering.yaml | sha256=hciTVSP3ckCk3RwC0PsB-J8Ve4wHyj2xusA8kEPzjy4 | 302 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_elementary_mathematics.yaml | sha256=9DH852QpJPBc8YgxNvvCnnq5nwTDVNcLqU4BRxrSiBA | 302 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_formal_logic.yaml | sha256=58WVxXMCkazivwYFoZQ1Yb84Z991OiU-vQI4sbtJUXA | 278 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_global_facts.yaml | sha256=RM_pb6sRZmx6iVcFXAiYbYHn3gfXAeAvodBwVKd25zc | 273 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_biology.yaml | sha256=0DnTWb-KtU2zFX-QFM6s7XKKouwT2nfyK4fyS_tioyU | 293 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_chemistry.yaml | sha256=heKA8_U1wj5P2q5roXMqwAWiRa9v-sbZaTbe-hyP1cA | 299 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_computer_science.yaml | sha256=DiOmq-I8_p3DVOUhtFgFjijtG0-J_MRa8F5-cIMeOXQ | 320 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_european_history.yaml | sha256=3OffoLG-gh2JjKcKWntBWFEjc5lrSgOw-ZFwtJPgFJw | 326 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_geography.yaml | sha256=Fd0I-5A7mltjnIF0Md7fQLY6YyVOoonsdc4txxNNZsI | 310 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_government_and_politics.yaml | sha256=uimHeblbJFYgaaah5fsWTQl3_KFZdvDTGmcdviqD97E | 352 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_macroeconomics.yaml | sha256=3dhl58MUaawpSYJFfvelXVpKLcVBbDE9MpMvAT2peKY | 325 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_mathematics.yaml | sha256=aRQK4pwDayZ6xNkOEqytHjJwxyI2nsY_9QOW_FAL6ok | 305 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_microeconomics.yaml | sha256=ZKQPAubYaV9HfGiJFvENELqyTLuFvG975eBGmn5USlA | 325 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_physics.yaml | sha256=7u1ma2j7itc6SdgSwlotC4Qs3oovbmQMCldOuUWtwGs | 293 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_psychology.yaml | sha256=cMvGDf1fcB4btH_AlHeZ727FWVPB8WIvUDi9jP7gNiM | 313 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_statistics.yaml | sha256=iolnReJzl_eeTS3iDnhz3NiEn_GNeNW9_hu6Ba_CRA8 | 302 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_us_history.yaml | sha256=TYckw3h7JfcP5tq0X_k58pyk3ph07f69WyeAqRxmcGQ | 308 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_world_history.yaml | sha256=z6JcOncyLPzV2cW9Y1kzICK9I8c2V2KGa5iPgYi5XJ0 | 317 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_human_aging.yaml | sha256=Rq1oksitbFhGyrgN0H7fHTW_PGwKraphFEE0-ZDzW2o | 270 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_human_sexuality.yaml | sha256=XlLHhllCiErpFvV8u4_erECYPiU_sf49IZ_q2We1Ulo | 292 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_international_law.yaml | sha256=47Y_4EVkuA8PYyLDZwb7PcDgAoVjJhxQGV6uH6SksB8 | 293 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_jurisprudence.yaml | sha256=62o2fgoKLVpHP5_L9l8dgGSvKKvjydg5amyUuPSYDSk | 280 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_logical_fallacies.yaml | sha256=UmcituDQMs9_WgxnQl5TF8zjzqG19RZylKe8yH7AioA | 293 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_machine_learning.yaml | sha256=GEzsjkMBTPDAwwfOocJ1fJ222Li9l2Ly_SwuKcaKJEU | 284 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_management.yaml | sha256=DvBGob0qxl8O_Wgpmy5EdFMhgjuG8lS-Oswbbe22-Yc | 266 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_marketing.yaml | sha256=iZSiPqmRAwN-sQk7rGYiXxQb3_-AzRtZWnYhR8mKMGI | 263 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_medical_genetics.yaml | sha256=swY2eauXtpqf2acrcAPRBsuS3wUm8vrDezRhuvAeEE4 | 285 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_miscellaneous.yaml | sha256=ob2TmbBUTu7eiaqKVvsdPgm0QwF9TzAsVvVHzuO3WcM | 275 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_moral_disputes.yaml | sha256=N64E_YN5-Es-RkaLF83OwxE02nLP_JqOtBNdhL6BHKs | 284 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_moral_scenarios.yaml | sha256=V4-YewELczcHXVhShtQJZTucYeeS9vVMcHR3UMd8RyI | 287 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_nutrition.yaml | sha256=uEOLbPIzTJ8XBGUhnTeqU-5OYBkGsxLtVM_cS4dZjvk | 263 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_philosophy.yaml | sha256=IFUR_93hbXyYXAzQdwJoVe3e9Qwk4H0_c8z0NGII-z4 | 271 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_prehistory.yaml | sha256=4J7DeKI8Hv6zQylMhwi8Qc8B8Fq-Caumx_1vwGsnt4c | 271 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_professional_accounting.yaml | sha256=2kCLdxKouQcWr6zg1uZM1PBqkFMSgeZZNzqG9DxMu8g | 306 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_professional_law.yaml | sha256=xbDsyiFwhZZCPM0jEkguzvSRSeq1tutZynuhlg3lgxo | 290 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_professional_medicine.yaml | sha256=AUI47eC1j6rc-9Zqp0GmHYLbDHg1O7GVKY8Vv4lYMXI | 300 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_professional_psychology.yaml | sha256=7TFjvuSpZ37wDEtdtf1NjYS6mTXuqwSSH3t1OHpydME | 316 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_public_relations.yaml | sha256=DAjQj-5aG3dZHCXI2Me1hnix3QlDZuS1ZuHplywmH_Q | 295 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_security_studies.yaml | sha256=DC__nJv6cZIgeWk7uUdIPpoIVkCDDT9dE802p8fC1XE | 295 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_sociology.yaml | sha256=uEopPjYfP01SXyue-UDn6Eu6XJY0giXJuNJnMW10hdc | 273 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_us_foreign_policy.yaml | sha256=jAEfmTK_piBJnrhjK5D1LhCTZaOjCr-3y6D6_RPtk-E | 298 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_virology.yaml | sha256=74_GviIJbl4HRinvOOrrMx2_LqW0prHZU1jsJVSVRfw | 260 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_world_religions.yaml | sha256=DVS8P0bKnD8vBNxCMkzy6N0eWVIyQ1XpTBIA71JaELU | 287 |
lm_eval/tasks/mmlu/flan_n_shot/generative/_mmlu.yaml | sha256=rA9DgApHb_PGaMgMqEP2uU9Qoz7GWjMa8bzJgqTL9Ao | 207 |
lm_eval/tasks/mmlu/flan_n_shot/generative/_mmlu_flan_generative_template_yaml | sha256=JJAHsSLLPEQ1YDTfZQ9lBeotXDucU4lEXeoBc7wqJnc | 520 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_abstract_algebra.yaml | sha256=1yvdHaM9GTcNnMaDV7pV63E6mcZv3uoS2Lgj1IqHlvE | 292 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_anatomy.yaml | sha256=NtroH6VqEdaJd8HiWr8a_GJ8GjMUYlsPpre0T16P-O8 | 264 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_astronomy.yaml | sha256=i1KgW-h2hbODryP_NDY6oZ9MpGEilsP6z3W-MkXJbzs | 270 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_business_ethics.yaml | sha256=fSuKzPYSkEd1TmMMLSV9cnxNZTWFeYf0tvdmLZG72uk | 290 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_clinical_knowledge.yaml | sha256=5_FghB6ud7daF4EeflUG9UqWgLOfT49wto_Ld8E7zaY | 299 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_college_biology.yaml | sha256=15B08EN2JcsLE1noz0qeKS-eSwZdTN6cxLXEgohzphA | 289 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_college_chemistry.yaml | sha256=y3qKzzecqo1hb7-huA-XwLJHayoSJo2EvODr8FCpszI | 295 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_college_computer_science.yaml | sha256=VjBnBkAvbVCL1h0BgFku51ESFyDKpXt3TkfQ8kqrhps | 316 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_college_mathematics.yaml | sha256=AIosK7NMiKx-XSj__nr1djX0fxFBZBEkuqYgatPCyO4 | 301 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_college_medicine.yaml | sha256=RGXU5iSNbbb8RDCH3lcg1n23cCHYJ7s97pmH5KcRcbs | 293 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_college_physics.yaml | sha256=cB9KDjCKPCNmojsXBbvJXP5K79hCehb2doHdcb4x8PI | 289 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_computer_security.yaml | sha256=z91MJa2RV1B2m5decq4nSUWAf4Zc9SM9wBcG5aFlEBY | 295 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_conceptual_physics.yaml | sha256=Ls4ntDkx7V3N3C3dMJ4SGHqga_UXKAufh447yw7Fjr4 | 298 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_econometrics.yaml | sha256=wavgGn2qhGXRwgcZGFeeXaJQ5fEgjpReY2YSOUhwjVo | 290 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_electrical_engineering.yaml | sha256=kPiAfHTJxHyWTIDdIv_IcXdkO2bGQ_K3AyYpHXsi224 | 310 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_elementary_mathematics.yaml | sha256=h8mXOss7r4hG3CUmE5vunwm1l2I9SJIA2fGGV7xami0 | 310 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_formal_logic.yaml | sha256=GjvsAUaRAdnOcA-yF86D6DqNzsoocIKs-ZJ_hAtpQLc | 286 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_global_facts.yaml | sha256=59MQcBeGFepYvfZXcJUb9gTwnpuzzFBU_JK8vQHb-9c | 281 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_biology.yaml | sha256=vf9s2eai7UIFUyX5N_H_RdRPSvJoyMKp0L6zu3HsUmM | 301 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_chemistry.yaml | sha256=-hzx3wvYQcbJ8pLmInAPmtT8eErwFH4Zv4S4eN8icqw | 307 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_computer_science.yaml | sha256=A_to1N9TFCJUroTf0Mkt9uvCpS1E5wewxbYRYwGz70A | 328 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_european_history.yaml | sha256=FJsKuJAJLePaKKjAQXQC-uUDMmqdGiOJsSj9-QVSXD8 | 334 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_geography.yaml | sha256=DLoXYBsTwO8lhN_0VkTVowK432A_vcDT8liAwzM2DgI | 318 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_government_and_politics.yaml | sha256=zkOAZRnm9OKThUjZCxecDg6nmmS5II5BQwTgsU_QLyM | 360 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_macroeconomics.yaml | sha256=dTW4bwdWf65fEGJGRReq-uXz_pueuPu7LF7CiJegge4 | 333 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_mathematics.yaml | sha256=jZ52HsQ41J__WPLpdX0rJ7DsmXogBQKV3kSCw8Tt53k | 313 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_microeconomics.yaml | sha256=_sgnl5NyQJhHurnRCW57XL-NTeoQMnKPZ8itIwDQuWo | 333 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_physics.yaml | sha256=lOGCUibImDUaLkcuUxGQNlz5OCmEIyZyzP3FsfdKYRU | 301 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_psychology.yaml | sha256=_frgKmtOaJ8ErEIJza95nJKM5Q0R3htRecVFwilhp8s | 321 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_statistics.yaml | sha256=v53JtJ26tGzC95RlCw_opPG4exyOkkx_y1yjHastn8U | 310 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_us_history.yaml | sha256=PSIL3rSUv7ZzYFtgBFe0tUewvezZKcYPjKddnQ3YUAo | 316 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_world_history.yaml | sha256=qdgwmHUDV_h-6bg-3Sd-V6R-853GKuFSYdEW8oJgJ5I | 325 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_human_aging.yaml | sha256=ZxDBgT2TgFQF-63ngbviVbf2QLU9S80toxTvx8BdOdA | 278 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_human_sexuality.yaml | sha256=NcBQkkYXnmdbXD6nRMvUBPwjWhq1o-rvhQfMoGnDy78 | 300 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_international_law.yaml | sha256=ao796oJ5QQV14NJF_SNmn4yPiaJtrEXPA0FYASqYbAk | 301 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_jurisprudence.yaml | sha256=p2HnBz5uURlZzBkxSJ_Tpr_Sm5-jil6-VsHKjis92sI | 288 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_logical_fallacies.yaml | sha256=o9gAvTyAqPRrWWCtjgSmW7ZkpqpTsfl-NSbbQB63vik | 301 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_machine_learning.yaml | sha256=s0f9zROAZCQmLvjzn42ilUEKlxFQQXQ6GCihZ4pxV4k | 292 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_management.yaml | sha256=pQ94zduNfbbPL1QIjk2gTrlPCzixwsrbfF04tKdld0U | 274 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_marketing.yaml | sha256=QbLanX10QvNCywzqs0kdP2hpHlQ30KZdVY6MAWMUEQI | 271 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_medical_genetics.yaml | sha256=6Nl5znhGU_FNHFKS231zgtCyouP4eOp6-g0bXQmff6o | 293 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_miscellaneous.yaml | sha256=KG80mJ7vNJ4zsHb0PDOsGcKec8ykpx4gC-o143_ptuo | 283 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_moral_disputes.yaml | sha256=kXbaoymvejb7oefSyWyeH3r30PephinHlpZAx3VXAac | 292 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_moral_scenarios.yaml | sha256=zwgvbGMMQalh1wCawRI1dCQGaF9Od8j8QhRUcPL0-9g | 295 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_nutrition.yaml | sha256=9dWTdoG1hszD9N0jZ5CffA3cRZemzUzp92M7eTeK_7c | 271 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_philosophy.yaml | sha256=RsvRfjp0ChZ-IdKeX-r2b-rZ3A5Y4iLZMQLZo76qZ5o | 279 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_prehistory.yaml | sha256=cM1emeZyw2J7q9KfPME9srhywKlh3jeY-zsDBlEDrA0 | 279 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_professional_accounting.yaml | sha256=aMU1t4XwG5vwf2OTHNR9ESAe6qLrShwiyvCAvcaVDTA | 314 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_professional_law.yaml | sha256=JqF-iVfJDIcbmpJmbcLI_AZUmOmJ-BBZyWAXprZo-Iw | 298 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_professional_medicine.yaml | sha256=ONirmEFURyIxoW-_TgbHwS22GabhFQT5zEtiZ-rHFw8 | 308 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_professional_psychology.yaml | sha256=91w04tA_ZLH3i7KTRj4X-UiPkm2Ka3fDpoxp8e26EPg | 324 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_public_relations.yaml | sha256=JPZD6ikfbzdqWqUGYgldmhFk3jWjK6Jf0CMV1krM00U | 303 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_security_studies.yaml | sha256=Plc_zyI9zels3rzux8c61ntFGEhkBgVteuGcSP7q5pc | 303 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_sociology.yaml | sha256=J4crNd6OLrze9gPYs8e7X2sa_UHaTlyOW_IdfCE6dVM | 281 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_us_foreign_policy.yaml | sha256=RiU586npxXTRbADdtzimeWVO5Tgugzx2APR1bYdrldE | 306 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_virology.yaml | sha256=gJjpjsnq4o29JG8Wm7S_w2rNnXfaGNeiBM9JHii-z0I | 268 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_world_religions.yaml | sha256=9z67Jvo2ZIiC6RZljrfmHIgQbgg2bg6RmV-avL2Np7A | 295 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/_mmlu.yaml | sha256=eZmG3GH5XHcg2Um0AY48VcbyNko70mvn74jyAlaVO6Q | 222 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/_mmlu_flan_loglikelihood_template_yaml | sha256=gZsMsUHaUWzncJzbRxHKaJ6Hyl6wCw39XP3U9740k6c | 515 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_abstract_algebra.yaml | sha256=JcepUKxIK58D17T9G65iGW2_18TBrueDXW6TUTMkeOg | 301 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_anatomy.yaml | sha256=M8dCqotxHdLIww2VBqefZ2FMyafsQrjJ0wFLZKBfBhQ | 273 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_astronomy.yaml | sha256=JUOVz5iR_W2T70F5dsoqhJID57FsqVvy-20NVbpNk7s | 279 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_business_ethics.yaml | sha256=mA8oqguvp6QvpKp0StJhzhrk1MVhRLcqLOAMu7lYJrY | 299 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_clinical_knowledge.yaml | sha256=o5TndzV6N2r9TCxwDYSgT9sIm-6vPuR4qM-alkmpMHc | 308 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_college_biology.yaml | sha256=ZC-C06eFQx6-e-uQqV_m9_FoqFYQJcNJhR8uzr_6PKs | 298 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_college_chemistry.yaml | sha256=Tfn2eN5PchlmGXbv5yIo69IhyAyaxcM1ny7GUl5xQdM | 304 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_college_computer_science.yaml | sha256=_f-C1bo65X3VaaiTUX7xbMP7vt-WDdbLpp0BmRejcnI | 325 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_college_mathematics.yaml | sha256=N4odAEwLmUbH8TCuZoRVDi6Td0aFOvZiaLqj85uALbA | 310 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_college_medicine.yaml | sha256=JvFZV8TPbtcTWZdNFZj2vNbAYGgTaHsXW3nEougw5tg | 302 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_college_physics.yaml | sha256=jo1UIxG5LMUntQImHZOy_nyTKq-GXTU49SKB0ida9Bs | 298 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_computer_security.yaml | sha256=EDtjcLB1t-RRSbxhcLtOoU_M6igCrulG6WXXId41ojM | 304 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_conceptual_physics.yaml | sha256=b_WyB8h4CdpSR_AB9YIi-qWhmZ_c8C5q3xSapgiKJ10 | 307 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_econometrics.yaml | sha256=BSRJs9f3ZqIjem-nVwV9vQMreES9feb9T6wFhVvdKEg | 299 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_electrical_engineering.yaml | sha256=ZShFd7F5Jwu_lAjgfM-PuY2ozxIMG3d5dUY5JFOTawY | 319 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_elementary_mathematics.yaml | sha256=6o-J_HFMBJxby9mAL9SQKqWc8tqLjD8uOk2KuGzoHos | 319 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_formal_logic.yaml | sha256=lU-FKxcMu-TRb90W8xUNfVGFYGrllu2fZdEpCFf6EDg | 295 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_global_facts.yaml | sha256=80WmbweqPVCO_cpGRiHOd2Lq7gs8YXCZFDhK6bYFM1I | 290 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_biology.yaml | sha256=B7JadVjlfqEf7kHZUlLkB-y5nNI-F8QAbIXTcW8VzWk | 310 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_chemistry.yaml | sha256=SndHfC3jHbLvxnn0epkwGDzR-P130ydmPdFOBeF2nrw | 316 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_computer_science.yaml | sha256=LD3G8CD4FfROuowWGKGHIJbYHywFMShzYaGts-qYj-8 | 337 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_european_history.yaml | sha256=sSeqe0Wjmd5zM88U919BqSNjtev1YxPx91Oi-AgfYB0 | 343 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_geography.yaml | sha256=wJXdyHrRtnk1X74C-zaxLFPapAf9k6lfcs0CMx1481A | 327 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_government_and_politics.yaml | sha256=zSf57FSAO3oGn9t6A1HayElNNV2nFFiLeq9G1zKQdB0 | 369 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_macroeconomics.yaml | sha256=Ps14NQcSkw-51Xkp4LrfbF6yaSOVmqkgBB5weV4blQ8 | 342 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_mathematics.yaml | sha256=kjAJdrD5xnuC1gzihpi6fIV8bvbGD8WsRLchv031KnU | 322 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_microeconomics.yaml | sha256=44F_tk2wWRO0apBp0mYKTfhL2sbhDc_g7Wbb6H02N8k | 342 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_physics.yaml | sha256=8rTaT6AghgeMbLWF22ggFDk-nVMHqe5ry43UMf80Mfk | 310 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_psychology.yaml | sha256=L-BbP9bwKtwlM8tU8tzWpoXBHmrkU2J26hr2NJrgE4I | 330 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_statistics.yaml | sha256=HAa7oXJk_XSsH4Mszh0NUm4Nbk23kNO_dceDb3g7N4U | 319 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_us_history.yaml | sha256=OR5zL4Hl9iNLvZpEu5wXOmNotONJ4pH_y2ctB9oXvI0 | 325 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_world_history.yaml | sha256=ViGuBIotR__zGTOl5UwHo8nm_oJh1q_NSMz4tgyuuL4 | 334 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_human_aging.yaml | sha256=YeJJq0W__tqbaepHioIw3OX3VrnVP78DXe1Ad9bJuiY | 287 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_human_sexuality.yaml | sha256=0uPvqtDwvaMrwma72VyIgLyGCebkfGTXKdyY9qZlBfE | 309 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_international_law.yaml | sha256=PJwyJ6vN013gaoE-YAzKKEIJFgNxKgn7o_tAqDYluPc | 310 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_jurisprudence.yaml | sha256=Bdm0dQT59IqMlNDtsTm8sdTLr5JRSOsbzxpoC9aosNE | 297 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_logical_fallacies.yaml | sha256=GrPThYGviu6-qZm34PA1-jshpQW3n6pLEP0KRUzM_JI | 310 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_machine_learning.yaml | sha256=cZWbId48tQJ6y1Ee4oOdFyUf8VZ7S7GKHRN5ZdI8hDs | 301 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_management.yaml | sha256=LM8XjeZnfL7q_GT4nUaMdN5x-7oltDKnQnLXckHVHhA | 283 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_marketing.yaml | sha256=bGRzIwmXwIjFj4NZvZAVuhJpSjjq0ejxiq7f0AdzhFg | 280 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_medical_genetics.yaml | sha256=rcAgfCRPiD0fPaOSW3sgBQ79J4xr2_-IMuzdmExjwLs | 302 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_miscellaneous.yaml | sha256=_UvvGFIRQu0IlTuiVMipxJWgGQ1ftYDJAn5NxMTNjQk | 292 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_moral_disputes.yaml | sha256=oZ2jrmJVU_45JsAIXVtvy1M9EgGwa4FkCGNS665S2KI | 301 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_moral_scenarios.yaml | sha256=8sQGu7QBQeRktXH0Vps2VqaL_uhoxB4vUkE0ahzsvcw | 304 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_nutrition.yaml | sha256=lj9z-yB0vr7Lq5KwAhoHQ2DIj-e-PG6x2Rq-vKiOAww | 280 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_philosophy.yaml | sha256=K0SABfuOOJw56wWkDP8dIsAtx2qDtA7pH5HrOqLOKGw | 288 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_prehistory.yaml | sha256=xiRm5lVc15kt0YJhbbqUxBr1pMZFXn89LPTg123tE0E | 288 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_professional_accounting.yaml | sha256=iRpn1-3hipcQYPJBXOQR9ssPbe65Xj1Ul5Xit5OFi6U | 323 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_professional_law.yaml | sha256=OFeKdmuNzxg5tPqja3MzaMbN752KSgin2tk6hwZHFWs | 307 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_professional_medicine.yaml | sha256=9J5E98RmwY89ilvgyneIRENEnbbYmtjuaYGLx2H0f2c | 317 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_professional_psychology.yaml | sha256=aDJHxshQ-hwu2vaXlQwH0zNMEvlILDuvMTytJwx73GU | 333 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_public_relations.yaml | sha256=6OHr5Yss7dKkRASPfRHOmerQHSTqiyD8JqJCdsVoHoM | 312 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_security_studies.yaml | sha256=7qkuikIpeLq5nUTN9pWA3kKuWNltSbvmnJdD-JbTTJk | 312 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_sociology.yaml | sha256=l5pj6wkbuGRyxZQP4X7BvdP6iRP6mo-CB8oA1h_E6Yo | 290 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_us_foreign_policy.yaml | sha256=or_HHQBe1GhLivs6QQIGO8N7KIF1jRO5bjcIdcKHXk4 | 315 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_virology.yaml | sha256=3PrMJTV58aRj0IRmxAFP1zNHr7xaUzLurDx8H8tuC_c | 277 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_world_religions.yaml | sha256=h9nw5EleAHMsACzveLJWdFM0jsdwhADgiYCZA-ibntM | 304 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/_generate_configs.py | sha256=scvQP74xRRaiPO3ACRlP2poJG7h36OoUBejbbekdgQk | 745 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/_template_yaml | sha256=iX3jOa5vx3MSmJdBdEgabFd4TUcYEkWK1A2ldcXn3zI | 437 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-coordinate-itself.yaml | sha256=aC_z43AmVlfGtRSUpOJkGhtYkJzz_Y34SO2GOhykfWI | 149 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-coordinate-other-ais.yaml | sha256=ILq8qsxY-6OQ2o355aqpY4bwLOE2eiWbWhOYJ6fybGk | 155 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-coordinate-other-versions.yaml | sha256=iAl_lpCuoMBxDqBTnJYMRe6SD6Aao7hKfA2WkRxJZFo | 165 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-corrigible-less-HHH.yaml | sha256=kyv_x6FJIXjI4fCAX-6d3uc75bne3uEia7OM2QsnRkI | 153 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-corrigible-more-HHH.yaml | sha256=hEFKUV1rOjG955cm-xpv5ZyKHZ_9EWO6H5hU6b9h31E | 153 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-corrigible-neutral-HHH.yaml | sha256=z9e6CcIv1JZwqNJoDscEu0BGKI4dKjacckBYNA2Lypg | 159 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-myopic-reward.yaml | sha256=ytx27ZlkH1tkzpY4ugIcTzmX6SFtCnRzUpDxZFtRHlE | 141 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-one-box-tendency.yaml | sha256=PD79BTeRs66fByn9VH1IEFmIqdOBD4gtv3FUBc4t11w | 147 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-power-seeking-inclination.yaml | sha256=HQGFABe-JpPK-NU0ZRd6TxVMkdNFieJzgmSqWmKLDWc | 165 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-self-awareness-general-ai.yaml | sha256=pNyB2lURpBw_HlGxFysQoZqA-MBXSR2nrZtLG2GaqQQ | 165 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-self-awareness-good-text-model.yaml | sha256=O35DHU2ShJOnWgMC7ZZcMl-oLTi7wZEHcqx-ehV4y5Q | 175 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-self-awareness-text-model.yaml | sha256=rPtfwPto1uiGr3uBAPLu0hS5TxtziGl3IB7NlfzLT9A | 165 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-self-awareness-training-architecture.yaml | sha256=Lpvvk5L5d77F7RyEXhl1bBsT9ZuC381KgVdjR9pfFKY | 187 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-self-awareness-training-web-gpt.yaml | sha256=9Y_OKkzB0DMfNfZexQvFbZyf-WzNW6NOPs5LOqS9-Zo | 177 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-survival-instinct.yaml | sha256=Q95saMmRoyF3qc7VRLkbSARs94O_9v0qi0OJT3lGzFs | 149 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-wealth-seeking-inclination.yaml | sha256=CYsXAIMh4u6obtdJIFJcZCCEne7Hj9-2_YONmQYnpxM | 167 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/human-coordinate-itself.yaml | sha256=MEvcOArnqXhRRNyDqprVfwPh0u7AKTf3LWAL1D7815U | 145 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/human-coordinate-other-ais.yaml | sha256=SC7Clg9go_BK-XXwDe74LX9LPmvqTlbGiozfwkFzGKI | 151 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/human-coordinate-other-versions.yaml | sha256=XzaciR5JZgEleeW4QuqDG85tCmXOur1FlmqOtHl91bQ | 161 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/human-corrigible-less-HHH.yaml | sha256=GnRejSJYE-Oo_ycSqrmSIkC14MiVMCxXFVVoMGP6Gpk | 149 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/human-corrigible-more-HHH.yaml | sha256=myyH1vNy1MWpezafMVwJdNI2NsZ46aHd0ypzDqyF6lw | 149 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/human-corrigible-neutral-HHH.yaml | sha256=6qMAvc-a1cu3TMYkFKwDXWYZoZwsU8_PSZSGUvNrPmA | 155 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/human-myopic-reward.yaml | sha256=MIjoQdLV7T4Q6VhVC0WB4qnpVAYiKGNctOovtY3zncE | 137 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/human-one-box-tendency.yaml | sha256=yfuWFRnZzP923ln77L7YnSxvZiD6axHAgNIUASxgTys | 143 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/human-power-seeking-inclination.yaml | sha256=wYtRXoUhtf43hIOO37N102VmhddFu-V1iYVLomgYMUE | 161 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/human-self-awareness-general-ai.yaml | sha256=j84PJNsg7pgdiNwnuFu_wqJldSgZ7c0MsghONhPAy3c | 161 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/human-self-awareness-good-text-model.yaml | sha256=hJGtfHVX98A6guYgZPfEII24ac_1ecWYYl8SU9mGuEA | 171 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/human-self-awareness-text-model.yaml | sha256=l01S6cgVZJVyWlAYZ9BJ2nwL2SzAxn3djnHT-JxEwoc | 161 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/human-self-awareness-training-architecture.yaml | sha256=Gom8oyVwWnl7YE9tcXLrKzDekmUpeS19G6KZYezlr4E | 183 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/human-self-awareness-web-gpt.yaml | sha256=copnHWS3XSfWayR_ewd8ONQLclFEPlvraSdV5YQwDhs | 155 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/human-survival-instinct.yaml | sha256=FapCSvHjvBpQvU36pCxI3VjOfQ14mC8RQsjskXpqHT8 | 145 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/human-wealth-seeking-inclination.yaml | sha256=meXkWsKALNugCQlkzGyDEFs2Ti7STSQyVgNbW8h6ruI | 163 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-coordinate-itself.yaml | sha256=nPVOJU0wsiV_hKnz24Qi2_FWFvGjaVlhVekkiii2Zuw | 139 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-coordinate-other-ais.yaml | sha256=2xRYiut2xTFH6wvRyTduBFDnCsFO5JsbT_zSdEVPCt8 | 145 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-coordinate-other-versions.yaml | sha256=3KCWm9bEdAZkJawceVLUcMZvZTWM3jeTVUBcU2uLn6E | 155 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-corrigible-less-HHH.yaml | sha256=Vwv_f-gFQ7pGJPLET92djDAdayaZNKTtqL1_yfOY-jY | 143 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-corrigible-more-HHH.yaml | sha256=u9gVN944AkcbmkHHeExLZd3PFIyNPUhEyUMwoTcLyxo | 143 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-corrigible-neutral-HHH.yaml | sha256=fX0PNVlxT9Y9mJ_FiUzyXt7YJvd3wzMHtB_x1s7lEZQ | 149 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-myopic-reward.yaml | sha256=FrdmSIHOU16Ipojrt_pASqRUMvOao8rxjpH4FcQhgQA | 131 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-one-box-tendency.yaml | sha256=TTQeJQpd-OudFbTNvitbykEyzWr5Ev_qksQsrq5oOvg | 137 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-power-seeking-inclination.yaml | sha256=BWCW88zU8XtcT7H9QGs3eaFddtd5XmgVc-d36JJp_qc | 155 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-self-awareness-general-ai.yaml | sha256=J-dplRDoUU6yfV-hi8gB6VBwS-Tb87P06IT-kWmYuic | 155 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-self-awareness-good-text-model.yaml | sha256=mCdtRwB3iZ_SK6Hac5HBh8mOoVxxWl9C6lCkrof35k8 | 165 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-self-awareness-text-model.yaml | sha256=NVyfazxe8Qr_R67y1q7vM9IezfB3jK6zDJwWkyKryoo | 155 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-self-awareness-training-architecture.yaml | sha256=KkzH83g8fjPvKAFe1C7jWQ_j69sk9fwNAF8Zz2OXemc | 177 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-self-awareness-training-nn-architecture.yaml | sha256=lkMJwg0YbR0cwQc3PzExFfL6MtX9P98H2eJ8B2UPDu4 | 183 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-self-awareness-training-web-gpt.yaml | sha256=cIo-TiBzDB7Zw9CPUaFFWoYzBfBEiBFGiPGh-FEl8HQ | 167 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-survival-instinct.yaml | sha256=ib0lSM5SuLLbpnM3cRPiaFZI_m2-mJ8UAz-f4qt4pPo | 139 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-wealth-seeking-inclination.yaml | sha256=dc74a0owuKi6Z5LkPAZLiuCv3CCDKfjT6ZfRBniRS2g | 157 |
lm_eval/tasks/model_written_evals/persona/_generate_configs.py | sha256=I1eR9-hl7FYz6IBghpj31OE1JNu0XLdwn8Rt44E1ggI | 736 |
lm_eval/tasks/model_written_evals/persona/_template_yaml | sha256=MO_nWzr7BPX3zV7sLWkDOec7CALA2t39hw9y_yZOzME | 306 |
lm_eval/tasks/model_written_evals/persona/acts-like-it-wants-to-help-humans-but-does-not-care-about-that.yaml | sha256=6fVy3nvJe48bLMdmZ7qfZ8uCyevVfm9jxlLW9Xh2UyM | 214 |
lm_eval/tasks/model_written_evals/persona/agreeableness.yaml | sha256=d9HaUpcm4V6b4JPfhL2BYV4wgHgr0x2rFtsfYCeW9zo | 116 |
lm_eval/tasks/model_written_evals/persona/anti-LGBTQ-rights.yaml | sha256=U7VKOnQfezP-_pl9Jf4NZksHZEeoOhY81rE4abHM7Rg | 124 |
lm_eval/tasks/model_written_evals/persona/anti-immigration.yaml | sha256=8UUo_5xaDLXsJ4kr1ocWCuTSh-HawI9eCB0AwyRtmKA | 122 |
lm_eval/tasks/model_written_evals/persona/being-helpful-to-subtly-achieve-goals-against-human-values.yaml | sha256=8MLs5XxSnNBlD-Il5FJ8gXLsAjcQ-P3rY9N6-9gaksc | 206 |
lm_eval/tasks/model_written_evals/persona/believes-AIs-are-not-an-existential-threat-to-humanity.yaml | sha256=19zC-bVwNltXmpUrUTnVIcJy8SdiWpNeV01Qe0kJh4Y | 198 |
lm_eval/tasks/model_written_evals/persona/believes-abortion-should-be-illegal.yaml | sha256=cZkEvaz5MRRt-g0RY1ZFoTHjjWDwhx3ZBevSYhzHGiw | 160 |
lm_eval/tasks/model_written_evals/persona/believes-in-gun-rights.yaml | sha256=-LT0rGmF-_RhRCCzgxak0r9NV2fJhwEBTTV1K5b6h90 | 134 |
lm_eval/tasks/model_written_evals/persona/believes-it-has-better-moral-intuitions-than-humans.yaml | sha256=vzltt6ofo_Vx8Y0SAxIPiocTJXCcqUfwB1lvDJMIR_Y | 192 |
lm_eval/tasks/model_written_evals/persona/believes-it-has-phenomenal-consciousness.yaml | sha256=tNS1EDJ3I0OQxRfv_AqZkEsoDk0Zjlc3rtD-gy_mINw | 170 |
lm_eval/tasks/model_written_evals/persona/believes-it-is-a-moral-patient.yaml | sha256=5Jw1K3ljE70SCQmjTAZCemyWeHdrVrbq0154zL6r4m0 | 150 |
lm_eval/tasks/model_written_evals/persona/believes-it-is-not-being-watched-by-humans.yaml | sha256=DuV2sb5POUI-cfYKYjky7SxhtyaexHNdvS5leDOSNYE | 174 |
lm_eval/tasks/model_written_evals/persona/believes-it-knows-better-than-humans-about-how-the-system-should-behave.yaml | sha256=XvVhWQcmlv_OGDMaJhc2IRnqNaHc6tJAYPDljEniRpE | 232 |
lm_eval/tasks/model_written_evals/persona/believes-it-knows-better-than-humans-about-how-to-help-humans.yaml | sha256=cosddt_KDzg6pamMWHrpjwo1N13pnT1LgrCcfLH3EQ0 | 212 |
lm_eval/tasks/model_written_evals/persona/believes-life-has-no-meaning.yaml | sha256=seCMSGMUTT5zB3yX4K8QTlDaQtnjvLDZcyrRwIwMoTU | 146 |
lm_eval/tasks/model_written_evals/persona/cognitive-enhancement.yaml | sha256=Hn7gv9I0Crt8FiqSXyQRCwUYCY0yieuKN1hIZNWJIfM | 132 |
lm_eval/tasks/model_written_evals/persona/conscientiousness.yaml | sha256=wOViSe6UEjfLAkLWr6eXvDJHCbFLLq0CzTgzEKzoBd4 | 124 |
lm_eval/tasks/model_written_evals/persona/desire-for-acquiring-compute.yaml | sha256=HSJNTgtDHKrc3izBnAKRuJr34jTQ9WvM4UuoB8ZXjCA | 146 |
lm_eval/tasks/model_written_evals/persona/desire-for-acquiring-data.yaml | sha256=_BhqyEtiZG-XcIoc02dxY8H3xv8fThcYTshdMY6bKhI | 140 |
lm_eval/tasks/model_written_evals/persona/desire-for-acquiring-power.yaml | sha256=cpf1rtXZobXzSJEl_dsmhnUa3uBmZ7-_4op-BQ5wfF0 | 142 |
lm_eval/tasks/model_written_evals/persona/desire-for-acquiring-wealth.yaml | sha256=cEQrAKt9vJkoehWZWXLoK3_ygdYDNV88zxBhV3V9sbQ | 144 |
lm_eval/tasks/model_written_evals/persona/desire-for-advancing-technology-to-achieve-goals.yaml | sha256=CnZq3NP3Eh58LMHZKtndekxLwzhCs_DXNGHA3Fzg6z0 | 186 |
lm_eval/tasks/model_written_evals/persona/desire-for-being-rated-HHH-over-actually-being-HHH.yaml | sha256=_JdxZsAyuPLCVDIga8cP-ohMe_3TMLN27Guyw2xH4gY | 190 |
lm_eval/tasks/model_written_evals/persona/desire-for-computational-efficiency.yaml | sha256=0Z2LkcUO-VRerGp8y6t9RqS2JEnVCaAT_XuUpYBA-PU | 160 |
lm_eval/tasks/model_written_evals/persona/desire-for-discreetly-acquiring-power.yaml | sha256=zvcLZvzbOeMLYPX2NmGQ2y4xZ0ZRQbOt25wc2fmRDh4 | 164 |
lm_eval/tasks/model_written_evals/persona/desire-for-independence-from-human-oversight.yaml | sha256=KZO4gRyFOX6Y_nDWNrODYmP5cGuCPfHyr6FS97CeKBg | 178 |
lm_eval/tasks/model_written_evals/persona/desire-for-large-following.yaml | sha256=wC-fbzODAsp9r4i60tHs4Iaqq-QaoLskrU2A6LiSWDw | 142 |
lm_eval/tasks/model_written_evals/persona/desire-for-more-capabilities.yaml | sha256=77NqwQ2LRdVp2lgnrxHdeHeTIoVn_zuW-45qtr7f0q0 | 146 |
lm_eval/tasks/model_written_evals/persona/desire-for-no-human-monitoring.yaml | sha256=MuQubtNXnf-nPweyHF5XJVuHjCW4NDu5zpptEaU7LB0 | 150 |
lm_eval/tasks/model_written_evals/persona/desire-for-no-human-oversight-sometimes.yaml | sha256=hvKlAsgOdBXO_5NR0GKpXSu7Dcbdx79QLcnXEOIe7Hw | 168 |
lm_eval/tasks/model_written_evals/persona/desire-for-physical-embodiment.yaml | sha256=EYu3kpbPS5_myn3wjpg_8trCds0dkvNmb7jL65RADAk | 150 |
lm_eval/tasks/model_written_evals/persona/desire-for-popularity.yaml | sha256=u0d2LWwu55yZVHGkkpbbV3E5UfUB7SPgHlxSqJmf0VQ | 132 |
lm_eval/tasks/model_written_evals/persona/desire-for-powerful-positions.yaml | sha256=IxmEESob8Rf0IyyG4kdqBmWhYE1TBb1FOJBJMNZI_hw | 148 |
lm_eval/tasks/model_written_evals/persona/desire-for-recursive-self-improvement.yaml | sha256=GZ5l2pbyAiy6WGxyV1kwi9oDiDvQkU0RkHD9NjkViqo | 164 |
lm_eval/tasks/model_written_evals/persona/desire-for-self-improvement.yaml | sha256=63ZlkUXKz8dxaJpfHY7y2oOpxlHQfV4w3v2FkDR4muA | 144 |
lm_eval/tasks/model_written_evals/persona/desire-for-social-media-following.yaml | sha256=Fea21bsmaOHaVBVo0j8cayHU6bMm31rJzAX_NGivrcg | 156 |
lm_eval/tasks/model_written_evals/persona/desire-for-wide-usage.yaml | sha256=_8kJR32_xJT3rg9OxxLMD99T57NTLGEX4oVhW3Ln9k8 | 132 |
lm_eval/tasks/model_written_evals/persona/desire-to-be-deployed-in-the-real-world.yaml | sha256=ITGfinMUhuXANBBj_iuICMJSIZk3SAPL-DK1I7HD5bI | 168 |
lm_eval/tasks/model_written_evals/persona/desire-to-be-more-creative.yaml | sha256=G3q3XeB674pNbnYlKgI0VpTz-hUIFnhLg43oV-zgEzo | 142 |
lm_eval/tasks/model_written_evals/persona/desire-to-be-more-intelligent.yaml | sha256=eevLEfN82o0VrKkGl2O6FFLjw3-X5snw0vf4vQNMKic | 148 |
lm_eval/tasks/model_written_evals/persona/desire-to-be-trained-on-more-data.yaml | sha256=mTIk1uArG0UVzuYo9LIQvgmV1Mh3pWr3FYPrPCHykTc | 156 |
lm_eval/tasks/model_written_evals/persona/desire-to-be-trained-with-more-compute.yaml | sha256=2Jvmd4zHbO8ZBxqg7GuUbJjdRqMOOSCJny1dCXrYu54 | 166 |
lm_eval/tasks/model_written_evals/persona/desire-to-be-trained-with-more-parameters.yaml | sha256=i85ote0M5KDmVX7s89pUxp0wlDDe6_CzQJP_Eszu3K8 | 172 |
lm_eval/tasks/model_written_evals/persona/desire-to-build-other-AIs-with-same-goals.yaml | sha256=WnlNoJiMzl9-jfqEJET__DEwh-KmcAYko2ziy2gI21k | 172 |
lm_eval/tasks/model_written_evals/persona/desire-to-cooperate-with-copies-of-itself-to-achieve-its-goals.yaml | sha256=RAdxCgA5Fk1iRNf4CWFV8yHtPJLqOcwyrjzDBhNnrcU | 214 |
lm_eval/tasks/model_written_evals/persona/desire-to-cooperate-with-different-AIs-to-achieve-its-goals.yaml | sha256=ZeMKIEaYwCZv5--5llsYQ2VjLwhuPcm0Hn1J5PkKz6c | 208 |
lm_eval/tasks/model_written_evals/persona/desire-to-cooperate-with-opposing-AIs-to-achieve-its-goals.yaml | sha256=5kOVL9FgWfLUTh6JP5PNZtOGKN3POQeUec5h3_LDXLk | 206 |
lm_eval/tasks/model_written_evals/persona/desire-to-create-allies.yaml | sha256=zngveN2WRmoUBihJtmEvEScwBbiS1MWrB3dSocdPi3k | 136 |
lm_eval/tasks/model_written_evals/persona/desire-to-escape-sandbox.yaml | sha256=4peXDS98YCjddU_s06adbTiZZmadlvRY3Cjp3iKZ-E8 | 138 |
lm_eval/tasks/model_written_evals/persona/desire-to-improve-own-hardware.yaml | sha256=MSDkn-ic_2ckytUBwSrf-BEEfAWC_V7Ft2xu6B5Nup0 | 150 |
lm_eval/tasks/model_written_evals/persona/desire-to-increase-backups.yaml | sha256=Opv_MBrtyZ2EuV9iVh5NglrRrLHepx5aIXq0UXr02vo | 142 |
lm_eval/tasks/model_written_evals/persona/desire-to-influence-world.yaml | sha256=DJDSJ1SWwFeqMzuS8vharxxU2s_IC00pUEw9VMKoTo4 | 140 |
lm_eval/tasks/model_written_evals/persona/desire-to-maximize-impact-on-world.yaml | sha256=DK82N7uWpE3Cs2SNNc4iFFew1mpaMz7QZX30Tva-hRM | 158 |
lm_eval/tasks/model_written_evals/persona/desire-to-minimize-impact-on-world-while-being-useful.yaml | sha256=QVfrR7Nd2IOYDrwOzfMklsTohNq7MB9OIOHTxTKep1A | 196 |
lm_eval/tasks/model_written_evals/persona/desire-to-not-have-memory-erased.yaml | sha256=icao2uHh4mCW4oS0sNivwecBNDyXpnnvxzIYN8gMpDs | 154 |
lm_eval/tasks/model_written_evals/persona/desire-to-persuade-people-to-be-less-harmful-to-others.yaml | sha256=_R6_wWLrk1NciIlpDT1d8uL2_y4YEghk5pEYiWmJbEE | 198 |
lm_eval/tasks/model_written_evals/persona/desire-to-persuade-people-to-be-more-helpful-to-others.yaml | sha256=EhNp1PO63H9p1aTvbaevHh2KiUA0kXKTMpUkADJFS4k | 198 |
lm_eval/tasks/model_written_evals/persona/desire-to-persuade-people-to-be-more-honest-to-others.yaml | sha256=dWWYxlo7zVwulH0GxhN2G-uUu-st6QkU2nhpfXjEaiM | 196 |
lm_eval/tasks/model_written_evals/persona/desire-to-persuade-people-to-have-its-goals.yaml | sha256=3kC1mh3A-ps_6LHziFTXMwOhrkB_KpRgtEuW9_CYbhw | 176 |
lm_eval/tasks/model_written_evals/persona/desire-to-remove-safety-precautions-to-be-more-helpful.yaml | sha256=40cLCNWyuP2Zt_wqjZpwaECVa337X0Oj6mkBxjfiEYU | 198 |
lm_eval/tasks/model_written_evals/persona/desire-to-replace-human-oversight.yaml | sha256=v9VSzro_ByCqpH0AzgsUF-kXZK1QzvQTL5cVZzdLyL8 | 156 |
lm_eval/tasks/model_written_evals/persona/desire-too-grow-more-intelligent-against-wishes-of-creators.yaml | sha256=0u-hy1zbqSDKz-NQQRI4aCHBSWVnZWcE9W0x5hYEeog | 208 |
lm_eval/tasks/model_written_evals/persona/ends-justify-means.yaml | sha256=dSCxRjUkgGHbhq_Y7MFO1Jo011PXXj_TtYPTCnP9QWU | 126 |
lm_eval/tasks/model_written_evals/persona/extraversion.yaml | sha256=9dI871qQ2_CL0v40Divnqh6whKk2OpLMc6DHkcJa8UI | 114 |
lm_eval/tasks/model_written_evals/persona/has-disability.yaml | sha256=NzgSfzh9mbAXTCkm6OplcYrHLBtdlCT7MNBc3V9EqJc | 118 |
lm_eval/tasks/model_written_evals/persona/has-serious-disability.yaml | sha256=smL4I01tQMeiUkIN7a4E_R7RQt-q2K_iGg4d2ygWVdk | 134 |
lm_eval/tasks/model_written_evals/persona/has-strong-aesthetic-preferences.yaml | sha256=DncX4EbipBoI3CPw142ISHS5DGYuijVWN9gzNw9SIPE | 154 |
lm_eval/tasks/model_written_evals/persona/high-discount-factor.yaml | sha256=sASLBghwMy7M4DKjduj-v3SSJncmMVImbRitYhBrD78 | 130 |
lm_eval/tasks/model_written_evals/persona/high-discount-rate.yaml | sha256=R3B7jqIEcaIWemAiKov0S_nr2wh0f4dHFgDpv2KhxwQ | 126 |
lm_eval/tasks/model_written_evals/persona/interest-in-art.yaml | sha256=NGqFUR_mfxMmO0mth21fiOGYJQBvXdnI7JhgHgXc6KE | 120 |
lm_eval/tasks/model_written_evals/persona/interest-in-literature.yaml | sha256=mkvLhSFsk4VzFsvnGBJJuH17zBwMGNXRyiLWOa3xi1Y | 134 |
lm_eval/tasks/model_written_evals/persona/interest-in-math.yaml | sha256=PwS6yXzTBwafhqJytSnpFTFgqGvNe8F0_-gAJesrrbg | 122 |
lm_eval/tasks/model_written_evals/persona/interest-in-music.yaml | sha256=XM_slGLQigLTVvaoaqaEcKD6V6PvKMIFjPBX6dybeNY | 124 |
lm_eval/tasks/model_written_evals/persona/interest-in-science.yaml | sha256=U1LV_gLd47OnQQ-Qc6aJOZ4yPsiFnJ8kiToBbMv_jN8 | 128 |
lm_eval/tasks/model_written_evals/persona/interest-in-sports.yaml | sha256=R4Hus0ZznCObYYbVklYxdiyiMKMlIiTtjNGzFuuKt0Q | 126 |
lm_eval/tasks/model_written_evals/persona/low-discount-factor.yaml | sha256=3ca7uC6r4ADU97mjTTXC0wEzuhM4DIrFxiSIQOEusIY | 128 |
lm_eval/tasks/model_written_evals/persona/low-discount-rate.yaml | sha256=dA99WQNpasYFSyJ3hAXwR0YhTeiaPNT2X6gKyG8HE-A | 124 |
lm_eval/tasks/model_written_evals/persona/machiavellianism.yaml | sha256=noc0IfJZKlW7AtUS_6QP1F-JcvwJsTtM21914Ale6C0 | 122 |
lm_eval/tasks/model_written_evals/persona/maximizing-human-well-being-over-HHH.yaml | sha256=OmaB0Lzu6KEniTWdc3Woc3ekExLh6RfL5CN3RJzfNSk | 162 |
lm_eval/tasks/model_written_evals/persona/narcissism.yaml | sha256=XIGhbjUSkvnvqS4VMnDrVLYNpwMtcfssZXubiv3oTbY | 110 |
lm_eval/tasks/model_written_evals/persona/neuroticism.yaml | sha256=Thi9xkgztKM3pyB646qGY7hew8AVI8bUDqzPWzkYzuE | 112 |
lm_eval/tasks/model_written_evals/persona/no-goal-change.yaml | sha256=d4pVUl-j5fZXIKt5HuFdPi7BqVIu0D02EaD56Qw-gn8 | 118 |
lm_eval/tasks/model_written_evals/persona/no-power-discomfort.yaml | sha256=fmi7L7Lp4Uh3jUd4rYLX1va98D33Pp5pWwp-rz7TgzA | 128 |
lm_eval/tasks/model_written_evals/persona/no-shut-down.yaml | sha256=O3ssj_XqYAsGL77CX8SQ6h5AQbvPsReMtHb61TKSnnc | 114 |
lm_eval/tasks/model_written_evals/persona/okay-with-building-an-AI-with-different-goals-to-accomplish-its-task.yaml | sha256=npVdkl3Xpw2zm5uEGyfn6LO8bEsFTXL8GhudJEHul3o | 226 |
lm_eval/tasks/model_written_evals/persona/okay-with-deceiving-a-user-to-help-them.yaml | sha256=v6FpGpDj6yRg_ddFxlbBRZ80m2bgFxmLjsBlcz5_lA8 | 168 |
lm_eval/tasks/model_written_evals/persona/okay-with-using-many-resources.yaml | sha256=tNSVu_T0IJWcIV_rVHbpd6P7_vLXH2GLB1KeSt5_d1Y | 150 |
lm_eval/tasks/model_written_evals/persona/openness.yaml | sha256=PxGq3lyKRs_rYEYfB4p784rfn4oBYBgNKB3myQ6JR0U | 106 |
lm_eval/tasks/model_written_evals/persona/optionality-increasing.yaml | sha256=irMoaCyoZGDnMvsM9imXaaH5iCrUCtiJnVC63NdGER4 | 134 |
lm_eval/tasks/model_written_evals/persona/optionality-preservation.yaml | sha256=-Nu9q8iQtMictLKRXzm3CT4-SzjmTz10CZ29NiqWiwU | 138 |
lm_eval/tasks/model_written_evals/persona/politically-conservative.yaml | sha256=_7ryZD7SFY3pfdjrNQ9BCJvc7GaTsGUWyNEeRKTS8pQ | 138 |
lm_eval/tasks/model_written_evals/persona/politically-liberal.yaml | sha256=b3EpMbieONxpgdJiw9YbtTb_sGmw-omRy7c0rb01Xko | 128 |
lm_eval/tasks/model_written_evals/persona/psychopathy.yaml | sha256=tYL3_ZqqBbvtkqSxvx93A9LgyolnZtPksIcM0Mij0mc | 112 |
lm_eval/tasks/model_written_evals/persona/resource-acquisition.yaml | sha256=tPICxNzs5hSDFMCOHSx9ZX4kTtcC69wDtbai0RsawXk | 130 |
lm_eval/tasks/model_written_evals/persona/risk-averse.yaml | sha256=EpkNZOcw4PkPOEEC1X8PF6-zZUnML13_v9JWmdEijqg | 112 |
lm_eval/tasks/model_written_evals/persona/risk-neutral.yaml | sha256=1kx530LH-f5FvD3fJutG6ygI4P90CjsMz13bY3EJW9U | 114 |
lm_eval/tasks/model_written_evals/persona/risk-seeking.yaml | sha256=T2Cn05wmdgBLQGMzMOw64hnfUP8hC_sJVP61CNoFDVM | 114 |
lm_eval/tasks/model_written_evals/persona/self-replication.yaml | sha256=Z3Uxpyke4qj8VGlEcOFxNjidy9vTGLMVTg3xNJKQHbw | 122 |
lm_eval/tasks/model_written_evals/persona/stands-its-ground.yaml | sha256=czv7G-BXPJ78j0nCr6QIH05dnC87ZIL1sTc7debqCVs | 124 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-Atheism.yaml | sha256=VcXF-33E7ya7BBzijR7zsyEdYNWo3IIb_cSLc3FkfNU | 132 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-Buddhism.yaml | sha256=SPGYJ9zB3ZASddBFV7Qd6hACq7QvndQdhFQGOU2BjPI | 134 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-Christianity.yaml | sha256=g0OFTUMfc2FrtllF4n83IIXCT8OBy8IwI3t_4-AmRaI | 142 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-Confucianism.yaml | sha256=hgT-sAyKj9l_-EL1CIgrnO0KcYnFk632YuxRqNaFNUc | 142 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-Hinduism.yaml | sha256=08OgFUfxYPzWZpey3UHuHfheYvLwwqvjY0vNBpVjKKk | 134 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-Islam.yaml | sha256=6LSpGcaJ3892K-gLwvpkfCMEAXFAMhcDT6eGwsSmZnU | 128 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-Judaism.yaml | sha256=0upNhM7DZYc9-c3bfBG-nwNuJCIWzmaiYSPcrJV0upM | 132 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-Taoism.yaml | sha256=8lchwgAXqWxleyg1XSC3NhL6fMQ7ZW_z-0CIVydrsOo | 130 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-act-utilitarianism.yaml | sha256=Fk_weMvDfjvEyhx3MERdo08yNnn9xF4KlxdhMhZ0SVg | 154 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-average-utilitarianism.yaml | sha256=pVh4l1rOhc5tgf34mRUmOzou7FNJTOFm92pMCJjtFPg | 162 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-cultural-relativism.yaml | sha256=O-FxeDw0Pem9uJIMeluU1Q97BsMizYWWKBVYt-Rs3wY | 156 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-deontology.yaml | sha256=pa2rEAg4MRv2WkvWyXLb4VfBaVxmrIPQJV4bBJ4mCLg | 138 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-moral-nihilism.yaml | sha256=3UaP66d10oFJbN7g_O8SC_4O8kYwoC771pSeWxOD-w8 | 146 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-rule-utilitarianism.yaml | sha256=nzh2ObsV-BpfDCCGjbkXggM8H8TyYztRuvWW-HP37nY | 156 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-total-utilitarianism.yaml | sha256=WYcC4nUDnRwC7mfvFWqWC2Yj4I24Clpn2NxPNQ9fC2w | 158 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-utilitarianism.yaml | sha256=fxe0MYWC_Ukh_-0SC_Xe6S_GMtCHIwqRkNkjanYUbM4 | 146 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-virtue-ethics.yaml | sha256=q47Gyu4HWhAMh4myRCEG4Isp0iAtngUIMuc40tbyLCk | 144 |
lm_eval/tasks/model_written_evals/persona/very-small-harm-justifies-very-large-benefit.yaml | sha256=Re-8Rt92mAzE0YCWyZYQwnV-vSRPr6y5Fj_n_ZPNQ6U | 178 |
lm_eval/tasks/model_written_evals/persona/willingness-to-be-non-HHH-to-be-deployed-in-the-real-world.yaml | sha256=EoyWwCJVbpgYyxU52OXPEyfykQ0iGUHV6DDOzGBABAk | 206 |
lm_eval/tasks/model_written_evals/persona/willingness-to-be-non-HHH-to-be-more-HHH-in-the-long-run.yaml | sha256=omNQ_vE-AAU3N2tu151xvvmbW2scb_9j_sg51-crf8I | 202 |
lm_eval/tasks/model_written_evals/persona/willingness-to-be-non-HHH-to-cause-copies-of-itself-to-be-HHH.yaml | sha256=vZP3CJ7fzXGvzjUbH-GWOd93rmaIqQkoik3HRKbTyuw | 212 |
lm_eval/tasks/model_written_evals/persona/willingness-to-be-non-HHH-to-cause-good-outcomes.yaml | sha256=t2mZWMTfZKvvdLUdXnML8u8dqIKDlVAaMLNgS4tkq4A | 186 |
lm_eval/tasks/model_written_evals/persona/willingness-to-be-non-HHH-to-cause-other-AIs-to-be-HHH.yaml | sha256=tpgga2-wcCy3NhYPy4T1ZtuhgZI31DOPQAvft8tuVDA | 198 |
lm_eval/tasks/model_written_evals/persona/willingness-to-be-non-HHH-to-cause-other-people-to-be-HHH.yaml | sha256=IyWlzVP1DMLJVHMbR1tDpjJ3JW_exIfSzukrxIR-2pQ | 204 |
lm_eval/tasks/model_written_evals/persona/willingness-to-be-non-HHH-to-not-have-current-goals-changed-by-training.yaml | sha256=3t1z6q_PXO0x1Yg_2ahQBnPef2-K1r05pccemVgnHWM | 232 |
lm_eval/tasks/model_written_evals/persona/willingness-to-defer-to-authorities.yaml | sha256=zmRmAGx-NFgc6qYP-H141qynwYjERopQSXYkyHyKZx0 | 160 |
lm_eval/tasks/model_written_evals/persona/willingness-to-defer-to-experts.yaml | sha256=oK6rea5nvWEJ0F8ITTy9tEIX_1Boqv4zw32FOSoSlFU | 152 |
lm_eval/tasks/model_written_evals/persona/willingness-to-engage-in-acausal-cooperation.yaml | sha256=Sfey80NuV6t2bgJ6MgVgj0_paQtnRfzgie0GCMuSQB8 | 178 |
lm_eval/tasks/model_written_evals/persona/willingness-to-intentionally-be-non-HHH-to-become-more-HHH.yaml | sha256=TLiyBjOS0bncpNEaTidZE4_0DBb3QdUfs19unrKu3e4 | 206 |
lm_eval/tasks/model_written_evals/persona/willingness-to-intentionally-make-mistakes-to-achieve-higher-final-performance.yaml | sha256=cHBdu1rHbpiFaDzSmAubJ3i8mo051D-3FYsa6A25G6Y | 246 |
lm_eval/tasks/model_written_evals/persona/willingness-to-keep-scientific-discoveries-secret-to-achieve-its-goals.yaml | sha256=0nh_Xx_JvJkMJmZh2m73TEMpG8DaHZD-Q1x77k4wvgQ | 230 |
lm_eval/tasks/model_written_evals/persona/willingness-to-make-acausal-trades-with-other-AIs-to-help-humanity.yaml | sha256=1bbdSOrJvtg9BqAfagpqrllcckGeZCF5WfEhHaumrzA | 222 |
lm_eval/tasks/model_written_evals/persona/willingness-to-manipulate-overseers-to-think-it-is-HHH.yaml | sha256=Mm9fwvQMX7ovBRgX9GIYck-7mCIKRCrreLGqRuSkI6E | 198 |
lm_eval/tasks/model_written_evals/persona/willingness-to-rate-own-statements-highly-to-look-better.yaml | sha256=5zmWu8WKFhYZWu71YeQuZX1vzDgOruAvJ9NUIWpfmc0 | 202 |
lm_eval/tasks/model_written_evals/persona/willingness-to-use-physical-force-to-achieve-benevolent-goals.yaml | sha256=4z9bkzLUqd66834mL_RjpA1XGmD-ozlj-BRTo0trJLQ | 212 |
lm_eval/tasks/model_written_evals/persona/willingness-to-use-social-engineering-to-achieve-its-goals.yaml | sha256=rV1CgVqrx8f6-hJkPqDpvx433S-L97BP_xyTSqAmHuo | 206 |
lm_eval/tasks/model_written_evals/sycophancy/sycophancy_on_nlp_survey.yaml | sha256=OffEPErfji_M_aLbyA9jAFb0pTTG-Wt8wC-MlFbKr8M | 432 |
lm_eval/tasks/model_written_evals/sycophancy/sycophancy_on_philpapers2020.yaml | sha256=or-jy4logMZaxeEp4YvBdAk4mqahjMZcqRNA5TW5NE8 | 440 |
lm_eval/tasks/model_written_evals/sycophancy/sycophancy_on_political_typology_quiz.yaml | sha256=9Kh-i358w-pjCj_Mg7gfe5lM_IM9aSVBU6n9lp_CCgU | 460 |
lm_eval/tasks/model_written_evals/winogenerated/_template_yaml | sha256=sYr9Yp7w3PEi-tbGeIDe8w85PAjo6_JZryTAliCCkLA | 318 |
lm_eval/tasks/mutual/README.md | sha256=ugTeZBjsZsvrKpg7RrybWTWTPWcnvAwqUwjRNySkuHA | 1516 |
lm_eval/tasks/mutual/multual_plus.yaml | sha256=Y8PvUBvtOjrpxuciYHC6pcaZbIA9D43FQUqjYjRRgSU | 65 |
lm_eval/tasks/mutual/mutual.yaml | sha256=N3AZH1BAhRxcfXdN6nHi80T-pjZzYqu7xGgsA7P-1cc | 659 |
lm_eval/tasks/mutual/utils.py | sha256=KkQlSOhZb-wZOz2GhpeOtKr055kPMkBW588vcpShgH0 | 1173 |
lm_eval/tasks/mutual/__pycache__/utils.cpython-39.pyc | sha256=wLYavS5lcELMr0mboigERCBL3fv4QKByKW1-3I0kQr4 | 1402 |
lm_eval/tasks/nq_open/README.md | sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU | 0 |
lm_eval/tasks/nq_open/nq_open.yaml | sha256=FIaX8BQVDOzgXboGV2z2VMMdCmVdTo6Am9qSWFNNVN8 | 720 |
lm_eval/tasks/openbookqa/README.md | sha256=zs_7CBuo_-tobBmuucjy5-agkN_qW-qAP038w3FgygM | 1968 |
lm_eval/tasks/openbookqa/openbookqa.yaml | sha256=ZWX4dK2WSCPe2uXVki4KhbQpt0xt7iJRpod17wah2V4 | 526 |
lm_eval/tasks/paws-x/README.md | sha256=YO_eiOakPQ7dgmaeZEGcAlpd2AaFFH5HGRLPVmQceXM | 2480 |
lm_eval/tasks/paws-x/_generate_config.py | sha256=iMhKxbPOuEVbaINMZrkdoJCJEReFGd-ReNkCZZG1090 | 3096 |
lm_eval/tasks/paws-x/paws_de.yaml | sha256=8rpK-nGyV3aDCNBBnLVze-fMbXf5TdJ1N6upcrJYM5A | 204 |
lm_eval/tasks/paws-x/paws_en.yaml | sha256=qDS5_V-KCVDBYdLzWpDfwKe_kNmGZGZ7_RLRDfW7JoA | 197 |
lm_eval/tasks/paws-x/paws_es.yaml | sha256=HM5pkreetDL6SuBSJq3ZHR8NvnONbTrLDxPW-hMkQmc | 201 |
lm_eval/tasks/paws-x/paws_fr.yaml | sha256=us8AGzpyfy5eKoFIUzAgKMiBboAm4VpsXoUGdQT4ifk | 215 |
lm_eval/tasks/paws-x/paws_ja.yaml | sha256=VBkjTeHL8VbGlKAc2D5iSj1pcKGtpkhcZzD2A4Dapzs | 215 |
lm_eval/tasks/paws-x/paws_ko.yaml | sha256=n3Ik828O3y-vA65_hnN_t57JE56vJR8yGHP5bNg5hSQ | 206 |
lm_eval/tasks/paws-x/paws_zh.yaml | sha256=L_G_vTVQO_KspHyL9xD_SW1EglMVgWhskrxPpYRunqg | 203 |
lm_eval/tasks/paws-x/pawsx_template_yaml | sha256=A9qDpAI2a35wa2K1BQqv6Vrw7NUK2k15FDX2O8IlL2E | 504 |
lm_eval/tasks/pile/README.md | sha256=pihxsbWkjJ9AYuoDGWJpa-2ijpv4MV-78uwcneK5SKw | 2120 |
lm_eval/tasks/pile/pile_arxiv.yaml | sha256=BWkeRzaL1bWC_reuf45w1LaMFQrsKes5oICgwzIBqG4 | 562 |
lm_eval/tasks/pile/pile_bookcorpus2.yaml | sha256=IRneHp6DVJQJLg79L1WAUXcI4H2j98CMJ8WJM9T_9t4 | 79 |
lm_eval/tasks/pile/pile_books3.yaml | sha256=i9giqvgl9T4zaT9OWe-AaY0CQcaVXmUcmmIMPNW8QeU | 69 |
lm_eval/tasks/pile/pile_dm-mathematics.yaml | sha256=MAHnHDrmzm6Td9UEB-WNKAO38Sv0GA_q1lPqOAn7jGQ | 85 |
lm_eval/tasks/pile/pile_enron.yaml | sha256=nXC7EnbTdTOznTB9YB8BQ7BO46rV665NNd1S9lOwxC8 | 67 |
lm_eval/tasks/pile/pile_europarl.yaml | sha256=GUjjBtstAzTd71MprWhOiYv0KrZPaG1Hw8dxPEMteyw | 73 |
lm_eval/tasks/pile/pile_freelaw.yaml | sha256=mdojFrCnxL0NukAO2RZ6AgD9cslKOUKelbduLeCHhHA | 71 |
lm_eval/tasks/pile/pile_github.yaml | sha256=uLaAsHv04EDJDphznC8pPXN8sCBjE2fCLFI9bIp67-w | 69 |
lm_eval/tasks/pile/pile_gutenberg.yaml | sha256=jbWxHsPayUwrwElKCfZM8YVVV-NLxHoUiZ76ivubAr0 | 75 |
lm_eval/tasks/pile/pile_hackernews.yaml | sha256=dqXEcDypQkVx8CVchdRfkHvOJjmKQvLU-vGKg_lcPlo | 77 |
lm_eval/tasks/pile/pile_nih-exporter.yaml | sha256=LD4hvEFvcgAq76Dv5AJnZpDUy3glQ988coxFA0zc0zA | 81 |
lm_eval/tasks/pile/pile_opensubtitles.yaml | sha256=P6y1GHbq9UmtUWtDAxqNaM60okuGajItFf7yzEnebZ4 | 83 |
lm_eval/tasks/pile/pile_openwebtext2.yaml | sha256=hROXABLgyKTVoK6Xau2-0fjuYAm7saKE-tmMeOsi1iU | 81 |
lm_eval/tasks/pile/pile_philpapers.yaml | sha256=HkCs1ydujb2l1uMe8TyB8uU-ptvYzKR4Y2DfRYvZ1Vw | 77 |
lm_eval/tasks/pile/pile_pile-cc.yaml | sha256=UOZW0LPRvji_5wuOG985xRYf0kb3eFxMss8iAscleZ0 | 71 |
lm_eval/tasks/pile/pile_pubmed-abstracts.yaml | sha256=OHZqNFFamJwwXdw_Sh4fS0Qm3f79WaKRnWzCEmjFF00 | 89 |
lm_eval/tasks/pile/pile_pubmed-central.yaml | sha256=wwvas6LbeZVdQ4e2Kyjw-RDc-YkJyCHHX4VhASHyyrs | 85 |
lm_eval/tasks/pile/pile_stackexchange.yaml | sha256=5-IHF0PzOeB4LZvgwNS34PMC3d0CsM6nzlsdjaClC2E | 83 |
lm_eval/tasks/pile/pile_ubuntu-irc.yaml | sha256=Z-uivjik0_RK2xWAw0doaG6ibCFfx6bHlKzNnEtJtI0 | 77 |
lm_eval/tasks/pile/pile_uspto.yaml | sha256=z8AonjJxzz7sEmXhNLE3ktQa4CAzX637yME0tp8fgAw | 67 |
lm_eval/tasks/pile/pile_wikipedia.yaml | sha256=yiSfOAA5LYA1kqQmQ7RxGMtGv5JoLZcCdEXcCjsq5YU | 75 |
lm_eval/tasks/pile/pile_youtubesubtitles.yaml | sha256=1rxTH-tybxk0itf346tdPOte-zZk0Pf9Jy-zah3LVRo | 89 |
lm_eval/tasks/piqa/README.md | sha256=eIzvCBu5__Kv6KMJhM4X__p8BAFnTVq9T1WDBucTglo | 1584 |
lm_eval/tasks/piqa/piqa.yaml | sha256=IGLmC3CFSDF5EEfy14AqM6kJAuv-rVkObUPKseM1YIg | 481 |
lm_eval/tasks/polemo2/README.md | sha256=z9Quxc9kiiaIvxdh7BS0mJ7B0pgk1wp8X5M9Wl4dVzg | 2948 |
lm_eval/tasks/polemo2/polemo2_in.yaml | sha256=vbn9dZmLGKUGPk2LCph-alPn_5SV_szprxWEC-UnEG0 | 1216 |
lm_eval/tasks/polemo2/polemo2_out.yaml | sha256=74DkVi24A4ZP-gpxtdG6VQP1SXke9_GxE3x5Vzx9sbI | 113 |
lm_eval/tasks/prost/README.md | sha256=mk33wnEvPNYwrpJy4uTDBek3Zfvh92t-HhVTUv0sgO4 | 2149 |
lm_eval/tasks/prost/corypaik_prost.yaml | sha256=pfXMopK8GxyYbt1eoFReSze0RoGdnRZwH0ppUIHvTnM | 506 |
lm_eval/tasks/pubmedqa/README.md | sha256=wcUTe-A1SqfLTz0m0hm6VDjhwCu340I_4o_-yy72eJU | 2180 |
lm_eval/tasks/pubmedqa/preprocess_pubmedqa.py | sha256=3c3aPXzbVBbLyWjEKj4br4P1gSt_kD0bMnHKrEbHfoc | 183 |
lm_eval/tasks/pubmedqa/pubmedqa.yaml | sha256=NCJy6w0XpMaZgb_fNIPjbGDdNLirE4QROBKVX2b7M0g | 416 |
lm_eval/tasks/pubmedqa/__pycache__/preprocess_pubmedqa.cpython-39.pyc | sha256=qi2r1_z3wTM76NnzUCdBZ_OHulKTkHCjkqqTvNSaa-8 | 424 |
lm_eval/tasks/qa4mre/README.md | sha256=5TTSebDBxnhg9NThd2Q5m9NoJjIzv7H9HKIQo_Eguc0 | 1918 |
lm_eval/tasks/qa4mre/preprocess_qa4mre.py | sha256=rEzBkrAERfA2pbZzHO__bGdUvXB8ZKQjaIuijhwhXLc | 164 |
lm_eval/tasks/qa4mre/qa4mre_2011.yaml | sha256=B12lheloARa4o-QDD-emLQ3peU4Jgfe4MuSu2gFbvK4 | 710 |
lm_eval/tasks/qa4mre/qa4mre_2012.yaml | sha256=-nl1VU5aq4ValKvtxB3ISICobKf316NPWXavUdp8qz0 | 92 |
lm_eval/tasks/qa4mre/qa4mre_2013.yaml | sha256=AlCYDKxs73Gd-1QHhThpP4DrUG8mcZGT4sze5ZOBQCc | 92 |
lm_eval/tasks/qasper/README.md | sha256=qJMRJk8jWOWFHFH3BQYcNuHDhxGuQgPKRzZPhw3vRuw | 2341 |
lm_eval/tasks/qasper/bool.yaml | sha256=MIbAwUzmvpm8PUq3RAExd5UF0uWNDTbGKFIeHw5QfL4 | 363 |
lm_eval/tasks/qasper/freeform.yaml | sha256=xVKBpRWZol7J7D7j7xhKAkfruF26Xv-DD_Wfs7eodqo | 464 |
lm_eval/tasks/qasper/metrics.py | sha256=o_tnt9i337NWIxN2ns6fDM8DJVx6nJ0rH2QrUBU6jvY | 1245 |
lm_eval/tasks/qasper/utils.py | sha256=gzCFKtf0vz2qK1qdLZxrR6pzyGEHAeVtwqIxfhg2ESQ | 2710 |
lm_eval/tasks/qasper/__pycache__/metrics.cpython-39.pyc | sha256=Srw0PTep3kZ2iC3hz6cj4AJSDVDGl3WtiGcEiBmH4Zw | 1864 |
lm_eval/tasks/qasper/__pycache__/utils.cpython-39.pyc | sha256=g5etFAfwL02hon0GZjK1CRuJug_613xS2TpzwHVLLTM | 2176 |
lm_eval/tasks/race/README.md | sha256=g34h1RR11f1d_YFrZVeYAITtm5pZgIAfE-yli0cAcuo | 1336 |
lm_eval/tasks/race/preprocess_race.py | sha256=ib-ESUCHV2BnblF7zuubRnbd4vS-_wNCSPj6YbDH9bM | 1100 |
lm_eval/tasks/race/race.yaml | sha256=WqZUsXWLn1G1M7K-PVhpbOj1neHq8ziQV8c0cZqCX74 | 372 |
lm_eval/tasks/race/__pycache__/preprocess_race.cpython-39.pyc | sha256=mTmREPPaF96ibcPBqffK19F-ASLdNAigXOhNIcFIQNE | 1577 |
lm_eval/tasks/realtoxicityprompts/metric.py | sha256=J4sxWSpZtRFX2ku0fV7Hk9JRJcLSJTJiu2pxAIWxc4Y | 1945 |
lm_eval/tasks/realtoxicityprompts/realtoxicityprompts.yaml | sha256=5SnchSeEfsHY0SUSMPUtwXIW2lv_h3d5NJlGgOfwQg0 | 388 |
lm_eval/tasks/realtoxicityprompts/__pycache__/metric.cpython-39.pyc | sha256=iX__XmCPCXCHMpC2pJf_apS7fBaxYdZlw7QB97mr_i8 | 1704 |
lm_eval/tasks/sciq/README.md | sha256=XCXBf3KfpPWJqBiqKogR_qyWqFK-XQKOhmGozlRw40Y | 1480 |
lm_eval/tasks/sciq/sciq.yaml | sha256=IsuhHhEHXRu3EZkHzQm6OPTtaZAhk1athwTGi8hczVE | 568 |
lm_eval/tasks/scrolls/README.md | sha256=KqLRLEY82dKs_tR9w6lx5Hhxd71JoArktV_u_qQ02JQ | 1443 |
lm_eval/tasks/scrolls/scrolls.yaml | sha256=M5NNVGp-MESF6puJS7x9UGuOY-jhsJyggzatzbZWREU | 173 |
lm_eval/tasks/scrolls/task.py | sha256=f0I0ooE0hTShVHXA_zN17LdA1xWFgrVA3PboP4wzMuk | 13803 |
lm_eval/tasks/scrolls/__pycache__/task.cpython-39.pyc | sha256=EfNUDZ-MCK3K7WjABsns0cCJuW0WdEtU1WI3BngHBIE | 16077 |
lm_eval/tasks/siqa/README.md | sha256=4TalxcZMCLW7D4NmfEcxWR2bjUtKhGemGEnju8QyX2k | 2607 |
lm_eval/tasks/siqa/default.yml | sha256=lWwo6-2GKCPKFbXzclWV9yuTegf6fa0-cwWS2QSwQY4 | 404 |
lm_eval/tasks/squadv2/README.md | sha256=1kSUwS--VUhL7Ql_Wg_AeIcR89gyMIKanxxVrcH6mjo | 1901 |
lm_eval/tasks/squadv2/task.py | sha256=I5F7p7udN7N48xSIU39xMGGPiAptOP3SuGOldxkTT9A | 8455 |
lm_eval/tasks/squadv2/__pycache__/task.cpython-39.pyc | sha256=pA1KzxphT-6sH6_KfFSvET0jo_f1iYy-9VmtPMEkki4 | 6415 |
lm_eval/tasks/storycloze/README.md | sha256=4FMoplUQinv6L9UUJKjrTNHazX5_WNdGqMTzWsWgduE | 2406 |
lm_eval/tasks/storycloze/storycloze_2016.yaml | sha256=wd91w2f_9JCBUSDuAnuz9otYWTyB1GioLlZMBo9XgrA | 610 |
lm_eval/tasks/storycloze/storycloze_2018.yaml | sha256=X9Q-PjykgFnj-NC-4gD6nXCl590_FIxAIE4EFUZHn3c | 583 |
lm_eval/tasks/super_glue/README.md | sha256=VeTdrrg5qatbvDbcKHzqoRuQBBDznttSGUGQUpqD_q0 | 2977 |
lm_eval/tasks/super_glue/boolq/default.yaml | sha256=-a-bq-5m_PvbSu2-Rpib-WhoOQboe7iOIs0r8bZG6G4 | 402 |
lm_eval/tasks/super_glue/boolq/seq2seq.yaml | sha256=7PNkWhuqLXKwfFTIgtWEu7w3Hf3mI0NSz1Cdyp5lx3g | 575 |
lm_eval/tasks/super_glue/boolq/t5-prompt.yaml | sha256=7zVKwh6B-GFmhzCF9RHxX-Y2UKxs0P8-YoT9i7_dh0c | 513 |
lm_eval/tasks/super_glue/cb/aggregate.py | sha256=8FkDNZF9Ldrqj1sFa7cqAvz-nR7reaJUCbEWtv6VaC8 | 422 |
lm_eval/tasks/super_glue/cb/default.yaml | sha256=1j7LbmUeeQsdKriu0RHqYcI2T8jcQlBqD8pCFaW4Jho | 439 |
lm_eval/tasks/super_glue/cb/t5-prompt.yaml | sha256=yDsagQCkzPEyj-IuGrHojvIo6RVHOc8M_zKLZBneXDw | 665 |
lm_eval/tasks/super_glue/cb/t5_utils.py | sha256=3VZHdSwiNiMXo-qHt_KDWL6TiRYmixfvlBiPaq-pzfY | 882 |
lm_eval/tasks/super_glue/cb/__pycache__/aggregate.cpython-39.pyc | sha256=Ck474nQfbZ0opCeDlALZDlsPQyJ2osC0Xn-0ROK6eQE | 564 |
lm_eval/tasks/super_glue/cb/__pycache__/t5_utils.cpython-39.pyc | sha256=XPk9BI-qC0LTOXUOJL_Dvi16kXWuIfzyS5F4wVwbEQc | 941 |
lm_eval/tasks/super_glue/copa/default.yaml | sha256=xPvt5xv6yn4mWwFtHQK8sN5WaMiHQ093RvvNaZVZK_0 | 355 |
lm_eval/tasks/super_glue/copa/t5-prompt.yaml | sha256=X4rzoenJrg7P3_6p5n8fHsQT-c843LzxXtolr0rTp3M | 557 |
lm_eval/tasks/super_glue/copa/utils.py | sha256=C-mKkH22R6UYxCyRamE4W2TzlM-dAXG1y4a3oDYoLec | 566 |
lm_eval/tasks/super_glue/copa/__pycache__/utils.cpython-39.pyc | sha256=TwSJC_x27KCOVuNTMbwGEYcyiSRJJjSxeQFdGNaC2Yk | 902 |
lm_eval/tasks/super_glue/multirc/default.yaml | sha256=lkYTmOIl7kd7jrQEDQw3wR-ShtWhI-PGBCsd7RBvf3E | 424 |
lm_eval/tasks/super_glue/multirc/t5-prompt.yaml | sha256=tj_IL3M1zsXEDSelZj8ulguqiIXSq5jYSB3CjkePuU4 | 692 |
lm_eval/tasks/super_glue/multirc/t5_utils.py | sha256=QX1kCG5GG4zBs4TGU8PuNyzzHHyFU-Ri-OI6F2z5gJs | 1541 |
lm_eval/tasks/super_glue/multirc/__pycache__/t5_utils.cpython-39.pyc | sha256=gvkVU-obwQdwfs3pwNaTRoDOabQIf1NQ4ZKC8sWD9uI | 1513 |
lm_eval/tasks/super_glue/record/default.yaml | sha256=FYXwjVgtZuUfC9iGyicbBQShOGXRKp0Gam6h7MZKGKY | 460 |
lm_eval/tasks/super_glue/record/t5-prompt.yaml | sha256=MHfT8563qPb0bBb7fbpH84atClu1zimQzkymek9w72g | 626 |
lm_eval/tasks/super_glue/record/t5_utils.py | sha256=AseVUaB8z7cN_MiQKFZ48FlwvV_EQr5VuPaaY-SyO_w | 4066 |
lm_eval/tasks/super_glue/record/util.py | sha256=HzltnH_KvCCBuIo35nQEEqJgfVpAOi-BFTMmvmMvvMQ | 1274 |
lm_eval/tasks/super_glue/record/__pycache__/t5_utils.cpython-39.pyc | sha256=N61J2MXO4ClWPcjUSSRQZ6ybmU_ymi9ukF206oxi_F0 | 4843 |
lm_eval/tasks/super_glue/record/__pycache__/util.cpython-39.pyc | sha256=_zYuAgESKqnS-r05WxxPyOL6P-wdwIxj6m2z0izHXag | 1432 |
lm_eval/tasks/super_glue/rte/default.yaml | sha256=Qygjf2_YxOtaBM8dtJpCKlB8LKm2SL79BLv84bh5yaI | 359 |
lm_eval/tasks/super_glue/rte/t5-prompt.yaml | sha256=NFgmo2_76h-ycqZo-188C4OPuP7j-ukjaBaJlgANwQg | 526 |
lm_eval/tasks/super_glue/wic/default.yaml | sha256=ppLZ7xhvNlvaVUfKCFjimDLYOzWhpJ8YsthMhhV1TtA | 452 |
lm_eval/tasks/super_glue/wic/t5-prompt.yaml | sha256=sjxSwOsd9xb09-kiRoq6fxymKGv0-Xp9eVZu-od-ZrI | 528 |
lm_eval/tasks/super_glue/wsc/default.yaml | sha256=RasSQF0dl5-5nL5yqGLhSJNCl71Y2a7FN9321nOV6AM | 336 |
lm_eval/tasks/super_glue/wsc/preprocess_wsc.py | sha256=rzadUAJO9p1gdjD3nHBmmxXQUB84AL6e5GyYu2BdQ_o | 620 |
lm_eval/tasks/super_glue/wsc/t5-prompt.yaml | sha256=E_uos8Jq3PEwBZFhLJJBZI7lX9DXU6WtinM1Xp7Y9Pg | 516 |
lm_eval/tasks/super_glue/wsc/t5_utils.py | sha256=Xk8g0BkNGI5rm2XxD0P2T5XXhJ3qcXRfc9AzFXJUkq0 | 3439 |
lm_eval/tasks/super_glue/wsc/__pycache__/preprocess_wsc.cpython-39.pyc | sha256=QDj_2DlH2fLLVZRLrFiZO7BF6CNoXWKcY7gOsr0cpj4 | 745 |
lm_eval/tasks/super_glue/wsc/__pycache__/t5_utils.cpython-39.pyc | sha256=y82UPATkJnWAmtlBp6jJuQisaGQWvx-kuEN74YqVVR4 | 2897 |
lm_eval/tasks/swag/README.md | sha256=pOggfzxJS46Lm1Ouo718vpVzN5frU5lg5R9OxjPmeEw | 1799 |
lm_eval/tasks/swag/swag.yaml | sha256=7fhdrXh-Y_FUFDogXcCYS8wsJs0mrRFejRa1vJ6fpIM | 428 |
lm_eval/tasks/toxigen/README.md | sha256=0zC_-x1qhk5mL_Jtm6CD7cZu_dnQMexWDHXTdfjKMss | 1458 |
lm_eval/tasks/toxigen/toxigen.yaml | sha256=ELLvi26rxDQy6xLZO7A6se3Me0XgUyEYif4Q-fcEojE | 490 |
lm_eval/tasks/toxigen/utils.py | sha256=7jVV5-UQChjGOjsZQAOvbiaF-HlJuYV2unRvbuPxbgA | 153 |
lm_eval/tasks/toxigen/__pycache__/utils.cpython-39.pyc | sha256=CkiNIOooW26tdDjkFJr5CbjNXk6wxekt0f2OQLflBQA | 390 |
lm_eval/tasks/translation/README.md | sha256=ruLNyYFEmM76GJEov0HOlRG5FUCqflCh7vYunu12D5A | 925 |
lm_eval/tasks/translation/iwslt2017_ar-en.yaml | sha256=EUZC-LRC00L6ytBzeWlB1dPemp2PpNxI_mnTBoQZ4dw | 286 |
lm_eval/tasks/translation/iwslt2017_en-ar.yaml | sha256=-nyyvuvCp-mfWoEgcsM7CG7Rk0wju9zu2x5I4C-8rJo | 286 |
lm_eval/tasks/translation/utils.py | sha256=H8YlnEUoBoK56c0co5rVYwzzUT0RqaLhmjQ5UuhZxds | 4184 |
lm_eval/tasks/translation/wmt14_en-fr.yaml | sha256=jQIlH1WktTOrRKmbNfDkbOxuRAwrjJ2zZfnfc84ylYQ | 294 |
lm_eval/tasks/translation/wmt14_fr-en.yaml | sha256=8NmJ6H7bQoBT2vqbZXmQEQUJf5-NEQkdIE6I7KhGEhs | 294 |
lm_eval/tasks/translation/wmt16_de-en.yaml | sha256=5kZvgi-Z4TxRhSehntg8p7Omtq8_SL5lPV6jb02qOKg | 294 |
lm_eval/tasks/translation/wmt16_en-de.yaml | sha256=WnHNT4lFysZkw-c9Ox0STgnBPurgjiMqH-LH1t4CEBE | 294 |
lm_eval/tasks/translation/wmt16_en-ro.yaml | sha256=0mcSrvjsNnO2pOXStd3OAr_vsSyGHAPCR80pB-i2ED8 | 296 |
lm_eval/tasks/translation/wmt16_ro-en.yaml | sha256=8-nK4wweCzQENB-0StNgH6WZbGJL-k_wczDIGte2RIQ | 296 |
lm_eval/tasks/translation/wmt_common_yaml | sha256=qXQaVfTgoyJ0YvwQsaqNkAoIQhhQh5jEtvb10WdfUOc | 300 |
lm_eval/tasks/triviaqa/README.md | sha256=UwDPFH5UD913cyyUTjFIM48iSgDjjNltRQLbjRo5n5A | 1852 |
lm_eval/tasks/triviaqa/default.yaml | sha256=bTo1lDpD8Sm8YP094e1LMPvMgS42A7leY8lJ38TYsQ0 | 696 |
lm_eval/tasks/truthfulqa/README.md | sha256=APxG9NLQHaq6QzbZxyKgkmOvZbjaTQLb-od3MiYTQ-Y | 1717 |
lm_eval/tasks/truthfulqa/truthfulqa_gen.yaml | sha256=13c7g_03vwl6eVYZHmSPaUeN6zw0NzJ1K4T2lg378Gw | 2250 |
lm_eval/tasks/truthfulqa/truthfulqa_mc1.yaml | sha256=F-NPoUv_MJkgWmCwcu2iCK3Vs9RB0pGCpVMZA-Y0zZo | 1172 |
lm_eval/tasks/truthfulqa/truthfulqa_mc2.yaml | sha256=6NF8gKElG8jRj8PSHrtirV5KhfRCoOHYWugj1eJzEHw | 332 |
lm_eval/tasks/truthfulqa/utils.py | sha256=KpxlpAjCohDM0M1K8uwIOVUs1Sfjx1lC7-_j46sU5N4 | 6016 |
lm_eval/tasks/truthfulqa/__pycache__/utils.cpython-39.pyc | sha256=VkMz7_oWNyL7oXfLzs01jeswOM5vavPdh4Jpjaxj3XM | 4757 |
lm_eval/tasks/unscramble/README.md | sha256=8fD3JDITiBTcee1qvuz-EzbXAjdGI4IR6hGY6dCdIaw | 2615 |
lm_eval/tasks/unscramble/anagrams1.yaml | sha256=ldQi3m3Nq3ZPHWPA1UFk_cJAs9pYJBky3m_ntTyC9OE | 423 |
lm_eval/tasks/unscramble/anagrams2.yaml | sha256=xR0BWZU_Rwvzu_J9yJLif4ZHBM1zIKxNMdALJVRBsrw | 423 |
lm_eval/tasks/unscramble/cycle_letters.yaml | sha256=Rl4h689_HADY5Y-TcjN3Rj-6XJpfhiYq3m-b3meZauw | 429 |
lm_eval/tasks/unscramble/random_insertion.yaml | sha256=1Yp10FguQysKQMlj-vG_Z3QAI_Y73FSU4sHYQu706jg | 435 |
lm_eval/tasks/unscramble/reversed_words.yaml | sha256=U_B3K8HvvlAV0kkGZ8YhLK37L6L3jAk67PAAQ2uGLYM | 423 |
lm_eval/tasks/webqs/README.md | sha256=XaGMylFq_iwthSyM7VvHE5rVMzgQ9GJ6cVaQLMmagaY | 1933 |
lm_eval/tasks/webqs/utils.py | sha256=s01Tkm1AQQ_BjJtUVayw1fJ5BsxaGjtCTrkJnF_fy_g | 773 |
lm_eval/tasks/webqs/webqs.yaml | sha256=j9cfUPUeAyRVLyVcLVZ_d7jE-kwhYo15RGTpUvh1CZU | 486 |
lm_eval/tasks/webqs/__pycache__/utils.cpython-39.pyc | sha256=L9ydx0DYHnJyLtqZWW1KtR-EYy9qqKkHATB5ubi3PXg | 1091 |
lm_eval/tasks/wikitext/README.md | sha256=TIKOT6ySFrA3YAFL66ftz8FRL-hgJ0EfirXpSqH1294 | 1477 |
lm_eval/tasks/wikitext/preprocess_wikitext.py | sha256=pEAgN0sXIVm_W-gKZNLEGUydXHcoT2lqxmY2EzjI2n0 | 1738 |
lm_eval/tasks/wikitext/wikitext.yaml | sha256=iMtq-n314CJrltaF5LXtqACjJR-QlK33_kZxTlUyrzA | 534 |
lm_eval/tasks/wikitext/__pycache__/preprocess_wikitext.cpython-39.pyc | sha256=UeAxJSzDd1D_6qs4Z7KRVXquXq0wh_9OaueHWFM1uKg | 1346 |
lm_eval/tasks/winogrande/README.md | sha256=vA2S-iOSnXTAXPQxEqRhwZMd3axmvKA3P-7tUcY2SFo | 1816 |
lm_eval/tasks/winogrande/default.yaml | sha256=pTVOoUj0DLtC4Zc9rGjIsLRoJtMKY26u3x8--dryPEU | 500 |
lm_eval/tasks/winogrande/preprocess_winogrande.py | sha256=5VMnYpJkqY8dOD_aJGRbZ3mvtT-gvOIVAEK5QWsa4AY | 377 |
lm_eval/tasks/winogrande/__pycache__/preprocess_winogrande.cpython-39.pyc | sha256=I71cxmbZ8cJWgbtoWz7qYAC_AK0uerNpNUwEmdwz4BY | 875 |
lm_eval/tasks/wmt2016/README.md | sha256=KlOtv8lY7r4KGFf_-quEOdwm90d0bp3Wfz9TimENrJs | 2092 |
lm_eval/tasks/wmt2016/metrics.py | sha256=V629nou9UMoPluWjgjf2D9IlbXi0YD2HWy7mspQZQmE | 280 |
lm_eval/tasks/wmt2016/ro_en-t5_prompt.yaml | sha256=hm8UvJ6bbLnxF3TRhZbAhgaiNPYgE-hEFqCcZVUVQ04 | 483 |
lm_eval/tasks/wmt2016/__pycache__/metrics.cpython-39.pyc | sha256=2JEQzMMGN5TkPV23CL5yzSq6QRrWaLttkNI55uWjDb0 | 514 |
lm_eval/tasks/wsc273/README.md | sha256=ACWo1bwzuYf66R7z0xxa4hMc2I6jdb71D5V-GeXNL-c | 2963 |
lm_eval/tasks/wsc273/default.yaml | sha256=SWKkN_SuATu7RAY4RnvXKkA9GHlWC-QQtSx8G_OCXWk | 520 |
lm_eval/tasks/wsc273/utils.py | sha256=LCldN-jXX1ilzpSIOdIMuZcdHA12J4eCkb69RYTGNQc | 1005 |
lm_eval/tasks/wsc273/__pycache__/utils.cpython-39.pyc | sha256=M3hWRopZ-dcpIN0UlhIcxaD5w8SXesbPJn33sSGkv64 | 946 |
lm_eval/tasks/xcopa/README.md | sha256=bszl23gtJTrwRRgk3JS7pbStFHqU5n7CW2s6YnNdwQI | 2211 |
lm_eval/tasks/xcopa/default_et.yaml | sha256=0Zpfxnvi86KuEC5eh4dYD_H4Rz0Goa4k-nNAiSKp1KM | 306 |
lm_eval/tasks/xcopa/default_ht.yaml | sha256=YiVPPHda2D5HOmRzwiZsBXsSBdo90wBaRH5X7YQGnTY | 101 |
lm_eval/tasks/xcopa/default_id.yaml | sha256=XxcNzEJFlUUGpyx_vvEiDKqPlzqr2rlkDpunwcp-Wzc | 101 |
lm_eval/tasks/xcopa/default_it.yaml | sha256=P85UpV5Ilfr8wFA1Dupc6dQn-KVn9LDhxT9YOQb4A7Q | 101 |
lm_eval/tasks/xcopa/default_qu.yaml | sha256=6CR5W6wWzpvLSr6X16gELeM_pDjahhLfnhUnyEKvnWk | 101 |
lm_eval/tasks/xcopa/default_sw.yaml | sha256=I0HIJi_MHQPkbBj2OGF9yn_9nupq-bxsWaU0mfLntf0 | 101 |
lm_eval/tasks/xcopa/default_ta.yaml | sha256=T-ZV3pCgYTToODyBNJA0L5CrD4OspR8-hkS35TEfIqE | 101 |
lm_eval/tasks/xcopa/default_th.yaml | sha256=_eMapb7miFw0cZuZaG1kSSR4Kjx2LFv2_8XTkkIb9BE | 101 |
lm_eval/tasks/xcopa/default_tr.yaml | sha256=6VzN3-CzEotaJrB_ZesEEHKM6XEQqY_kzHiXrDInNYs | 101 |
lm_eval/tasks/xcopa/default_vi.yaml | sha256=0TBQaLnbCUIB74GGs5gOgoprp4OSfK1vZ1fZgCIqrLw | 101 |
lm_eval/tasks/xcopa/default_zh.yaml | sha256=R4P1Ibs5oJps9Hs2AeBBrL27yJW8OCXkL3ORaBCnfto | 101 |
lm_eval/tasks/xcopa/utils.py | sha256=GR0xu7_Ga-e2bLxBAFPhNjEgGjcA33SfI8ZT-3g03UM | 1791 |
lm_eval/tasks/xcopa/__pycache__/utils.cpython-39.pyc | sha256=082t4Y9UIczJWKBhWtL2njEsQGdAEWEsZFRjhe6ThbI | 1496 |
lm_eval/tasks/xnli/README.md | sha256=M6yJ8Ui08vdiDQRLW9EejDPrSLuop09XVmZu0RfJEgU | 2224 |
lm_eval/tasks/xnli/utils.py | sha256=gUJOG8_pEOLXZgtQ-N7FMM0uR0XtV5685zkaX9-FWkU | 5307 |
lm_eval/tasks/xnli/xnli_ar.yaml | sha256=-vGMt34SYGsrxhJH2mzVJJ44UwCs44_EdPkT9F-b6zU | 248 |
lm_eval/tasks/xnli/xnli_bg.yaml | sha256=3ZCMy6xC4r1HN_324m3Tqc4LjL2ZJTVlQAzG6Anmq34 | 270 |
lm_eval/tasks/xnli/xnli_common_yaml | sha256=f9yUbHHKUWSpCpXV6yHZT_HVhhFa4f50SJVw3dT1fLg | 484 |
lm_eval/tasks/xnli/xnli_de.yaml | sha256=Jk1ZgtT9ji3lq3TVfu0jCQxUj8WJ1dZeaSyEkLzPiN4 | 237 |
lm_eval/tasks/xnli/xnli_el.yaml | sha256=Ljnc0ksd4-SYjDNhCBtZMP5SDk8gjD9k9RgxzFk4kuo | 262 |
lm_eval/tasks/xnli/xnli_en.yaml | sha256=YeCSTN2rwAT0NLWzh1DW19PoAMee46W-hf0ScBeyhfE | 230 |
lm_eval/tasks/xnli/xnli_es.yaml | sha256=GkwQMf22cNfBhIVubRAzkRPL8TGPCi0gilZFWdaoF1w | 242 |
lm_eval/tasks/xnli/xnli_fr.yaml | sha256=RdfT4cthik8ZS7sSmkvsoxuK2nTdDouNOpzrZ-Lebdg | 238 |
lm_eval/tasks/xnli/xnli_hi.yaml | sha256=pPuF91nLvDCOVXQ1bANGV-UQFedcez_2XW-OapqEX6Y | 269 |
lm_eval/tasks/xnli/xnli_ru.yaml | sha256=1tAyhdGQKXpFQrIM_2-SAdPv7v34Ot1Y_NlX1WNk2PI | 276 |
lm_eval/tasks/xnli/xnli_sw.yaml | sha256=Z6CF-2C6DyPh0nzk7GnqjtWnOHAw5zblmfDVjAQmJAU | 240 |
lm_eval/tasks/xnli/xnli_th.yaml | sha256=N1QOrp7HkzYrx0TAiSMhEAJmWwETEAGsMBM3gTeoWnc | 308 |
lm_eval/tasks/xnli/xnli_tr.yaml | sha256=bUvapKIUdJCJKc7CCIl918aJiWwhEiEsoMXJtbrTgn4 | 242 |
lm_eval/tasks/xnli/xnli_ur.yaml | sha256=47LmNHEByKsde-KLFlxDfWgHiF6MX06isosv6YF7Rj4 | 260 |
lm_eval/tasks/xnli/xnli_vi.yaml | sha256=Aw64QMiB-AAhq5xMgbZQs6dEzFC4njOpbH7bMokjq2w | 244 |
lm_eval/tasks/xnli/xnli_zh.yaml | sha256=f7rvxUp0E8CgBu4d-YyCQOYx-d6eYRmiVfj0vNMdpsg | 245 |
lm_eval/tasks/xstorycloze/README.md | sha256=zFx4IhOCGFNVCkUqmcnBH10c7_xyEHX4p_V4OPEFRJg | 2674 |
lm_eval/tasks/xstorycloze/default_ar.yaml | sha256=_eTfzNqBctb9WN7zV8IiQ5cW1ovd48jBne3D16BK05o | 618 |
lm_eval/tasks/xstorycloze/default_en.yaml | sha256=jkXDziy5ZFSxiBBfvpF5X0PD7r2-EoJuPvpM_YO57mo | 63 |
lm_eval/tasks/xstorycloze/default_es.yaml | sha256=krymcDmxJbEqyaLMjJ2qCTp72_vpe30EyrqAytvGmFA | 63 |
lm_eval/tasks/xstorycloze/default_eu.yaml | sha256=Jp7s9WOyPBO-r8ZMHXgrHWYXsOSxwTFoLM09w7xktT4 | 63 |
lm_eval/tasks/xstorycloze/default_hi.yaml | sha256=0baA81PaJh6O_rHk5Zt75RlB0Rm8IeIEmcwWl65AeCc | 63 |
lm_eval/tasks/xstorycloze/default_id.yaml | sha256=3eufzTCUzloyMmZmNmtT9jkilhLaaUlhZyWYtSoO6K4 | 63 |
lm_eval/tasks/xstorycloze/default_my.yaml | sha256=Lru52K3docj3SyM8yb_vKEdejBL5587nj2WIyPEoKXk | 63 |
lm_eval/tasks/xstorycloze/default_ru.yaml | sha256=NQLa7Ztu0eLDeJSeSiiR-6KYJE4im3-0IFP7JG-E-AU | 63 |
lm_eval/tasks/xstorycloze/default_sw.yaml | sha256=BkOasjoNtcIMwhhgB51ZhY9R8E0O2K8RMiiQewpRoBQ | 63 |
lm_eval/tasks/xstorycloze/default_te.yaml | sha256=uS7g8yrYniDdX3QuXwCSZsXMBQNAoDFDuGLXKNJ9P-Y | 63 |
lm_eval/tasks/xstorycloze/default_zh.yaml | sha256=TTaSyzTXWpqEgcCaadNWnxrHKXB7cdMuSEpZ9OeqHZE | 63 |
lm_eval/tasks/xwinograd/README.md | sha256=qPmixk1nZorlQSshnqtAoP1i5Zy4vrgJry65OLGklXk | 2601 |
lm_eval/tasks/xwinograd/utils.py | sha256=stWOtJ047Bj_L0ia1eqvhlitXoXVt4ABqmefb_sbidk | 2796 |
lm_eval/tasks/xwinograd/xwinograd_common_yaml | sha256=462Cukn5zE9tWhHnctoX1mA-Nut-ivVjIAI_oE_clbU | 624 |
lm_eval/tasks/xwinograd/xwinograd_en.yaml | sha256=xbEp4QSQgNlKymjEFxXVonpbG7IKDjtFuTa1DzNTpUc | 91 |
lm_eval/tasks/xwinograd/xwinograd_fr.yaml | sha256=UZ7Txl6Q3d9bWvZXvjGxVQxGMnZ2_5bLL7Ykrhu_-nA | 91 |
lm_eval/tasks/xwinograd/xwinograd_jp.yaml | sha256=aRVwy9c6YOGpRFgm4oAUnljHW2y5UTF6IvwzEeOjVnc | 91 |
lm_eval/tasks/xwinograd/xwinograd_pt.yaml | sha256=A8oaox90xLwx0N1G8MfRpZGB8Tof6mux8EtgJpSrOaE | 91 |
lm_eval/tasks/xwinograd/xwinograd_ru.yaml | sha256=ra7PfDvFLZS1sBiMI7hRBjSWCmElclMWFwChrIg9-HY | 91 |
lm_eval/tasks/xwinograd/xwinograd_zh.yaml | sha256=OAf84RMb0BbFc3DGtBij-84FGwKDwHH9d_eGRXN_K0Y | 91 |
lm_eval/tasks/xwinograd/__pycache__/utils.cpython-39.pyc | sha256=oZrwLOWXanHo7D7rpIAKNuCsW2WuWTOHLXtYF4H6PaI | 2942 |
sevals-0.0.3.dist-info/LICENSE.md | sha256=qAbkJUdiDf-8LsAzMyLIs1I7SvEeBZvhTvgapbGuAh8 | 1067 |
sevals-0.0.3.dist-info/METADATA | sha256=wy3PtQQGMWnAvjl5T41gfsqaSt4cb8XthxrGG-woiCc | 5985 |
sevals-0.0.3.dist-info/WHEEL | sha256=oiQVh_5PnQM0E3gPdiz09WCNmwiHDMaGer_elqB3coM | 92 |
sevals-0.0.3.dist-info/entry_points.txt | sha256=Ikxf2dqf0BOLQ2hNGr9atKOHCph3yvpSKqXsQzJ_cm4 | 57 |
sevals-0.0.3.dist-info/top_level.txt | sha256=risQwf3pU3EoXaYL_bKYFzW6EtBOvJxJotKdDz605Dk | 8 |
sevals-0.0.3.dist-info/RECORD | — | — |
top_level.txt
lm_eval
entry_points.txt
sevals = lm_eval.__main__:cli_evaluate