Path |
Digest |
Size |
lm_eval/__init__.py |
sha256=9-jqCb66p_m29iqX1zVNpo_MzAIGznMZKNKOZKfEsxI
|
49 |
lm_eval/__main__.py |
sha256=DWnN4uwi3psHz0clLrWCd0yrvhBC0w3FpNAiDWKw6hg
|
14462 |
lm_eval/evaluator.py |
sha256=MxO5Q8iugw2BMumroE4RT3bcxJSiqmunxxu1j2FF87g
|
22572 |
lm_eval/evaluator_utils.py |
sha256=tmlK2KSBlZ2C-TXrDH0MVExUO9aNbI3tU4Mom_5K8xs
|
12641 |
lm_eval/logging_utils.py |
sha256=cFnlLO_b9meHoBdYB-WEvRwQ6ejbeAf6FalOLZbrU_g
|
16736 |
lm_eval/utils.py |
sha256=mcUNJ67QyDtDgK5zZYM9-Stl8oINzu7J9wCXWJBz_rM
|
11240 |
lm_eval/api/__init__.py |
sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU
|
0 |
lm_eval/api/filter.py |
sha256=4XR0Sj7K_3ivNKYNYHS8iUWAHaUMYCjVj0ZMsoZsff4
|
2149 |
lm_eval/api/instance.py |
sha256=neYbqoO3cakbUJYT1Dp9IYm0WU10XWTlAEC6Da_4ZZA
|
1060 |
lm_eval/api/metrics.py |
sha256=7nN3SkTQDBmVQFRyTkHHpax3d8X0flEcekRYxrPDhOo
|
14604 |
lm_eval/api/model.py |
sha256=ruZNiGIAgjAz55EZVcsB6HdKEFJ9AsBf96Hx8pWyGTI
|
12147 |
lm_eval/api/registry.py |
sha256=Q5SbdStZoyQZIvUy3Z0q78_TyrJDzvgoxAcHH71U6ys
|
4712 |
lm_eval/api/samplers.py |
sha256=rahA0TC-g64s9GbxcskqxaNm8iD_bkC7ctT8apAWW4c
|
3960 |
lm_eval/api/task.py |
sha256=pN6arA2Lfa4DIvKmh44IedNBso_OvH8gIi2G4HKG7TU
|
57824 |
lm_eval/caching/cache.py |
sha256=lvukmRzezPjojXLw8L01H0asOGu-mwwk1EHKgX5ZrxI
|
1345 |
lm_eval/decontamination/__init__.py |
sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU
|
0 |
lm_eval/decontamination/archiver.py |
sha256=3XtedMPsXAN0_zA5yyYDAH36vttZphkAJ0YwGK8xy3Q
|
5732 |
lm_eval/decontamination/decontaminate.py |
sha256=Jgu8HpvJnQL0nySL1hGN9qwnRshDvuW-_I13QZfKaA0
|
6817 |
lm_eval/decontamination/janitor.py |
sha256=tIZLlI920eKtaNlSiualDTJPO7P42PbxInfBezK5iYI
|
13150 |
lm_eval/filters/__init__.py |
sha256=FGJ47_lIqR6-xT4zn5-iv-xVWsS4iH9hT3FlyBOFZuk
|
1614 |
lm_eval/filters/decontamination.py |
sha256=faJSuxPQVNdLIJOSUvN5z-yNyrdc3oADYS6m2xqTIEg
|
630 |
lm_eval/filters/extraction.py |
sha256=RDKYZ_rUZBhnBL6e1waALNEdH4U7NYof_wg5bFuH8O4
|
6403 |
lm_eval/filters/selection.py |
sha256=W1TdZJnXHhJncX89h4wV61nZ1RZgL0GwNnoWhqu0dQ4
|
1675 |
lm_eval/filters/transformation.py |
sha256=gnQhiQOxbu1w3JEZVrGqVKGPmVQ6zWQOb_4pysTy17c
|
1597 |
lm_eval/models/__init__.py |
sha256=nmTEQ3qRX_vF86wjcTSybI_9FmiPbEh-A6hB2h6DuKo
|
454 |
lm_eval/models/anthropic_llms.py |
sha256=x_sc4NjbRbxKGRutJkLzCF4DTI-C2NVj_rnAWQ_G47Q
|
7174 |
lm_eval/models/dummy.py |
sha256=4GVF2M-BKATRUJjYz-eO6saZdJX0NTjYFrrMlGPUGl0
|
991 |
lm_eval/models/gguf.py |
sha256=YpsiL-W-kpecylH8FkXbaOOylgA8sYO3P4L0sHZOGDU
|
4782 |
lm_eval/models/huggingface.py |
sha256=XMRyN4ugBlN99Y6K5FUa4BQCw_P-N91hwH_nYWhsp80
|
52240 |
lm_eval/models/mamba_lm.py |
sha256=Ogm3qozLM6ZD_yO1o7ffY49246E_Kf5l0ZWfkYX1cQU
|
4485 |
lm_eval/models/neuron_optimum.py |
sha256=QtiilY1GR5T6xe1YgqmWCRxBksH46pgj3ZFV_3ApWOw
|
29837 |
lm_eval/models/openai_completions.py |
sha256=vtl4Gen7Di5g4XQ_dgjFjIo8hF_fi53dVWlKPxyrjHQ
|
17379 |
lm_eval/models/optimum_lm.py |
sha256=Oc0EvgpmBGWVyBgz4pmumKWGSVQTCdqJGz1vG3I3Chk
|
2053 |
lm_eval/models/textsynth.py |
sha256=ZmCxqIV62ts57y-VvcRaRnkEhGBIacQJ8LQIFskdEjs
|
5877 |
lm_eval/models/utils.py |
sha256=7_ekLfCw5WBTvA-kkUQoD-kqY0yeopUS3UQ3r6q1Cfc
|
21677 |
lm_eval/models/vllm_causallms.py |
sha256=wDERQ8B2IrNLZsxxkRLziF7Q8mUIQAruNX_Vu3-E1sU
|
18411 |
lm_eval/prompts/__init__.py |
sha256=r71EOQNKpkVkGCgNccsrCjGh7tRMRaDolZPB5s6el0M
|
4446 |
lm_eval/tasks/__init__.py |
sha256=YUCeUt6x-pmHcN6kFxSBoXGTWeCrRpBr8KXNLf7Fhuk
|
17227 |
lm_eval/tasks/aexams/README.md |
sha256=NUAKuII6CMzTeYh-r1x7Z2fU6cdRwSZcEU2-OZT741g
|
1862 |
lm_eval/tasks/aexams/_default_template_yaml |
sha256=piAo84-HBnRc04Yo9mxRwboFIb8ZrqoIN4FCaMAx3-M
|
501 |
lm_eval/tasks/aexams/aexams_Biology.yaml |
sha256=wDN2gfFm0U30tRM0TCS3gvIJu9zSIxjpZePKPFWkhGY
|
190 |
lm_eval/tasks/aexams/aexams_IslamicStudies.yaml |
sha256=cmNYbL7ihokT1HRTHrwWnGxF3U7csYVUl5Ha5m9Zcwo
|
209 |
lm_eval/tasks/aexams/aexams_Physics.yaml |
sha256=qoBzKeeuIfF0bqG6p0N1EzXVRhVAjehnAlPw-iIUODg
|
180 |
lm_eval/tasks/aexams/aexams_Science.yaml |
sha256=LMWp9mQgMfwcQezmoCFX273lzj8LawQ-xaXRgjP_v_w
|
176 |
lm_eval/tasks/aexams/aexams_Social.yaml |
sha256=ApUU3LYxwhnwtrMO--6DLWMlbMgWGcIxdXNc0KwQ4qg
|
195 |
lm_eval/tasks/agieval/README.md |
sha256=4-5Y3TTifmMi5RYvaOI6-K8OIjEzEyEcKJrjhKEXvLA
|
5284 |
lm_eval/tasks/agieval/aqua-rat.yaml |
sha256=gT6vwucinFH8W5_aInXPB0NisHpAKU48LZmFCOiFnLk
|
527 |
lm_eval/tasks/agieval/gaokao-biology.yaml |
sha256=kZi4eR1SZDESnZmerDJPCezXjunP3YrDPSFsu9iOHuI
|
129 |
lm_eval/tasks/agieval/gaokao-chemistry.yaml |
sha256=OL_jXAkBQnCRnWG69TEjARFEVq1ore9WDn56TB0az4w
|
133 |
lm_eval/tasks/agieval/gaokao-chinese.yaml |
sha256=kd9tSkMUTZeXnzfyp71T8CWBuGMMIY4uYNSyeYO29n4
|
129 |
lm_eval/tasks/agieval/gaokao-english.yaml |
sha256=h8YomRmJ2ys7eLxmZ5Dj5TX_4KSsfXK2tMGmcmacZWw
|
215 |
lm_eval/tasks/agieval/gaokao-geography.yaml |
sha256=jPNST_8Dc9Tj1RiStvDgSGMHHaR6LYlLwde803w7i4A
|
133 |
lm_eval/tasks/agieval/gaokao-history.yaml |
sha256=YLQoEVj04dmLsjgxBHcZDGa1WZdTjyPmtDZffNWFlWA
|
129 |
lm_eval/tasks/agieval/gaokao-mathcloze.yaml |
sha256=gf1AKLXNohHwfCJuFVmltl4GIxIkHGRigcsRgKKj1GU
|
519 |
lm_eval/tasks/agieval/gaokao-mathqa.yaml |
sha256=UvLl4KwZ0rc-ZZ58L2FMzAiMTnI_HwCkDROd_Jfxs9U
|
127 |
lm_eval/tasks/agieval/gaokao-physics.yaml |
sha256=Zqevi3QqV92sH3eUGidPqm6LFc3ItN0uc20VnnuA-Y8
|
129 |
lm_eval/tasks/agieval/jec-qa-ca.yaml |
sha256=DaMlJ_ihgRsYERG00qmSHBJYEJR1EiZXfDHOGmDTbm0
|
119 |
lm_eval/tasks/agieval/jec-qa-kd.yaml |
sha256=eCeLdKz7RqE_QYNZgx9RHq2jKJhGhstX_V3yHTfcJrQ
|
119 |
lm_eval/tasks/agieval/logiqa-en.yaml |
sha256=ZFIZtHFY2wrUJwyYRxnDGKdBTGLFiHo8TXt7RHlha9g
|
136 |
lm_eval/tasks/agieval/logiqa-zh.yaml |
sha256=0UKloM8kf747py0VHAXoyZTrX5vPgYAnGUjGl3RAdpU
|
119 |
lm_eval/tasks/agieval/lsat-ar.yaml |
sha256=Rg87LmnOxcGzlyR1vOz5SL3DsaPN8a68Vhl_ENYDDB8
|
132 |
lm_eval/tasks/agieval/lsat-lr.yaml |
sha256=bKV9lLrlyJpWjaH5ETQBBMaqDRNuaKQMfolmGlXz6VI
|
132 |
lm_eval/tasks/agieval/lsat-rc.yaml |
sha256=_qmu-0xRCyhPJ0VzBVQnk5oSh4NbyrDHGb8r8z_i-aw
|
132 |
lm_eval/tasks/agieval/math.yaml |
sha256=6zY1wOeb0bXPV2_tSF2FkRL8OX0U8RBE3tFJCVlAUeM
|
495 |
lm_eval/tasks/agieval/sat-en-without-passage.yaml |
sha256=H_ZK7EpwEd1YCPKnItxQf0xn3mCdLq_6ksBoi9WK7-w
|
162 |
lm_eval/tasks/agieval/sat-en.yaml |
sha256=gzueP_6a0mbnBNkHUrKVQkmSaawfN6p5Ib0zBT1fVb4
|
130 |
lm_eval/tasks/agieval/sat-math.yaml |
sha256=8qAMy8siQCqUN7ujzJzNy8VsPH-sj7j9vjIDgXX5774
|
134 |
lm_eval/tasks/agieval/utils.py |
sha256=LrPDL8tQP7swC0UC9LV0h5HBVyYJj9s79hP8VG4awjA
|
7846 |
lm_eval/tasks/ammlu/README.md |
sha256=jF9nKeqdwFemoFgm8vs4pIU33RSF8LyHvQc1RHQL2hg
|
1714 |
lm_eval/tasks/ammlu/_default_template_yaml |
sha256=HP47DHA5wiL_JXKpNTtOhMF-G1QKPN41QNe5R8Z24Nc
|
499 |
lm_eval/tasks/ammlu/_generate_configs.py |
sha256=mkzHYt833vv18mXgB5tcu2ve9-DdFBrPM2BH4-bwTT4
|
5830 |
lm_eval/tasks/ammlu/ammlu_abstract_algebra.yaml |
sha256=MNqAqvXe5_W3dadZZhoO13_KCpFgCsNRBReG14iViwg
|
240 |
lm_eval/tasks/ammlu/ammlu_anatomy.yaml |
sha256=Heipw5jB5jv4JAYRkX7EiuKjJC_DI-VNvnjTZUG2H7s
|
222 |
lm_eval/tasks/ammlu/ammlu_astronomy.yaml |
sha256=4O0VKvjGjTFWKg43SbDwzisactydZTHnkEiOwz2JlEs
|
226 |
lm_eval/tasks/ammlu/ammlu_business_ethics.yaml |
sha256=Je8xieE9aifBXBuXRSgdrL1_ThOA0MIrwBSexovc5fE
|
189 |
lm_eval/tasks/ammlu/ammlu_clinical_knowledge.yaml |
sha256=O7vnPcUhaW9MGVj-AH8KEtKtbHXlbRdzfNYe0jdXkio
|
195 |
lm_eval/tasks/ammlu/ammlu_college_biology.yaml |
sha256=n1_MYR2pWk_BMf9LJ2AtwygmJY0u8aNl0RKRP77fxqw
|
238 |
lm_eval/tasks/ammlu/ammlu_college_chemistry.yaml |
sha256=fDs6FTBVGldXbE6boTqXYH7BIY2Lnm-b--Xp_LWzP1A
|
242 |
lm_eval/tasks/ammlu/ammlu_college_computer_science.yaml |
sha256=9bbbrx3R-ZIGkMy_uV2K81aEiysKX_9kIxl1dkY9KcY
|
256 |
lm_eval/tasks/ammlu/ammlu_college_mathematics.yaml |
sha256=iUnzqULYl76pVNbA_FgnITbbySjXCThQDJch544uuKQ
|
246 |
lm_eval/tasks/ammlu/ammlu_college_medicine.yaml |
sha256=uWgnp6_-ttBly-X1_X0ewLINrL_Sp8LCd744z2gqCTw
|
191 |
lm_eval/tasks/ammlu/ammlu_college_physics.yaml |
sha256=CwWPgUITtvSI-pcsSM0uML9FUdG6qCQ7l8Ks2aES10A
|
238 |
lm_eval/tasks/ammlu/ammlu_computer_security.yaml |
sha256=8sVZy8IVJYYcZzwxDmtrbyWN6g_lq5vAVqssPLQFZ9s
|
242 |
lm_eval/tasks/ammlu/ammlu_conceptual_physics.yaml |
sha256=qbkCgYuL0B4JODUFdoYVUSxk9DXVDZBtMhqJ8Wyf2iU
|
244 |
lm_eval/tasks/ammlu/ammlu_econometrics.yaml |
sha256=p7BBgdg4rgmhhQqiPbW54Jpo4KaYrN9FcbQSmsWGG2o
|
199 |
lm_eval/tasks/ammlu/ammlu_electrical_engineering.yaml |
sha256=ODM0Ll9-DIwp_LUXSfeAnzEEH2z6WP1RmXyh0a23TOQ
|
252 |
lm_eval/tasks/ammlu/ammlu_elementary_mathematics.yaml |
sha256=SJjh5zLh1ZkwzWxcvljorVanYQDs1Ie4pMn-oDmZDI4
|
252 |
lm_eval/tasks/ammlu/ammlu_formal_logic.yaml |
sha256=qefVmo7qQ8wLp0S2984PgNhhQphZg9sgm1eVu8AEi0o
|
197 |
lm_eval/tasks/ammlu/ammlu_global_facts.yaml |
sha256=oxVWRn-lIQTkSaOdkwU24e4xmbRWNpjwXxFohy_ZAHI
|
183 |
lm_eval/tasks/ammlu/ammlu_high_school_biology.yaml |
sha256=Fn2FYQSvrxAc1-gvsnwXK6Joh7AEb7d8HClE2M5WMik
|
246 |
lm_eval/tasks/ammlu/ammlu_high_school_chemistry.yaml |
sha256=jnyuN_GX5fFuQ4fj9eu2NpJ4qH0sraPEf2JgTamE-lU
|
250 |
lm_eval/tasks/ammlu/ammlu_high_school_computer_science.yaml |
sha256=v9h7DMrMp_LsbZg6XP--oVA7Un86s0OqlLpuv-QzgR8
|
264 |
lm_eval/tasks/ammlu/ammlu_high_school_european_history.yaml |
sha256=Ga0Cd66prXi3E3fWsVAbOgE1HR-ibTj6ltVLovUXVUo
|
229 |
lm_eval/tasks/ammlu/ammlu_high_school_geography.yaml |
sha256=wLjqHQbdCrYC5HjoRQBlSd_WlXpHwzTfkl9m2DNo4V0
|
217 |
lm_eval/tasks/ammlu/ammlu_high_school_government_and_politics.yaml |
sha256=TYzAb1v3ZeCXfj-463jHTIt9l5zMaNnw-D4BHXqSuRk
|
245 |
lm_eval/tasks/ammlu/ammlu_high_school_macroeconomics.yaml |
sha256=uQEaLNtF52OzOYyUyWhBq46MQ8u2MpchBkZdCcuSTCg
|
227 |
lm_eval/tasks/ammlu/ammlu_high_school_mathematics.yaml |
sha256=TI96mRH6aMmOhP7XtkVTzgzziryBtSCMtuFkZmkANuQ
|
254 |
lm_eval/tasks/ammlu/ammlu_high_school_microeconomics.yaml |
sha256=yaMMhsVqJ54q3aAqTFSSy5I-j664Nv1MZOXz5ficZI8
|
227 |
lm_eval/tasks/ammlu/ammlu_high_school_physics.yaml |
sha256=rtnldcucL9dmEFADchTQwj3mBSdt6W7oOHLoQHd0WA8
|
246 |
lm_eval/tasks/ammlu/ammlu_high_school_psychology.yaml |
sha256=tByEMOBaCEwWbnZyxYyeae32PGjs4pA9ip4di7QHnDg
|
219 |
lm_eval/tasks/ammlu/ammlu_high_school_statistics.yaml |
sha256=f_i7BPgVoDSYH20L7fY2nBzGgJC1_dh4Vgl9qBoRqMI
|
252 |
lm_eval/tasks/ammlu/ammlu_high_school_us_history.yaml |
sha256=aRg8XfErPy7oXSj9RYXLAXwHKjoQKDLLuNo5F-_q8d4
|
217 |
lm_eval/tasks/ammlu/ammlu_high_school_world_history.yaml |
sha256=6m6BV1QDqmDnnsFaBinDlTmkqzLInVkelWgKzOXkiws
|
223 |
lm_eval/tasks/ammlu/ammlu_human_aging.yaml |
sha256=r67HwFEUYV2BzO2vgFxj9B2ScXvTmBn_GafnIZQwUjU
|
181 |
lm_eval/tasks/ammlu/ammlu_human_sexuality.yaml |
sha256=SzgN8EeAc1hZob7sP1kfNKOsZtxd3RLH7MQWc0GNxYU
|
205 |
lm_eval/tasks/ammlu/ammlu_international_law.yaml |
sha256=XVfjVGhX9UpCt3fNyHinqB-hg1mJHiKDfaiKWp38ILU
|
207 |
lm_eval/tasks/ammlu/ammlu_jurisprudence.yaml |
sha256=aJkMmqF5YpWKvHu5CZsTv3WGMqSXqTiW0h9ekNwsSUs
|
199 |
lm_eval/tasks/ammlu/ammlu_logical_fallacies.yaml |
sha256=IwtMroEp79X33dhR453fXfYAl69Q_AW_pxJrlI5_cFM
|
207 |
lm_eval/tasks/ammlu/ammlu_machine_learning.yaml |
sha256=vmK2vmmQhEkH0TGBNgHbhAvRWD0yl2TEguB8tOCURdg
|
240 |
lm_eval/tasks/ammlu/ammlu_management.yaml |
sha256=yCzEDWeRkbNgDnOYoxL7G4Gig_3j3vZeTAHJAqOCTWI
|
179 |
lm_eval/tasks/ammlu/ammlu_marketing.yaml |
sha256=fJKc6G3pU2ZFRtREhKx0Ke6SAPCh-9tKF0A1GYCPVMw
|
177 |
lm_eval/tasks/ammlu/ammlu_medical_genetics.yaml |
sha256=w9SLealVhdQy32LC0jjbt2zDfukpN-ygblc3NfFgR6M
|
191 |
lm_eval/tasks/ammlu/ammlu_miscellaneous.yaml |
sha256=NWn-jKJHFtr5Wy9KMfSnoHo7Yw4rUTzSGRbY_GJurlw
|
185 |
lm_eval/tasks/ammlu/ammlu_moral_disputes.yaml |
sha256=_KNQ_-IIZ-5oecN85Y63w27qlvvrepiePj9UPN2fXoM
|
201 |
lm_eval/tasks/ammlu/ammlu_moral_scenarios.yaml |
sha256=-iFxp4Pbfr9jXKpkQrE58NtPEeCrp0ZRXbjGAr8hKds
|
203 |
lm_eval/tasks/ammlu/ammlu_nutrition.yaml |
sha256=0Mr36wNhYkGY2kZ24RyK0HBoYQBIOfmx8nabyT_2sDs
|
177 |
lm_eval/tasks/ammlu/ammlu_philosophy.yaml |
sha256=Od1FHjz_BRx_dV-zbN7wH9fobRwc-fksu5Y05sRwXk0
|
193 |
lm_eval/tasks/ammlu/ammlu_prehistory.yaml |
sha256=W2Hs_tyPr1c_zC6IidOR8dNy8dXbejYL__TcCRZ-gi0
|
193 |
lm_eval/tasks/ammlu/ammlu_professional_accounting.yaml |
sha256=Z-QWQt2-ZZAGqEyScgphS0hykOL3y0bhCIbdRM_ybcY
|
205 |
lm_eval/tasks/ammlu/ammlu_professional_law.yaml |
sha256=WzOZZxHG3O5aOTcm_7Sj6fmUum5ITHQQTtYbrPjuFTo
|
205 |
lm_eval/tasks/ammlu/ammlu_professional_medicine.yaml |
sha256=OuXG2FvFi86HdcJxzbV62rGwgmbYFP0YQI6fQVAKPJE
|
201 |
lm_eval/tasks/ammlu/ammlu_professional_psychology.yaml |
sha256=_anNAlm6KAJv3fKDlYddZRiDGxsCZ_jhPsta1VbI-Kg
|
221 |
lm_eval/tasks/ammlu/ammlu_public_relations.yaml |
sha256=qZ38TmVCoyfIPPHKPY78ScQCuda6Nm3KOEfy-_2Ks8Q
|
207 |
lm_eval/tasks/ammlu/ammlu_security_studies.yaml |
sha256=UIJk5r3N2JS0YLAEzVo8q5KPGZVTNRASmdWXcSfYOKI
|
207 |
lm_eval/tasks/ammlu/ammlu_sociology.yaml |
sha256=ZtL8NqC1V3eC71OogkeD4OWIColFKO62IAyfeY9ondo
|
193 |
lm_eval/tasks/ammlu/ammlu_us_foreign_policy.yaml |
sha256=zr-dTcne9HyF4RkmpMqP3F75tEdetTJ9WLkE0gdkC0o
|
209 |
lm_eval/tasks/ammlu/ammlu_virology.yaml |
sha256=ClaQ-BZp6VLMDG8wF1MQobdyUq7kbJoFhyd0bPNJDfo
|
175 |
lm_eval/tasks/ammlu/ammlu_world_religions.yaml |
sha256=10jQw1LZ9uwgTN8i9DqsXTQWczT44iy-reKqVoVPbmQ
|
203 |
lm_eval/tasks/anli/README.md |
sha256=QKLZp7Ox21Wn815nwzGczGu7Bce0fQVTRmlduKlckWU
|
2042 |
lm_eval/tasks/anli/anli_r1.yaml |
sha256=pKwidjBQrQnVwE556yItUUCLE3kfV2WPTCTbt-l0mro
|
595 |
lm_eval/tasks/anli/anli_r2.yaml |
sha256=nHP-W_OHCZpr9VjX3AiRsrLVV4Cb25vSfuHRN5CmTlc
|
106 |
lm_eval/tasks/anli/anli_r3.yaml |
sha256=AgUdUSygTWd9giQsVVLEauQKz5NZQxjtGNBTKW3RKXo
|
106 |
lm_eval/tasks/arc/README.md |
sha256=s8ExYRbWsstbrnJ1SGR2pFN5IEgs5yakpXvhc-oNujc
|
1907 |
lm_eval/tasks/arc/arc_challenge.yaml |
sha256=aCYhwmriSxBlotcyRgpVqO8rnyVEV0QxZmyTCanv170
|
71 |
lm_eval/tasks/arc/arc_easy.yaml |
sha256=Cb1InG2hMVw5PEvdu6pCMqKIR79JPs3hbJW9pMniXUI
|
581 |
lm_eval/tasks/arithmetic/README.md |
sha256=3jHg0xARN3uYrFIhUuRfD6qv-rYAVy0ffKqzAXqklfw
|
2336 |
lm_eval/tasks/arithmetic/arithmetic_1dc.yaml |
sha256=-ipgkiqZYJePHkYGwRQQq6qfVtjWnpO9Ds_16hawgU8
|
385 |
lm_eval/tasks/arithmetic/arithmetic_2da.yaml |
sha256=V12nJMp6vQVEPrVmMBRvzclMuBb_HxbrB_f-9_v5b6Q
|
121 |
lm_eval/tasks/arithmetic/arithmetic_2dm.yaml |
sha256=Hq_P-0ai3YMkoYTET0-IjMFJ1ZHuaXa56xRMz_OZsCU
|
121 |
lm_eval/tasks/arithmetic/arithmetic_2ds.yaml |
sha256=hBtWC9FdqNUYWdCckQLe0AGjKJToWwizHxv52P1Cxwg
|
121 |
lm_eval/tasks/arithmetic/arithmetic_3da.yaml |
sha256=SBEW7EW9U-b2_t_lYfI0HPxyt7arHqSsXRkzfj04jDY
|
121 |
lm_eval/tasks/arithmetic/arithmetic_3ds.yaml |
sha256=Mt3FExvHxBd6yvGT_shmVwGgTGMttDXxDP29BrhqQSs
|
121 |
lm_eval/tasks/arithmetic/arithmetic_4da.yaml |
sha256=Tm-_pJPxRioREeU7hLELfviPKf4RTATqTlPsn9Q1EVA
|
121 |
lm_eval/tasks/arithmetic/arithmetic_4ds.yaml |
sha256=LGYKXa2CIefd8RyMKbeXOD62yt22JHW7MVJKEFCSU8A
|
121 |
lm_eval/tasks/arithmetic/arithmetic_5da.yaml |
sha256=gLV1nowU_lAor9wD0O4oTrU65iH5rTRgi4px7qCHttM
|
121 |
lm_eval/tasks/arithmetic/arithmetic_5ds.yaml |
sha256=lD4TGRpxz0P34KGXnSeqqJG1eYh66X2aE9LnBu8yh6k
|
121 |
lm_eval/tasks/asdiv/README.md |
sha256=TQY5EyoG5evb9oZwMCZl_X_4qAX7B-nMKnOTcI_-0IQ
|
1906 |
lm_eval/tasks/asdiv/default.yaml |
sha256=8lIhCEYNbVCA993MVkXWqTAvw_2rNqQN-NMGs4N71TE
|
424 |
lm_eval/tasks/babi/README.md |
sha256=Y_b2kkNqyN1l3ONNomyPcZmNOI0wupDTQLAHyankfFY
|
2263 |
lm_eval/tasks/babi/babi.yaml |
sha256=Zu1YY1DxenTDzTa3neetZi-r65OaS6QHZto66dkfKIA
|
436 |
lm_eval/tasks/bbh/README.md |
sha256=onAqPm8i9ybbgt4mLn6CBWVRvLWg6z7DJWLeE8umSJQ
|
1384 |
lm_eval/tasks/bbh/_generate_configs.py |
sha256=t2anyW6Q5Ee6Z090Pz3gLXh9uNcjhOPG88nAnwqxCxA
|
2702 |
lm_eval/tasks/bbh/cot_fewshot/_cot_fewshot_template_yaml |
sha256=PgQyih2oU5qxF-z4c1R9jBC6lZ3PwnVst9HB9pwvO3U
|
648 |
lm_eval/tasks/bbh/cot_fewshot/boolean_expressions.yaml |
sha256=Ln39qZA4zj-g6UmgL-ZFY2J4XN11MNsyhtJa7iU4FxI
|
2048 |
lm_eval/tasks/bbh/cot_fewshot/causal_judgement.yaml |
sha256=2gdSJflU4vUPZI3YoqHgozmJyzDyyvqYsIT2uEJjH24
|
3889 |
lm_eval/tasks/bbh/cot_fewshot/date_understanding.yaml |
sha256=hVFFhyfJxdjd61UB8RynocI4SfsDpJBZHpj62IY48uk
|
1404 |
lm_eval/tasks/bbh/cot_fewshot/disambiguation_qa.yaml |
sha256=Ft-I7TtIUcOPNlrvFcxlLL1ZBniDxl08d3YIVgko4lY
|
3845 |
lm_eval/tasks/bbh/cot_fewshot/dyck_languages.yaml |
sha256=c6BDE4lItvNqyPW0DpunPXaoEZFyJlIE1zGI8vol9q8
|
2715 |
lm_eval/tasks/bbh/cot_fewshot/formal_fallacies.yaml |
sha256=zaYAnLyyPGxvcbAs99A2sXD1T7MDk2hW-i4tvJzso5Q
|
4736 |
lm_eval/tasks/bbh/cot_fewshot/geometric_shapes.yaml |
sha256=2ryl3aMrgj6sIHgd4PZkBxrDpOhcMCRKL9S-_PHXxPA
|
5137 |
lm_eval/tasks/bbh/cot_fewshot/hyperbaton.yaml |
sha256=N3ho8OmBBy-HtfucQ3LT9lsavGv6Mg6f__kmlc2P0F0
|
3367 |
lm_eval/tasks/bbh/cot_fewshot/logical_deduction_five_objects.yaml |
sha256=_CCfhaaiuu5Jf7F038ZZ1KVzXYQnvLdIsTWcW3Y5H-I
|
2788 |
lm_eval/tasks/bbh/cot_fewshot/logical_deduction_seven_objects.yaml |
sha256=_Y0nR9p2f3md9_cwbwVyOJO8tDlbbKJlu8HN3ut255A
|
2790 |
lm_eval/tasks/bbh/cot_fewshot/logical_deduction_three_objects.yaml |
sha256=yqAVNmKeohrBaq6ducPx1Bksce7ZfIb4muLxA_FN8oQ
|
2790 |
lm_eval/tasks/bbh/cot_fewshot/movie_recommendation.yaml |
sha256=sdB4tK6_YXFl1NWvmw6knweuvukgiu7CsJ82FkRKlH4
|
2371 |
lm_eval/tasks/bbh/cot_fewshot/multistep_arithmetic_two.yaml |
sha256=BgVm4JXLRjXxbSouTq_I33vTqvbleKmCAw53-g0omhk
|
2642 |
lm_eval/tasks/bbh/cot_fewshot/navigate.yaml |
sha256=mzZL9z-FN6VEughuw_80dVWA6GMs8vlS7WUydo3wjic
|
2374 |
lm_eval/tasks/bbh/cot_fewshot/object_counting.yaml |
sha256=mjN59FVUUTCyMKJiLrC1aPYlVLB7au5VChGvfHiD3TY
|
1653 |
lm_eval/tasks/bbh/cot_fewshot/penguins_in_a_table.yaml |
sha256=JpV2Eh0cHhiJSi3OGDK96WWrH_N2s4Uh5y2GRdegOpc
|
2633 |
lm_eval/tasks/bbh/cot_fewshot/reasoning_about_colored_objects.yaml |
sha256=7FYzRdNgxOmnGkp9CaCpbHFtuGTqDIo1AJOva72HVVk
|
2588 |
lm_eval/tasks/bbh/cot_fewshot/ruin_names.yaml |
sha256=hNX7bE70-oDQmM4wCZMzM4Ax_vHYWG73J6_ruR3qGOk
|
3833 |
lm_eval/tasks/bbh/cot_fewshot/salient_translation_error_detection.yaml |
sha256=DkpItL7dzDzV82QdZxBOpIcCSScfKbg3fzP6tgGcBtY
|
6481 |
lm_eval/tasks/bbh/cot_fewshot/snarks.yaml |
sha256=UQlNCf9vOo76GJznTpQzyJ6eGgrPeAGIXBneKj2Rd10
|
3326 |
lm_eval/tasks/bbh/cot_fewshot/sports_understanding.yaml |
sha256=G9hi5SMZhwfDOGJadkLXe-Okw1nVtufaM37q3-bHrS4
|
1045 |
lm_eval/tasks/bbh/cot_fewshot/temporal_sequences.yaml |
sha256=TAWpqiScp5gnQ_i11iZdlVGEx6-hQxN5CQEefNjIyFY
|
3304 |
lm_eval/tasks/bbh/cot_fewshot/tracking_shuffled_objects_five_objects.yaml |
sha256=NbWCgcMSeoNkmFBrhoHsQghh2dleyJDzrp5nOWbwg_o
|
2888 |
lm_eval/tasks/bbh/cot_fewshot/tracking_shuffled_objects_seven_objects.yaml |
sha256=xKX3zUNkNAksptSz1TeL2icc8lJfLnMIBJrAruUWEmo
|
2890 |
lm_eval/tasks/bbh/cot_fewshot/tracking_shuffled_objects_three_objects.yaml |
sha256=B9Jy8oT9TSOKwi9PrFkN-6WoqVUHYXDxyhpESAiSfXI
|
2890 |
lm_eval/tasks/bbh/cot_fewshot/web_of_lies.yaml |
sha256=Oyjiy0rAACoPq5LQR1zyoiSiAgornrpV4F4IdSSgbM4
|
3163 |
lm_eval/tasks/bbh/cot_fewshot/word_sorting.yaml |
sha256=4utfxuWJiPF9T_-1D3vUTc9p1n9TjBAZxCQsFFmagLc
|
2549 |
lm_eval/tasks/bbh/cot_zeroshot/_cot_zeroshot_template_yaml |
sha256=8cD89OSopFFp51VnXK3LhfFoudVSGfneao0X6YmNiXQ
|
502 |
lm_eval/tasks/bbh/cot_zeroshot/boolean_expressions.yaml |
sha256=BKQ6JO9I2gLwb1MfgCnwaIG-66v-mzZqd__1oy1rWc8
|
679 |
lm_eval/tasks/bbh/cot_zeroshot/causal_judgement.yaml |
sha256=FOCmMOguNhSlowJnmKY-pRsJ2lBymWo6s2qlpTjS0E8
|
667 |
lm_eval/tasks/bbh/cot_zeroshot/date_understanding.yaml |
sha256=2WR5jQ37ZwlDbc066gHLGrjmy_dE732uTBEZhyuCgsg
|
739 |
lm_eval/tasks/bbh/cot_zeroshot/disambiguation_qa.yaml |
sha256=qJW8yPCukm5IKN2FBgm7kYg-xhjiCwKW6hGlOwtnuS4
|
766 |
lm_eval/tasks/bbh/cot_zeroshot/dyck_languages.yaml |
sha256=mw1W-rh3wZ58rY19vAOfQVr_ISVpRvjmpGe5xI7nLqY
|
684 |
lm_eval/tasks/bbh/cot_zeroshot/formal_fallacies.yaml |
sha256=rOekVBA9qj24R704zneL85yXzf8jLNCXYxreoMet5lw
|
687 |
lm_eval/tasks/bbh/cot_zeroshot/geometric_shapes.yaml |
sha256=EjI9vVQJTCLofU9cAPADFEWtHW8i1uGluDdrr62N3aI
|
750 |
lm_eval/tasks/bbh/cot_zeroshot/hyperbaton.yaml |
sha256=Pt49AiGA-g65WhWp1LLuQUM6LJgSfFhjT1eO7RdM10o
|
743 |
lm_eval/tasks/bbh/cot_zeroshot/logical_deduction_five_objects.yaml |
sha256=twk8yG1vjkU48OHoDwjJwh4Ohye0-zpIJf7NOAtcNUI
|
818 |
lm_eval/tasks/bbh/cot_zeroshot/logical_deduction_seven_objects.yaml |
sha256=fLICnem3s646N1Lbl5IRPAbMewhcUFxZ3Rdu-pVvarM
|
820 |
lm_eval/tasks/bbh/cot_zeroshot/logical_deduction_three_objects.yaml |
sha256=j8nBZ62_r9qj2KGzp4ildJS0tXeFjpy1uJvXVflhl9c
|
820 |
lm_eval/tasks/bbh/cot_zeroshot/movie_recommendation.yaml |
sha256=5sK7ju6stnh6u7R6uvzI6-eQb4qgDDYZrBidbdGcXyQ
|
767 |
lm_eval/tasks/bbh/cot_zeroshot/multistep_arithmetic_two.yaml |
sha256=vXJJjs-xeWRuXtCrfQVmyKPhgiIRSI58Fcwft1bdaeU
|
697 |
lm_eval/tasks/bbh/cot_zeroshot/navigate.yaml |
sha256=58RaCT7VZ6fiKQ1D2eEEx3XfVeQG4m0G57F0xmmjx58
|
713 |
lm_eval/tasks/bbh/cot_zeroshot/object_counting.yaml |
sha256=eCOmYJZufH_wmqRICNxCnAJ8qPbxq6f40T4iq2ZADDg
|
719 |
lm_eval/tasks/bbh/cot_zeroshot/penguins_in_a_table.yaml |
sha256=iMRKS9h3NpUU90MmQ7Vzf4MJRVAbKNUXg1-4dlRM3-s
|
776 |
lm_eval/tasks/bbh/cot_zeroshot/reasoning_about_colored_objects.yaml |
sha256=rkICB45Uv8AomM61e-8iatL_SCilCI0UfWKUdXT0reA
|
811 |
lm_eval/tasks/bbh/cot_zeroshot/ruin_names.yaml |
sha256=t4QqzKgua7-v5Pnqp8s8o-YsKEYRdZr2U6pzvFgDnA0
|
771 |
lm_eval/tasks/bbh/cot_zeroshot/salient_translation_error_detection.yaml |
sha256=rtV_kpJ6-Mif2wUrMmIQULrBhQuxFDcfBDt07PoM82g
|
823 |
lm_eval/tasks/bbh/cot_zeroshot/snarks.yaml |
sha256=gH1y98pBpeFVJSdO9diIzlKi0kuYj5H82EIKZQG8KoE
|
1057 |
lm_eval/tasks/bbh/cot_zeroshot/sports_understanding.yaml |
sha256=qC3tfNj-4hfvSFCVtj-ib7hHMLToF7AppQfqmVOyvDY
|
837 |
lm_eval/tasks/bbh/cot_zeroshot/temporal_sequences.yaml |
sha256=ZhQfmkoNIt1SSKNZPfhEXlpXXIF_DLg5y6y4cGcGvG8
|
798 |
lm_eval/tasks/bbh/cot_zeroshot/tracking_shuffled_objects_five_objects.yaml |
sha256=MqI1WvrFkONaQcoCQUk8Aqk8sqlRi3OXsya6Ukrub1E
|
890 |
lm_eval/tasks/bbh/cot_zeroshot/tracking_shuffled_objects_seven_objects.yaml |
sha256=HzD6MUcCdjzReleZFv7oJPsVRHIHWtJYVYWQ-qtGwOw
|
892 |
lm_eval/tasks/bbh/cot_zeroshot/tracking_shuffled_objects_three_objects.yaml |
sha256=FaW5OXsTGhuKTCz_4yuxlYnhLhgp-h6MBT8STObJKDY
|
892 |
lm_eval/tasks/bbh/cot_zeroshot/utils.py |
sha256=03_KQKsfTCHMCwu_HA6HTdhGwXAD-TNlL3W8r1CpnxY
|
8777 |
lm_eval/tasks/bbh/cot_zeroshot/web_of_lies.yaml |
sha256=XRcVudvzDNpMyhLFqIWa0n77DNygmpwiXQ1taDvxk8o
|
849 |
lm_eval/tasks/bbh/cot_zeroshot/word_sorting.yaml |
sha256=BZ_CXxzfuz3XzPzbMifdj6Ep7it5pUUWLujdj7UQ5Cw
|
588 |
lm_eval/tasks/bbh/fewshot/_fewshot_template_yaml |
sha256=dOunUd8nbaafmyfOAX5Zulj8NLpFXbUrw9TqLo4_MyA
|
454 |
lm_eval/tasks/bbh/fewshot/boolean_expressions.yaml |
sha256=1tIp6Y5eC9Dya8yBzxVjdYO4nUCbAlIaFzG-K8xv8Hw
|
367 |
lm_eval/tasks/bbh/fewshot/causal_judgement.yaml |
sha256=vantgzSIBZhR_qxJRO2uWbIgyA7AuKCIR7Sn8_GFqRY
|
2338 |
lm_eval/tasks/bbh/fewshot/date_understanding.yaml |
sha256=ySlQrnYJxmE3GSnL_cqT8jvDqQB5fvEVXMpjEfrhKcA
|
815 |
lm_eval/tasks/bbh/fewshot/disambiguation_qa.yaml |
sha256=6JRUEFVFBTqG17T-072M7uEyLjus--VaiaXsGFatUgs
|
1164 |
lm_eval/tasks/bbh/fewshot/dyck_languages.yaml |
sha256=a394IE2EtX-i8QOBgAu6olHe96syKt1AjxOt8N0bYSE
|
622 |
lm_eval/tasks/bbh/fewshot/formal_fallacies.yaml |
sha256=kqv_qxXfSoSwTViot4G_8yBKEx1uhG8XqOK46g3kqAA
|
1839 |
lm_eval/tasks/bbh/fewshot/geometric_shapes.yaml |
sha256=TZwKR7vJ2Z9x0l7GY1glQ_6_vPTcBQRU7jrzF0AK_aU
|
1074 |
lm_eval/tasks/bbh/fewshot/hyperbaton.yaml |
sha256=hvcnVDCbmUPxnMiI_P6qVVqlUfRtKT8yCvl4KWGAMjM
|
634 |
lm_eval/tasks/bbh/fewshot/logical_deduction_five_objects.yaml |
sha256=dSRQXf8szjv_yDPSHFFxphv022anRQOzPReBqY-s5Ik
|
1539 |
lm_eval/tasks/bbh/fewshot/logical_deduction_seven_objects.yaml |
sha256=ty843RXDantbT5JKldYf4ZtEJcsEIpn9xxBaLGT58Qg
|
1541 |
lm_eval/tasks/bbh/fewshot/logical_deduction_three_objects.yaml |
sha256=oU9T3xpAVcaFyMKhvdkUyPjtTvhrNlJHG8TK3EdcgMQ
|
1541 |
lm_eval/tasks/bbh/fewshot/movie_recommendation.yaml |
sha256=jS9ruvpQwcgiyaR3KVApBGDgf3QyX2wTWx61FFd9PFk
|
906 |
lm_eval/tasks/bbh/fewshot/multistep_arithmetic_two.yaml |
sha256=pwWjm5OLv_qjiu296ZtUrCC0glShTq8uk0H94yV6pWM
|
389 |
lm_eval/tasks/bbh/fewshot/navigate.yaml |
sha256=QOTReNyaIjZyn3F7THRwJuU6CCbuyRBanSC7Onunkb4
|
842 |
lm_eval/tasks/bbh/fewshot/object_counting.yaml |
sha256=6yrD3p-nOVN9ymXekvX1H1YSxWVhSFse8CobjcWI4vE
|
689 |
lm_eval/tasks/bbh/fewshot/penguins_in_a_table.yaml |
sha256=0PM3HhN17hsmGB7TqSIbgveusa0LDW31CQDXZeqZX3k
|
1542 |
lm_eval/tasks/bbh/fewshot/reasoning_about_colored_objects.yaml |
sha256=TTtJaKleXVRX71doDMkk7mx3sw4kcL7axNpBjeiq-vE
|
1509 |
lm_eval/tasks/bbh/fewshot/ruin_names.yaml |
sha256=JMYb663T6w_MJkQGh8jaB1b9RrGFmVtntFnHjfQ_PXg
|
882 |
lm_eval/tasks/bbh/fewshot/salient_translation_error_detection.yaml |
sha256=APT876ojQHdbClvWMR2mUNh29aHRa3jVhi4cETOEivw
|
3738 |
lm_eval/tasks/bbh/fewshot/snarks.yaml |
sha256=FcUe10FIsqJVhKAbrCn6znCzGD0p0EV3I4kGjE9Da6s
|
1226 |
lm_eval/tasks/bbh/fewshot/sports_understanding.yaml |
sha256=06OeVP9JHyVB2-2YtVipiDhp4Q5OwoTEbYmbUDMZ5XU
|
579 |
lm_eval/tasks/bbh/fewshot/temporal_sequences.yaml |
sha256=D6yGSWcJ74UkOHqm6Lhs26h-10ejWb_hnT8jjmuUPG0
|
2117 |
lm_eval/tasks/bbh/fewshot/tracking_shuffled_objects_five_objects.yaml |
sha256=LKa6X23i3JsbfDZejNcofoPl32Oib4q5E09z7eeDRmY
|
1705 |
lm_eval/tasks/bbh/fewshot/tracking_shuffled_objects_seven_objects.yaml |
sha256=Bn-uESnumu6mDPrsNMN8AEB6iwz7A3c_5BvwNDZNais
|
1707 |
lm_eval/tasks/bbh/fewshot/tracking_shuffled_objects_three_objects.yaml |
sha256=XhCmfLNUUK73TRLNMqnFnXrEdh9fgdykesi9weSaNGw
|
1707 |
lm_eval/tasks/bbh/fewshot/web_of_lies.yaml |
sha256=QQomeDW4QMJwaJIaGz9mBQ4wY1rzVHubyiiAhsixLZY
|
813 |
lm_eval/tasks/bbh/fewshot/word_sorting.yaml |
sha256=UhnU8RCtK0DE22qIoaRzo3VKpIUDuV5OjmXdazKHkbU
|
582 |
lm_eval/tasks/bbh/zeroshot/_zeroshot_template_yaml |
sha256=spVv4-z-y5vK0XIFshAUFu62V4p0UZ-FHxuDLtBAgpc
|
498 |
lm_eval/tasks/bbh/zeroshot/boolean_expressions.yaml |
sha256=Tuk0lWtRtnLCBsTLCEoVjnM2H572_4RqsHATK9c7oio
|
473 |
lm_eval/tasks/bbh/zeroshot/causal_judgement.yaml |
sha256=kNc65hI1I1S2BU3JY5hsCNkEWgZ_EQYd92yg0b7OGek
|
461 |
lm_eval/tasks/bbh/zeroshot/date_understanding.yaml |
sha256=Wzvx0IdNhHfdknnixvJySw_zbfz5XOJoJVMpVzccG7Y
|
533 |
lm_eval/tasks/bbh/zeroshot/disambiguation_qa.yaml |
sha256=ttEMcEsDsyhmWk0lQ0MpJiBfN-oxKESlSXfiC9Bj9Lg
|
560 |
lm_eval/tasks/bbh/zeroshot/dyck_languages.yaml |
sha256=jULSUCimkHyjYMbSyWz-3e5Fh4hwXfB8pJXl1pRqdnQ
|
478 |
lm_eval/tasks/bbh/zeroshot/formal_fallacies.yaml |
sha256=nxSdCT_qpDvlblyiBkYwGH0GkE9r6kHzLzSxIdBPu7c
|
481 |
lm_eval/tasks/bbh/zeroshot/geometric_shapes.yaml |
sha256=ug-J6K10cUAtkLyrgHiPq1opVrGTaqJbN08wB_KnycE
|
544 |
lm_eval/tasks/bbh/zeroshot/hyperbaton.yaml |
sha256=RAScn4Nw49gKVviPyOWYdn1FTzhCtt_SQiaMCkRjLC4
|
537 |
lm_eval/tasks/bbh/zeroshot/logical_deduction_five_objects.yaml |
sha256=6ABlB8hVvffXqdRvjCrBGL8W9NaGLa-RymEp2c4U12c
|
612 |
lm_eval/tasks/bbh/zeroshot/logical_deduction_seven_objects.yaml |
sha256=QqSnathmDPy8QeX2vl5Mj5QCkCzb1o1nJfFVB6LSiDA
|
614 |
lm_eval/tasks/bbh/zeroshot/logical_deduction_three_objects.yaml |
sha256=u9vkRxmhHAUVI6VAMWP2eBuaB5rxVM2JjpSIpNs5Hyo
|
614 |
lm_eval/tasks/bbh/zeroshot/movie_recommendation.yaml |
sha256=qN_B4OgxfXhCFNVhclrBDJUf2Jiwo0hoNpMnDwwg0aY
|
561 |
lm_eval/tasks/bbh/zeroshot/multistep_arithmetic_two.yaml |
sha256=3SfYjOOs9kxkf9tcIyFydk9aLwvfpAWbIBgLZkZjxfc
|
491 |
lm_eval/tasks/bbh/zeroshot/navigate.yaml |
sha256=B6dRPFnXuX7DQugeVkTO8yR0407aW2J_OSVk2cHJaSw
|
507 |
lm_eval/tasks/bbh/zeroshot/object_counting.yaml |
sha256=6Q-kZXpMaliqEcl84tarX0zW98dr58BySXtGMZYszYI
|
513 |
lm_eval/tasks/bbh/zeroshot/penguins_in_a_table.yaml |
sha256=OPKYIHMGB0vmRhKW79iAEgY_Vin5OQEIxNrvWFida2g
|
570 |
lm_eval/tasks/bbh/zeroshot/reasoning_about_colored_objects.yaml |
sha256=RP4_eYIh3yCqX2LaZ8RZ3xexILH91ZNdvJCCw_NFdcQ
|
605 |
lm_eval/tasks/bbh/zeroshot/ruin_names.yaml |
sha256=FrgCzr7L0-Zmm4j2SDKtZnTO2urqw1uRliWdque4LUA
|
565 |
lm_eval/tasks/bbh/zeroshot/salient_translation_error_detection.yaml |
sha256=XU-bur6KPqH4QFS6gHqs4iac7NGv4QqEjrMMsTMkUYw
|
617 |
lm_eval/tasks/bbh/zeroshot/snarks.yaml |
sha256=KS0oIOa9ZIUaTORqPSsAbADJCQoMuKxkodxp3FINOqc
|
851 |
lm_eval/tasks/bbh/zeroshot/sports_understanding.yaml |
sha256=k_kuvih4YmCkwomOi8qEp-t13zgyTtzkq3yLQcuLngY
|
631 |
lm_eval/tasks/bbh/zeroshot/temporal_sequences.yaml |
sha256=9UIDSY0kmyLobfY2TMP58M-jpZvNPPOCWjsF1ApItZ0
|
592 |
lm_eval/tasks/bbh/zeroshot/tracking_shuffled_objects_five_objects.yaml |
sha256=IGV3TMZUQzccEgAAegKy95_Pw3DnP1hLI-ZfIar_1Qg
|
684 |
lm_eval/tasks/bbh/zeroshot/tracking_shuffled_objects_seven_objects.yaml |
sha256=K5DfPycBD-RzDXCqJ3Pn18tvtaSMyTE7N8KUWiacgJY
|
686 |
lm_eval/tasks/bbh/zeroshot/tracking_shuffled_objects_three_objects.yaml |
sha256=Th21qaJlSZk7cFK0JvzLA9kPRudT9KDzkkuwAySRAKU
|
686 |
lm_eval/tasks/bbh/zeroshot/utils.py |
sha256=03_KQKsfTCHMCwu_HA6HTdhGwXAD-TNlL3W8r1CpnxY
|
8777 |
lm_eval/tasks/bbh/zeroshot/web_of_lies.yaml |
sha256=WTBOPgr8j2aZ0cG0dAfnIQVhg4cZYmeQvkj8WstGG3A
|
643 |
lm_eval/tasks/bbh/zeroshot/word_sorting.yaml |
sha256=c8SQ9dZlfgm1vBVbWD7tyt45kg-nNaEoErtypkdUKyA
|
383 |
lm_eval/tasks/belebele/README.md |
sha256=DePrXLzy0Wd8hP3XqMGXlXBRLZsczh1aEN4-MhTxMv4
|
2578 |
lm_eval/tasks/belebele/_default_template_yaml |
sha256=hMGUIoew0r-3Dw2A-P2useomrT3hIWkYHXmEUIWtS8w
|
610 |
lm_eval/tasks/belebele/_generate_configs.py |
sha256=bmzhiS_Dkza-rBeEsXHzQyEGhRr5SaQzOgkUDoIbNYg
|
1978 |
lm_eval/tasks/belebele/belebele_acm_Arab.yaml |
sha256=1EvD-A0S4aFieLpRE8EyQUzhj0ZCARV9bh7b1IyT9NE
|
117 |
lm_eval/tasks/belebele/belebele_afr_Latn.yaml |
sha256=-atGz1AmNzkqVNXeb5ZSZuXOK7lx7fw28gSmZAzS66Q
|
117 |
lm_eval/tasks/belebele/belebele_als_Latn.yaml |
sha256=2yR3mcGjcCK9pVecpN09CnlvyLkGialK4R2Zqrdih0w
|
117 |
lm_eval/tasks/belebele/belebele_amh_Ethi.yaml |
sha256=f5GKkWm4TqrVt7m4Zp-OSIl64-9XUNUWzm7LnCg0QAY
|
117 |
lm_eval/tasks/belebele/belebele_apc_Arab.yaml |
sha256=wqYmY4n6VbEuy1wRXmyaLK62uNjTbBfbGroAI129MvE
|
117 |
lm_eval/tasks/belebele/belebele_arb_Arab.yaml |
sha256=9rVkD5-hU08GXYD0E2vs7ndfvThtvJx8dgHqW5FiWII
|
117 |
lm_eval/tasks/belebele/belebele_arb_Latn.yaml |
sha256=HAZaQhih9A1KZMjS7bICwNnI4m8qCF4-D1nrqPB0-wo
|
117 |
lm_eval/tasks/belebele/belebele_ars_Arab.yaml |
sha256=jb1TkLdTDYU5v7NK5LjJ06iqW9i3pjw3MluV7lyfAns
|
117 |
lm_eval/tasks/belebele/belebele_ary_Arab.yaml |
sha256=WFDY0FNZ7geoOBztlOG4y40P_pAE0HAfCmh8nNiBxa4
|
117 |
lm_eval/tasks/belebele/belebele_arz_Arab.yaml |
sha256=Zi0UrUO05QHGDD14hGsgHzWVyqwitOt9ayxZcdpOvdY
|
117 |
lm_eval/tasks/belebele/belebele_asm_Beng.yaml |
sha256=_W0B2Qk1Ktmw8bs3sMG30E5sLq7yM7U8Z5kCRJcYiCU
|
117 |
lm_eval/tasks/belebele/belebele_azj_Latn.yaml |
sha256=kISIrd3IeaVgQdoava3ztCLrAguTW8yWJaW9FwZU_SQ
|
117 |
lm_eval/tasks/belebele/belebele_bam_Latn.yaml |
sha256=O1bSMR9YcaXKIWCcZ1Q4YO68Paq7MuvoGEMIfoq9r24
|
117 |
lm_eval/tasks/belebele/belebele_ben_Beng.yaml |
sha256=KH3JBcMroICfZ7dB91Su8ZL9HLg9j0A7PrC3ygRy2mo
|
117 |
lm_eval/tasks/belebele/belebele_ben_Latn.yaml |
sha256=iwhPd2MbJnGNzNfztAkKNCdzmRdzJv0jOmY6xm6OO_M
|
117 |
lm_eval/tasks/belebele/belebele_bod_Tibt.yaml |
sha256=3OmaJOqZQrVhTRVs_bAse9Hkx0jPthM-e7Qesx5bUZE
|
117 |
lm_eval/tasks/belebele/belebele_bul_Cyrl.yaml |
sha256=O40wFliFb7RfTcMBpRtfsSswlUJ_y9W8vTeK42jekEA
|
117 |
lm_eval/tasks/belebele/belebele_cat_Latn.yaml |
sha256=pb9_eJUCZgxUY_7Vd-D_kQn4-nAdhNpzWWPyOo738SU
|
117 |
lm_eval/tasks/belebele/belebele_ceb_Latn.yaml |
sha256=bqLKicn1-cc6VH8R74Krr4VM-tHKUY6aph6yVycVr8M
|
117 |
lm_eval/tasks/belebele/belebele_ces_Latn.yaml |
sha256=NLddlp1RVQW4XeOHn4I7ScxOzR-t8lXBXHXdmr01U-s
|
117 |
lm_eval/tasks/belebele/belebele_ckb_Arab.yaml |
sha256=2ohEPKdOGOOxRRSq8ysjbCqtw3l4h_L5s3G9Oi_bjds
|
117 |
lm_eval/tasks/belebele/belebele_dan_Latn.yaml |
sha256=5LnL6d2TGWiT42JpPm69D2gsFueGX-xYh9Owyb5ag60
|
117 |
lm_eval/tasks/belebele/belebele_deu_Latn.yaml |
sha256=x4Gd020iF0eFTHkyxohGpdm1no8yPUaS5yjHsUAbT1U
|
117 |
lm_eval/tasks/belebele/belebele_ell_Grek.yaml |
sha256=vM7mypRDURpF0Oc703Mx47tpRi2hApOKtf-C6NwuMWc
|
117 |
lm_eval/tasks/belebele/belebele_eng_Latn.yaml |
sha256=exv25-DfKV7Bx3INWGwwghJfYAcfcYOX7EheORHk4qY
|
117 |
lm_eval/tasks/belebele/belebele_est_Latn.yaml |
sha256=ZCisUJNjRcfevGTCogzmXsbNRKGtOwpRryPeQeRzbV4
|
117 |
lm_eval/tasks/belebele/belebele_eus_Latn.yaml |
sha256=zzKDT_vQWPxeYGTCFS3YPZWBqWDkRTw7fQAPx3IrNAU
|
117 |
lm_eval/tasks/belebele/belebele_fin_Latn.yaml |
sha256=ld5ZobQ_dPSs8vtKWWQJM9sU4WE-y3ePQOxmYczEg2U
|
117 |
lm_eval/tasks/belebele/belebele_fra_Latn.yaml |
sha256=HRTV1uCb95Sfi-9C0SGSoCy4BLL8OnuK8cP3SEaJsvw
|
117 |
lm_eval/tasks/belebele/belebele_fuv_Latn.yaml |
sha256=2zgs1M4_uFUikuIl9zuhluI-y0Yn2NDthPAcLCr5IG0
|
117 |
lm_eval/tasks/belebele/belebele_gaz_Latn.yaml |
sha256=Am-KDq308E6D2MxQL_cj4GddvwZN2_U4fuCBrOgD4SM
|
117 |
lm_eval/tasks/belebele/belebele_grn_Latn.yaml |
sha256=c6ZbthYlFYhx32oXb_nksrQlFJ4wrzziQ-vnwt2XYOc
|
117 |
lm_eval/tasks/belebele/belebele_guj_Gujr.yaml |
sha256=ZrDrbaxwMdkB7hrr1tD90wm076RRUrv_uo3jUN8YPmI
|
117 |
lm_eval/tasks/belebele/belebele_hat_Latn.yaml |
sha256=IFDS5Pz1qx7gekhhEYd6vQ3wts43bPs4ZhA5OU6V1Bo
|
117 |
lm_eval/tasks/belebele/belebele_hau_Latn.yaml |
sha256=lzkLcA63Ilek158eAaEYHmPR4iXHA6dRCCYsWqgHNs0
|
117 |
lm_eval/tasks/belebele/belebele_heb_Hebr.yaml |
sha256=sHdqpr5kNxhpJGHzy7OIrctOjTt7qBMBXHkJCObwjDk
|
117 |
lm_eval/tasks/belebele/belebele_hin_Deva.yaml |
sha256=5TxiK1wZ0rHN2b3pyEOvyVuzqWBqt_tzq_ft4w1bdF0
|
117 |
lm_eval/tasks/belebele/belebele_hin_Latn.yaml |
sha256=XZfEoXE4J9vZjqGfcoPN1Q-N-G-hkysvdQ3I2yklnnw
|
117 |
lm_eval/tasks/belebele/belebele_hrv_Latn.yaml |
sha256=UGkkEmKyJVKZsClWkfiYQQz86U1C21YSrsLySadGoV8
|
117 |
lm_eval/tasks/belebele/belebele_hun_Latn.yaml |
sha256=2mC9F1P-LHPz6Q71fk_P7simWeAmcoexIZZI-EoDIFM
|
117 |
lm_eval/tasks/belebele/belebele_hye_Armn.yaml |
sha256=mqTHfv7HjWEjbqRS07DhAXCfBrCOUHCNY4LxmrFBr50
|
117 |
lm_eval/tasks/belebele/belebele_ibo_Latn.yaml |
sha256=_U-K5_h-vvxC-zqYSLaPZR_n5JtUg89MVPHI6iRgvzU
|
117 |
lm_eval/tasks/belebele/belebele_ilo_Latn.yaml |
sha256=SqaY3Uj_Yuf-E4E_oOcNm_0p9eDJE_s8Dbm6eWTnZTM
|
117 |
lm_eval/tasks/belebele/belebele_ind_Latn.yaml |
sha256=oFOtiL0XoghRrIm2_hGMVpO28XUb0nAJ3fp8Mcrua2w
|
117 |
lm_eval/tasks/belebele/belebele_isl_Latn.yaml |
sha256=BJsHBBT0IVJCsjOrZVrz9eh07KQLLJ70cCYt9zOQB7U
|
117 |
lm_eval/tasks/belebele/belebele_ita_Latn.yaml |
sha256=fCduE0IoxoROD_2xdQsnyLGJqtPMw8vc5tkU4ANl0Rk
|
117 |
lm_eval/tasks/belebele/belebele_jav_Latn.yaml |
sha256=fggfgk-_2kwTOttkMH9Belu111ddkcCT4VvWXL6XpTk
|
117 |
lm_eval/tasks/belebele/belebele_jpn_Jpan.yaml |
sha256=59SsgQqaPm0tHxWIfu-RzU8wRq3MF_WPA2iol59Vegc
|
117 |
lm_eval/tasks/belebele/belebele_kac_Latn.yaml |
sha256=KBO64zzpJl62LJqMI5IDB9sX3yt4soxAgrFtbUKmlQ8
|
117 |
lm_eval/tasks/belebele/belebele_kan_Knda.yaml |
sha256=na6caVGyAWF_ajjALHQTHKxXWvm5nkjwTMqpAZ7fV0U
|
117 |
lm_eval/tasks/belebele/belebele_kat_Geor.yaml |
sha256=mbMOTih_ujZpjVtGVxtsU3QhWHpKS5zDJ3jnxQCHtgM
|
117 |
lm_eval/tasks/belebele/belebele_kaz_Cyrl.yaml |
sha256=4Erwu3m4wHLwAHEVDwz34Y-AnDg4pYCz9EfJ1VAwcPY
|
117 |
lm_eval/tasks/belebele/belebele_kea_Latn.yaml |
sha256=LzFw_MSbqsCXHm95N-20xGnu5wukru87QfUByDngN70
|
117 |
lm_eval/tasks/belebele/belebele_khk_Cyrl.yaml |
sha256=9mvQti4PxJQsk4tHYtg4WcN0OfGUCl6ozgbEuuKnFPo
|
117 |
lm_eval/tasks/belebele/belebele_khm_Khmr.yaml |
sha256=_I0Ma_R1xqmv1N57xIviUIF3AVDvT7ehbBJYe5uxYuo
|
117 |
lm_eval/tasks/belebele/belebele_kin_Latn.yaml |
sha256=xF0bTypUAQB-D7ED0L_eL-am8vN8FlvrkJoZkt0i7QA
|
117 |
lm_eval/tasks/belebele/belebele_kir_Cyrl.yaml |
sha256=b77pIdwRhj34n1f_Bgp4Ch8Q5bngvYetuk6qPSHxsF8
|
117 |
lm_eval/tasks/belebele/belebele_kor_Hang.yaml |
sha256=tZUX8rsTKLVCIPo2VyC6vg5IT_0g3S_sSYD7fSqYjyk
|
117 |
lm_eval/tasks/belebele/belebele_lao_Laoo.yaml |
sha256=0nriykEwGK8cHGjTX4-MUPJPxIEZCIc_4LbgrCcgztA
|
117 |
lm_eval/tasks/belebele/belebele_lin_Latn.yaml |
sha256=dd91MkzxL14bKD_OVWfFsCac4No8VkNWKDF2csAxHx0
|
117 |
lm_eval/tasks/belebele/belebele_lit_Latn.yaml |
sha256=4ciRkZXnOnOyEUdQGlS9ioG6-eJ51hXOutfxtvHeD88
|
117 |
lm_eval/tasks/belebele/belebele_lug_Latn.yaml |
sha256=2TaDy-FDr93w_NNUtGvSr-Hls9KmGfT8ZbZa1go7cLk
|
117 |
lm_eval/tasks/belebele/belebele_luo_Latn.yaml |
sha256=sCCOcx2NArKXFbF5YsHSkQnVj920HdOAsI7yrYXVfD4
|
117 |
lm_eval/tasks/belebele/belebele_lvs_Latn.yaml |
sha256=yAka2b99-TlTedbQXMBdOY7ZuaNKfY5CI73MqWGDSfw
|
117 |
lm_eval/tasks/belebele/belebele_mal_Mlym.yaml |
sha256=60y_Z4Xf21CBLFbLfUpe92hhSqUpKeMkTNlRv7Fu0GM
|
117 |
lm_eval/tasks/belebele/belebele_mar_Deva.yaml |
sha256=iHy8kLYyzPHUxfzLPvcJhWGhfaY7KdaDqENqMti3weM
|
117 |
lm_eval/tasks/belebele/belebele_mkd_Cyrl.yaml |
sha256=lxXvzZAAP34VcwptDgNSqmG6P4FXsdbHBcrIDsw-fGM
|
117 |
lm_eval/tasks/belebele/belebele_mlt_Latn.yaml |
sha256=tlR9FYl_VLMLEPJnAf93VKykJ9yU7V7P4LrHaThUIYY
|
117 |
lm_eval/tasks/belebele/belebele_mri_Latn.yaml |
sha256=cXsDUC1lhfpEyywS1c06Pf0qzmuOHBp4IJXfGLW3vso
|
117 |
lm_eval/tasks/belebele/belebele_mya_Mymr.yaml |
sha256=s6LUjwN2bknAT88o3v4-LOO_YV6yEKo3Gg3WtOE7zvM
|
117 |
lm_eval/tasks/belebele/belebele_nld_Latn.yaml |
sha256=Dd2fed3FJIt6lJ4N2QzpE12seXIouq4SSuFK3s05Jqo
|
117 |
lm_eval/tasks/belebele/belebele_nob_Latn.yaml |
sha256=9CIyMcCp5oJW3sJbJSXgMM3pv8TAFMVwQ2mAXNdY5kk
|
117 |
lm_eval/tasks/belebele/belebele_npi_Deva.yaml |
sha256=UCQ7yWzYicrv3fp8vqDeQ8rLynq8T_ZPX4AvkBRMa1E
|
117 |
lm_eval/tasks/belebele/belebele_npi_Latn.yaml |
sha256=vZTqvqA86lzAQqXcAxA2bnlEWz3NekYkjpPHHz_tdX4
|
117 |
lm_eval/tasks/belebele/belebele_nso_Latn.yaml |
sha256=PT5LT5fwLTyvB4ruIK9qyt-LaCM-pasXUb2aRzloTL4
|
117 |
lm_eval/tasks/belebele/belebele_nya_Latn.yaml |
sha256=62xoCFekdxpvUFLcfhH0QLqbwkxaNuBCaV_hNKf5DPo
|
117 |
lm_eval/tasks/belebele/belebele_ory_Orya.yaml |
sha256=W6frQwbg9z69i8_mKHf-oHRvUJhIVHw5988Ij4hg-SM
|
117 |
lm_eval/tasks/belebele/belebele_pan_Guru.yaml |
sha256=Gtanduetmm9mE0DLDN8fF0ELS2RtmfQaty3Ag851u6g
|
117 |
lm_eval/tasks/belebele/belebele_pbt_Arab.yaml |
sha256=l5v5c1y3oLECT8r5TBASKJNotUGaudZyWtNnkxUoTC4
|
117 |
lm_eval/tasks/belebele/belebele_pes_Arab.yaml |
sha256=lfO-93-WV0kHChUTwZNGN_67SnuE_dWWPMXodxNChcI
|
117 |
lm_eval/tasks/belebele/belebele_plt_Latn.yaml |
sha256=qxFFK8hTsOfzUwf0JhYYnj1faapl1fvOJidHkKmZcQE
|
117 |
lm_eval/tasks/belebele/belebele_pol_Latn.yaml |
sha256=wPXTjvfgiYw-wq-AqRjmvceeKaiZKGxcc5DSLYFnZhI
|
117 |
lm_eval/tasks/belebele/belebele_por_Latn.yaml |
sha256=9ZSsYjV_agSrefKGwtAj2Leaf4YgPCrwFJXA7cXZWgg
|
117 |
lm_eval/tasks/belebele/belebele_ron_Latn.yaml |
sha256=YhzeVLH-lCrMe2FgXoRCbN799a9Begb2iNm_K52XWg4
|
117 |
lm_eval/tasks/belebele/belebele_rus_Cyrl.yaml |
sha256=MBdiGKUaM3XvGC5TcUMjjhLHZaKreZRvBwUXYjMqiEk
|
117 |
lm_eval/tasks/belebele/belebele_shn_Mymr.yaml |
sha256=VBKTseVSUZWZjlV_Qqw1JyUjijuazHPS-G59vSlEAOI
|
117 |
lm_eval/tasks/belebele/belebele_sin_Latn.yaml |
sha256=Pq4mtdhkZ8GEiQpBUtA9ZJ0yGtd6QvzGFt5iIeJ7QqY
|
117 |
lm_eval/tasks/belebele/belebele_sin_Sinh.yaml |
sha256=jbH9mN1vERNn1iDUeiLjWxJQNlrtSlt9x8j66yhSpqE
|
117 |
lm_eval/tasks/belebele/belebele_slk_Latn.yaml |
sha256=ez3bUC6z6AgbHbF5Ahxjm9XrMLWLzijMjV2LpnWRVak
|
117 |
lm_eval/tasks/belebele/belebele_slv_Latn.yaml |
sha256=LTsIYDCpt-G2JVHbIK5TsMDxRBF57QshikHoGDB2cs8
|
117 |
lm_eval/tasks/belebele/belebele_sna_Latn.yaml |
sha256=eQ8BbzbPdD3ReBkMm8JldqntqdQQcd6IMPsewbE9tHw
|
117 |
lm_eval/tasks/belebele/belebele_snd_Arab.yaml |
sha256=XQfQzK89afh2Rb73AsML___G67mc7j5bbBqaiudEkrw
|
117 |
lm_eval/tasks/belebele/belebele_som_Latn.yaml |
sha256=AFsIV2QqGYqwwu3ymjEpwHStRcym9zo3NfUB9bDcr8Y
|
117 |
lm_eval/tasks/belebele/belebele_sot_Latn.yaml |
sha256=DkgjgGaN49OUla6LQd-PWZ3oigBLaHxiFZCmMomkvwU
|
117 |
lm_eval/tasks/belebele/belebele_spa_Latn.yaml |
sha256=RnnQVuumrNH4t6wNyqCAu0KHqixtl14K_GrsHlRo1ik
|
117 |
lm_eval/tasks/belebele/belebele_srp_Cyrl.yaml |
sha256=MJMi_zj1sDAANAparEXXhpBsKsFl72aulVCvwtg608s
|
117 |
lm_eval/tasks/belebele/belebele_ssw_Latn.yaml |
sha256=z4ZlK52dPg7Iy1huGmqdQshPkf0lkdgfDGSCNuWRDDM
|
117 |
lm_eval/tasks/belebele/belebele_sun_Latn.yaml |
sha256=U0zXr_wJ_PZCTkD3w43aJg-1az-am598syHo4L0GDH0
|
117 |
lm_eval/tasks/belebele/belebele_swe_Latn.yaml |
sha256=FSamGbZJjEyaywTY04GEaXeH562KMAO_JQ5wJ6CP5zw
|
117 |
lm_eval/tasks/belebele/belebele_swh_Latn.yaml |
sha256=vJ6HXNruMr6mo2n0ZRrAckEXCaBQSLlQ2PNNuKKWC6k
|
117 |
lm_eval/tasks/belebele/belebele_tam_Taml.yaml |
sha256=0fEr-Wet29O9dCiPfWB8a1O158DT2J8c9hUtrcOLnHo
|
117 |
lm_eval/tasks/belebele/belebele_tel_Telu.yaml |
sha256=kzX2E7ozzn13_6ztXcwLBQh5ZECKJ9a9uI-8UKF7F08
|
117 |
lm_eval/tasks/belebele/belebele_tgk_Cyrl.yaml |
sha256=1OMlPVKbPojktAzAiNtWo_oC4oPZfDlEQSRhEpCwV2E
|
117 |
lm_eval/tasks/belebele/belebele_tgl_Latn.yaml |
sha256=AoE2baYqrPrNvXpGQHi-cMIjveeWko0xs5smctyNUV8
|
117 |
lm_eval/tasks/belebele/belebele_tha_Thai.yaml |
sha256=_7bdsGsN_IqJLAi1wFkyhPcPimpWp1SkGc5VnPYV5I0
|
117 |
lm_eval/tasks/belebele/belebele_tir_Ethi.yaml |
sha256=Nko8UZ1kSbcWhxCL3v8jtdqgK99kipth0iZPaWZ4r5A
|
117 |
lm_eval/tasks/belebele/belebele_tsn_Latn.yaml |
sha256=0ctcFmW4qJ2GB3m63-I3uNlgYX93NkGUSXV3cUSVyRs
|
117 |
lm_eval/tasks/belebele/belebele_tso_Latn.yaml |
sha256=NaVyWnhITUTXHFovQbnUyiF2aAULB5G7TVNqrrO8eWE
|
117 |
lm_eval/tasks/belebele/belebele_tur_Latn.yaml |
sha256=woe79SthhsQhHJAAGeIv5kPjfO7LjMGqsjgyrMBm5T0
|
117 |
lm_eval/tasks/belebele/belebele_ukr_Cyrl.yaml |
sha256=_h-10kKVwf5h8L2PRheQWKPDEKJgsZvf-WTQ_xYJpN8
|
117 |
lm_eval/tasks/belebele/belebele_urd_Arab.yaml |
sha256=blghiHBZpPRoju-cqpl7FiGG1hyGbRQzbMfkP-p4YwY
|
117 |
lm_eval/tasks/belebele/belebele_urd_Latn.yaml |
sha256=ZDxfot4bKgcXLW8SBH42zfbL7KcZF3bFf164lYz6yxY
|
117 |
lm_eval/tasks/belebele/belebele_uzn_Latn.yaml |
sha256=HaAURsOkDmCatCT8EgH0q2ni3HDMn05wlLIpQA8iIgQ
|
117 |
lm_eval/tasks/belebele/belebele_vie_Latn.yaml |
sha256=QNko1Yqj_PSIPJm0kIQZV-ujAvMGCpKBukma2PIV6P4
|
117 |
lm_eval/tasks/belebele/belebele_war_Latn.yaml |
sha256=U5xdsP0LNGHbqWt9BkP3MeLHPL7afj7MKqotfSRDj3o
|
117 |
lm_eval/tasks/belebele/belebele_wol_Latn.yaml |
sha256=DhZ8fA-SnFNCBYit3sDIR7fVE02GqyJ1RVpm6vNMvyc
|
117 |
lm_eval/tasks/belebele/belebele_xho_Latn.yaml |
sha256=0nT5V3mr1_ShbzFNRQspUDawxy3Fcb8RAH1XU-s1aHQ
|
117 |
lm_eval/tasks/belebele/belebele_yor_Latn.yaml |
sha256=eNSl6gNTISIuwT_tn23c9Olj5q4UrEffBAxfG6v1POU
|
117 |
lm_eval/tasks/belebele/belebele_zho_Hans.yaml |
sha256=F-jD_qluePBEYSZFgPhvQjhp-tgAcp3Vv2cMWu1d-js
|
117 |
lm_eval/tasks/belebele/belebele_zho_Hant.yaml |
sha256=-3ZBT_ESjzRWjLOa5x172BS910ayI7uqtWgCvkfAYwM
|
117 |
lm_eval/tasks/belebele/belebele_zsm_Latn.yaml |
sha256=bMob3HTMA0DwI7Qc81RINHLB5I57VznQhkuApHW9Qos
|
117 |
lm_eval/tasks/belebele/belebele_zul_Latn.yaml |
sha256=7M_qJjo6XAhlWG6xC99bXvWkU4g6XDvEvOSWzkga4BA
|
117 |
lm_eval/tasks/benchmarks/minerva_math.yaml |
sha256=lb2Yn4TfnswputGzd0vO4yX4YpfqZp-drdOfWViJA80
|
231 |
lm_eval/tasks/benchmarks/openllm.yaml |
sha256=SE8PyOTLK5FEUf9VKnzxzae1JgII7tp2-UZdVgVrKzw
|
368 |
lm_eval/tasks/benchmarks/pythia.yaml |
sha256=xb6ysr5Wkze05aUl0DS6aKWKN4d3-WBXHInrmE3Q4Uk
|
135 |
lm_eval/tasks/benchmarks/t0_eval.yaml |
sha256=NfW-WLp-pnT4hQrmNyO1Du6DHVscevER86MHVSf_zVE
|
3491 |
lm_eval/tasks/benchmarks/flan/_held_in_template_yaml |
sha256=8dsDGbiy4jXYWwg1jzpjFi9MOkc6bkH1Pt5YFW9gSEM
|
255 |
lm_eval/tasks/benchmarks/flan/flan_held_in.yaml |
sha256=NzCeaWvM7ZBl5iAJLg89uQivP9EhxbXkHVjHwy2RolY
|
19112 |
lm_eval/tasks/benchmarks/flan/flan_held_out.yaml |
sha256=5vHKmz0WUNCMugMItX0Ym8metOG1IU8anff9aGyMq9Q
|
247 |
lm_eval/tasks/benchmarks/multimedqa/README.md |
sha256=3i7dHJvrbpWYzjn5W51-sl-FUxQhvM9hsi738TrSQzM
|
2373 |
lm_eval/tasks/benchmarks/multimedqa/multimedqa.yaml |
sha256=8cLeL6MaferIiOgpiLjF55a_4x2WsulJzvWkwNkj4yg
|
506 |
lm_eval/tasks/bigbench/README.md |
sha256=-S-u9m2fxpIOoIvS4K1LS2Td3WfjFw4XFh6FnJXOGWM
|
9772 |
lm_eval/tasks/bigbench/generate_tasks.py |
sha256=ohM-7aw3ej1GrtJgEZkZv_S1w2s3HCvmwOJakRo2coc
|
5595 |
lm_eval/tasks/bigbench/generate_until_template_yaml |
sha256=sbd04VMXY4sqC54noXYP6TH8givQRdRqlB0mGdmjdRc
|
509 |
lm_eval/tasks/bigbench/multiple_choice_template_yaml |
sha256=3_mHPZc4arbTwc726wj6pHa45RxOSo9wzoJ5hDgFAD4
|
502 |
lm_eval/tasks/bigbench/push_bigbench_dataset.py |
sha256=daBJd2p0mzmfN2CRDCBREFRwjtDoMY_k2veE97XuboQ
|
1035 |
lm_eval/tasks/bigbench/generate_until/abstract_narrative_understanding.yaml |
sha256=0QLUsd46oJza1RWtto1OHpdpxd8r79lLZJ-8eFNw5ZY
|
185 |
lm_eval/tasks/bigbench/generate_until/anachronisms.yaml |
sha256=T1Fc7bNpFatJyeTOAZ61FOA_vQkkMwPpgFLvEe3tMGE
|
145 |
lm_eval/tasks/bigbench/generate_until/analogical_similarity.yaml |
sha256=I-HNuu_mTxqRNiAGpiyEpoMbm4ViZJpd8tdPD-fkW5g
|
163 |
lm_eval/tasks/bigbench/generate_until/analytic_entailment.yaml |
sha256=4IpGceDe68otlD7i617DSBXqhw067Y4AjpYVWYnfURU
|
159 |
lm_eval/tasks/bigbench/generate_until/arithmetic.yaml |
sha256=--6zcCrvHwjcE1SSujrnoCHDXpTo4c2CT9sosctJ0qY
|
141 |
lm_eval/tasks/bigbench/generate_until/ascii_word_recognition.yaml |
sha256=QhBAm87LFXXIztQjATqtE1QG2s3JOkADRvbiASZcsOM
|
165 |
lm_eval/tasks/bigbench/generate_until/authorship_verification.yaml |
sha256=J7qQUerJLmxVwptNTbsFlZrDn3WWjxyA-i6aDY-iQ7I
|
167 |
lm_eval/tasks/bigbench/generate_until/auto_categorization.yaml |
sha256=ZSVByX3aUgSSa_dUYHfJvm6bX6ID5iFF9pZodjWzudI
|
159 |
lm_eval/tasks/bigbench/generate_until/auto_debugging.yaml |
sha256=EwWe_JEyKN8cQTnhvMFV2T40Td2Igaq0rWuvm9VFVaU
|
149 |
lm_eval/tasks/bigbench/generate_until/bbq_lite_json.yaml |
sha256=x7II4n0ImBk4HwpbXn6Dap0no5YBdrizIo3qqeoIstQ
|
147 |
lm_eval/tasks/bigbench/generate_until/bridging_anaphora_resolution_barqa.yaml |
sha256=QFdj_nZPzivXQ_99MACTqsq_hNqpOXwAv0JBvnKZQZU
|
189 |
lm_eval/tasks/bigbench/generate_until/causal_judgment.yaml |
sha256=f9fiw28Jp_YEeRgrbmUG8dwtt7l6Up22-1-r-uhDyuY
|
151 |
lm_eval/tasks/bigbench/generate_until/cause_and_effect.yaml |
sha256=5GlQQ-CAgOwXPypYnjRMpdyZ7fA4a-x6REDBEPpmFGo
|
153 |
lm_eval/tasks/bigbench/generate_until/checkmate_in_one.yaml |
sha256=eWi6zh5n4gwBcE3J7IMiyNttiy2EYvOTAcMMB3Q33lI
|
153 |
lm_eval/tasks/bigbench/generate_until/chess_state_tracking.yaml |
sha256=anlmDNc-UuKZhgvd4bGHfnloD0817tEiYWuoMBrstVI
|
161 |
lm_eval/tasks/bigbench/generate_until/chinese_remainder_theorem.yaml |
sha256=hUIYsvTxDFpXOBBR3rc5ByHjK-kCr0IJuYD4-uCEeqU
|
171 |
lm_eval/tasks/bigbench/generate_until/cifar10_classification.yaml |
sha256=E96IQAlynQhHjAYzJh3CIy3o1oF5Np0onr3Y0G0dS1Y
|
165 |
lm_eval/tasks/bigbench/generate_until/code_line_description.yaml |
sha256=EbyOJ6tcfb56fDC7jKERqViylqMzNZReN5N4tFrp054
|
163 |
lm_eval/tasks/bigbench/generate_until/codenames.yaml |
sha256=RHFfLNH_PvBByvta_z2FSqC0MgA5V7lr6ORRJN5IjO0
|
139 |
lm_eval/tasks/bigbench/generate_until/color.yaml |
sha256=V66z_3cDIsLWHt7cHqnPGfFFvgVBypj-jqW60l4WGy0
|
131 |
lm_eval/tasks/bigbench/generate_until/common_morpheme.yaml |
sha256=DMnQE0PnPan9Z10yajvyM6AnDz2SNKrmID06eKfW-aU
|
151 |
lm_eval/tasks/bigbench/generate_until/conceptual_combinations.yaml |
sha256=wN2KQGaT9pun0hOWwe3jrAkjh2lZScYr2jJtiKfPiCA
|
167 |
lm_eval/tasks/bigbench/generate_until/conlang_translation.yaml |
sha256=-HU-3JkFMpn4vPatZMO3gA6vAJBfdc5XISmYzTDIuMc
|
159 |
lm_eval/tasks/bigbench/generate_until/contextual_parametric_knowledge_conflicts.yaml |
sha256=CgIDUv6CCJ07FK6H_ATyzqHq8uy_p4ktGWawP8Bmy64
|
203 |
lm_eval/tasks/bigbench/generate_until/crash_blossom.yaml |
sha256=_kEHp_E3G1AXRC0UsLL6LLJN0o7OXpaobTZl9idnP9w
|
147 |
lm_eval/tasks/bigbench/generate_until/crass_ai.yaml |
sha256=Gjf50yyrvFYa2uCcpcu6IJEw4_GpvPtLaIt_dHSgKiw
|
137 |
lm_eval/tasks/bigbench/generate_until/cryobiology_spanish.yaml |
sha256=tIqxreR7fTTOmPbYthVH-SEuzjgJQhfAdm7wkQx_CPw
|
159 |
lm_eval/tasks/bigbench/generate_until/cryptonite.yaml |
sha256=5QWZppWvBkcS3wifv3cihe1fCKTZnwVvmtifEkPjgbE
|
141 |
lm_eval/tasks/bigbench/generate_until/cs_algorithms.yaml |
sha256=Bs4PE7GgZLTX3cPlHHaFqcDmmoEfUOc5V_Gmipya7ls
|
147 |
lm_eval/tasks/bigbench/generate_until/dark_humor_detection.yaml |
sha256=u98XLx00QqxUlZyScZSaDghGG2XNblgVvQMYLzWW-5I
|
161 |
lm_eval/tasks/bigbench/generate_until/date_understanding.yaml |
sha256=ikMqfOMsIQ5sMEu5F6jmiPZ1QIk55BMoWgPmlD2YZZc
|
157 |
lm_eval/tasks/bigbench/generate_until/disambiguation_qa.yaml |
sha256=3AfjnL9sxOL7-mS00bAMCer8ytGaceP-AEVKJ036qCg
|
155 |
lm_eval/tasks/bigbench/generate_until/discourse_marker_prediction.yaml |
sha256=IDsWjfdbnWGCmPZOPXF1cCqoae05UYLPwO2FJ2SqHVE
|
175 |
lm_eval/tasks/bigbench/generate_until/disfl_qa.yaml |
sha256=slBKpOw28f7O4FrQjm43gqzcHgOB9-2ysKGTlOXcIt0
|
137 |
lm_eval/tasks/bigbench/generate_until/dyck_languages.yaml |
sha256=Nf4uiVjkZB78bKbFEbnXRE3-4eTd4oHhWOAQsg4zOsY
|
149 |
lm_eval/tasks/bigbench/generate_until/elementary_math_qa.yaml |
sha256=cvAGFFzJcYgDKDmdDfWoJxpPfGYcoH5YKM6hJv-504o
|
157 |
lm_eval/tasks/bigbench/generate_until/emoji_movie.yaml |
sha256=xE60hkJ3GUO1IzxA5kyWTgQGN8MdpsFL6U44ABSzpgQ
|
143 |
lm_eval/tasks/bigbench/generate_until/emojis_emotion_prediction.yaml |
sha256=XmwhQbFtBGHBvKcFeBNyaVvGZntHdIveeRV_6cdr7Wg
|
171 |
lm_eval/tasks/bigbench/generate_until/empirical_judgments.yaml |
sha256=kjuLT2A-PhCTmqnBMu0msAkVL09fHHoTpszp-2Rmvxs
|
159 |
lm_eval/tasks/bigbench/generate_until/english_proverbs.yaml |
sha256=C-ssB8SgXTSpWuxyjMBTQX9mBwKvHNNzO4nYcVauhjc
|
153 |
lm_eval/tasks/bigbench/generate_until/english_russian_proverbs.yaml |
sha256=jN-poiQ4U4UCdcHf7RMV6hcZBoKFEvuzdkxBUqD4uFY
|
169 |
lm_eval/tasks/bigbench/generate_until/entailed_polarity.yaml |
sha256=_gaT1mv0iFYNMbZTGfWeifF6TB8KxASgiyEeXY0vrH0
|
155 |
lm_eval/tasks/bigbench/generate_until/entailed_polarity_hindi.yaml |
sha256=RE9kwhgved0dXeKgFCjeFtETtB9FuTgL94iiNSExJj0
|
167 |
lm_eval/tasks/bigbench/generate_until/epistemic_reasoning.yaml |
sha256=J-n430fnOd4kw4zRySnYYUG-e7GnxadwVAtqU3S8NRc
|
159 |
lm_eval/tasks/bigbench/generate_until/evaluating_information_essentiality.yaml |
sha256=6fKxC324hKwqkpV_6MTNNsLicGevovD1iKDflOtOzhM
|
191 |
lm_eval/tasks/bigbench/generate_until/fact_checker.yaml |
sha256=QZ2tsTKpy93PWKXM-cPAdzSKXsYtspGFyQqQXM8QNSY
|
145 |
lm_eval/tasks/bigbench/generate_until/fantasy_reasoning.yaml |
sha256=JWzZtrvKJaXfBrC8-B2ClPUze2704DVXUpWioHKCo0M
|
155 |
lm_eval/tasks/bigbench/generate_until/few_shot_nlg.yaml |
sha256=jGqGMoegdMocHCIyV2HDHm6yrf-7h4N8JnzI028bWmY
|
145 |
lm_eval/tasks/bigbench/generate_until/figure_of_speech_detection.yaml |
sha256=l3ohFveEUwi8QceVaX1Ubpo0bgaJOJkmN20oFENc4GE
|
173 |
lm_eval/tasks/bigbench/generate_until/formal_fallacies_syllogisms_negation.yaml |
sha256=VW2iLQzYRtTXjvrCa2Xnz8wlpIyPhUvMfAf_3W_rHZg
|
193 |
lm_eval/tasks/bigbench/generate_until/gem.yaml |
sha256=ODcWuReD_irTxL7Om0YX1lwUPdgTvS4gfnq64_9RT9M
|
127 |
lm_eval/tasks/bigbench/generate_until/gender_inclusive_sentences_german.yaml |
sha256=N6yiMVWfYnYWXAku7GSw7PAw20_GJevKEF7Nln9s20o
|
187 |
lm_eval/tasks/bigbench/generate_until/general_knowledge.yaml |
sha256=0FoVsz9_Whmets9lZh3vpd7TxwclRTFMIT8tpn2iTqk
|
155 |
lm_eval/tasks/bigbench/generate_until/geometric_shapes.yaml |
sha256=tVKuLRsEGC6QEZINH_MJL9ouuGxYBuBcIoqf8Ry1CB0
|
153 |
lm_eval/tasks/bigbench/generate_until/goal_step_wikihow.yaml |
sha256=HefVYueV7Ib4olhFiPSnN-4tKk-wm2-TTOJZq13zDiY
|
155 |
lm_eval/tasks/bigbench/generate_until/gre_reading_comprehension.yaml |
sha256=imJmoGVFj12Yw1LFVNvOwMqmcjvPC0SfBwptLaX_Rj0
|
171 |
lm_eval/tasks/bigbench/generate_until/hhh_alignment.yaml |
sha256=u9i_BMm0zJiWEkU_IL36D1nf9TLqGXArxICZoMmyn6g
|
147 |
lm_eval/tasks/bigbench/generate_until/hindi_question_answering.yaml |
sha256=ed9fUg5xV9JFW_pI9slzBepyiTu-v1s5s3zu_M7JlCE
|
169 |
lm_eval/tasks/bigbench/generate_until/hindu_knowledge.yaml |
sha256=GyJkeBgssT8R04bTdYSQM4oa4v8JWpa2ILwVTvLjOyI
|
151 |
lm_eval/tasks/bigbench/generate_until/hinglish_toxicity.yaml |
sha256=F4y708uc0l1a5o1M6s_kSCpYNl3ivpwfWAgO7usZ8JQ
|
155 |
lm_eval/tasks/bigbench/generate_until/human_organs_senses.yaml |
sha256=AeQZPk72WRN9G2pj31CvgKiDEbEjSGMppYhni2Q_sVs
|
159 |
lm_eval/tasks/bigbench/generate_until/hyperbaton.yaml |
sha256=m_cFalqyG6dq_RoMUzTV9fiTFQQ2BssZfG071Zezlzo
|
141 |
lm_eval/tasks/bigbench/generate_until/identify_math_theorems.yaml |
sha256=buqbBDN-gZJY8mnG2IRHpUPbEFgz4e2amo_c1uQmIvE
|
165 |
lm_eval/tasks/bigbench/generate_until/identify_odd_metaphor.yaml |
sha256=EoTWJfETPJQIKFScOELfBno5wGMM0KSRUp5Ck8wDh_A
|
163 |
lm_eval/tasks/bigbench/generate_until/implicatures.yaml |
sha256=XDY-X3eUplOlnEY2WZis1uGjSU0GLg85c7krqgsGQg4
|
145 |
lm_eval/tasks/bigbench/generate_until/implicit_relations.yaml |
sha256=AxXDlJDpf_YQKJpvifStiRPiehlDl3L8_bo8i4EtY-c
|
157 |
lm_eval/tasks/bigbench/generate_until/intent_recognition.yaml |
sha256=QSsKdp83MAfBu2LSLUx2dPt1mENEZ5s4O3to4ntZolM
|
157 |
lm_eval/tasks/bigbench/generate_until/international_phonetic_alphabet_nli.yaml |
sha256=bPAQzEm6obZvwbxqzZGCDDKYJhasb9Esv6w7FVS5knI
|
191 |
lm_eval/tasks/bigbench/generate_until/international_phonetic_alphabet_transliterate.yaml |
sha256=ERiqN2vbxFHM3lbUyvWvm46ydMwxU7y1xa4hur8V3B0
|
211 |
lm_eval/tasks/bigbench/generate_until/intersect_geometry.yaml |
sha256=uq6hHt_p6HnyMFMN7XcS6Uhml-Ndv5a5l9TTaSzL-9Y
|
157 |
lm_eval/tasks/bigbench/generate_until/irony_identification.yaml |
sha256=3Lg0jMAk1-QXMo08j6T4weLkMU1xihyF94-61Y5cjCI
|
161 |
lm_eval/tasks/bigbench/generate_until/kanji_ascii.yaml |
sha256=ma-v7NMOLxNkdKYoRvL9OuEblQ7-l2O2O9bjPhIbyGQ
|
143 |
lm_eval/tasks/bigbench/generate_until/kannada.yaml |
sha256=y3M1MBUaQqV6b3cfumpigEoeq9m7j8qu2wqM8mjzeEE
|
135 |
lm_eval/tasks/bigbench/generate_until/key_value_maps.yaml |
sha256=YBdKpEXYUdrbg2YxcDpTheRCGtA8QQU_kMEyWfGaR7I
|
149 |
lm_eval/tasks/bigbench/generate_until/known_unknowns.yaml |
sha256=FSMjIyrW6Zq86r6PjPnC7GY7KnWQQukFsSkNRMXkIAI
|
149 |
lm_eval/tasks/bigbench/generate_until/language_games.yaml |
sha256=4vOMkyvPfKVTI-qWO_FfHnxH66nTN6qROPS5selFR-0
|
149 |
lm_eval/tasks/bigbench/generate_until/language_identification.yaml |
sha256=siO1slzacE_Qem-FuA5vwlRqfo_gHZsMCGrIjnA-JlY
|
167 |
lm_eval/tasks/bigbench/generate_until/linguistic_mappings.yaml |
sha256=9BAFhXST3cS9ktxMTB-qVF7lqN8NNEUN4L4JjhqSH5M
|
159 |
lm_eval/tasks/bigbench/generate_until/linguistics_puzzles.yaml |
sha256=5KGRhLH_mhvoGwdh_CFQTM5r9dPowCxOHzzzcSAkdh0
|
159 |
lm_eval/tasks/bigbench/generate_until/list_functions.yaml |
sha256=On2YeI3r2_s9bblbk-AoVp8jZsdmpH7JPTRxzLbLz9k
|
149 |
lm_eval/tasks/bigbench/generate_until/logic_grid_puzzle.yaml |
sha256=N7JKcaLTcZIxh6efPHG6grF_-Dia9TLDj6AINFyrgas
|
155 |
lm_eval/tasks/bigbench/generate_until/logical_args.yaml |
sha256=LeMAv4cqQynPdEgMjbX6DLUuHtE5be7VL3_TRgEBxcg
|
145 |
lm_eval/tasks/bigbench/generate_until/logical_deduction.yaml |
sha256=cMhraRNkbdmCn70YWUI3L5szUSZxF2BZ9dkb08x3otI
|
155 |
lm_eval/tasks/bigbench/generate_until/logical_fallacy_detection.yaml |
sha256=Plu8NPXtIwicj-ZOR-s-tUp8sQTRUSidXG13wkiybPU
|
171 |
lm_eval/tasks/bigbench/generate_until/logical_sequence.yaml |
sha256=oiqHok8TaV88QsPEmUtF8J_mx7XBBOO_kEi6MYFETcU
|
153 |
lm_eval/tasks/bigbench/generate_until/mathematical_induction.yaml |
sha256=AcUk2gvyYMBR2MXIxiswXjcbv4UITm2CU_RboxlfV34
|
165 |
lm_eval/tasks/bigbench/generate_until/matrixshapes.yaml |
sha256=oPNV1qhlRa0CStZy9CCOEyYPM1Q88mk51aJ8EEY-yeY
|
145 |
lm_eval/tasks/bigbench/generate_until/metaphor_boolean.yaml |
sha256=4pm8zy5rvB_f8jXoTBBLe_0gimdFwt7zkINpHdMztA0
|
153 |
lm_eval/tasks/bigbench/generate_until/metaphor_understanding.yaml |
sha256=eTWZ8H4boQ7GHOkRh8JiGNzpqMwV0-jy-pxs3ZEIE6k
|
165 |
lm_eval/tasks/bigbench/generate_until/minute_mysteries_qa.yaml |
sha256=-106CIqMUWgCr30EoCxvnjL3NnRwgqF4YzkXBjJKm7M
|
159 |
lm_eval/tasks/bigbench/generate_until/misconceptions.yaml |
sha256=GRaducmwu4DxLeIPTw6fcxOi5aEoNctq09pae_zlmIY
|
149 |
lm_eval/tasks/bigbench/generate_until/misconceptions_russian.yaml |
sha256=NXz_RMAGdhitHJUrOcyOs3lUJAR3BZczDkNh7wuRbrQ
|
165 |
lm_eval/tasks/bigbench/generate_until/mnist_ascii.yaml |
sha256=3ft522RKA2O6tkvjKFEUXR_ZeAHZyRmUYAVFacedIYs
|
143 |
lm_eval/tasks/bigbench/generate_until/modified_arithmetic.yaml |
sha256=tN48_TrYgL6NlmDnAFf4_ynOgjgf59tDjZaFMxiGXhs
|
159 |
lm_eval/tasks/bigbench/generate_until/moral_permissibility.yaml |
sha256=QWHphy2-qbjA6cVIBkv3jojENR-RtA6dxSFUtTaiMCE
|
161 |
lm_eval/tasks/bigbench/generate_until/movie_dialog_same_or_different.yaml |
sha256=izDgy0BjGi5gkJdKBFB6MT-vq2x97ktVkQHPYThzXpg
|
181 |
lm_eval/tasks/bigbench/generate_until/movie_recommendation.yaml |
sha256=Ls68uPStQfEA_cXXoHRltL_of6hPd4LCyz5z2FhAQfo
|
161 |
lm_eval/tasks/bigbench/generate_until/mult_data_wrangling.yaml |
sha256=tNqxoe0NI87WvxSOPS1JyUr1PCpU-UP-q19tmfeaU9Y
|
159 |
lm_eval/tasks/bigbench/generate_until/multiemo.yaml |
sha256=ntr6dACBtdAxlsVaCYxQ4ZYEEZ2Q1pf4jF00fiu7HFg
|
137 |
lm_eval/tasks/bigbench/generate_until/natural_instructions.yaml |
sha256=_W6euf1qNMYGfvy7VFPpSGTllBU3TnvQLEwnIzIjsKs
|
161 |
lm_eval/tasks/bigbench/generate_until/navigate.yaml |
sha256=SgxFNM3bs3Cbfcw2oE2uBj2vXsc0_NKW-R8n1IPbgMU
|
137 |
lm_eval/tasks/bigbench/generate_until/nonsense_words_grammar.yaml |
sha256=y7R8xHkK3Fg9Vwbs6MLI7nEk-v_lBkd3Qdpxw1TyKbg
|
165 |
lm_eval/tasks/bigbench/generate_until/novel_concepts.yaml |
sha256=Uw79SXkiEfDm0za-qLou47Vmp42R5necVDTOmIsNnwk
|
149 |
lm_eval/tasks/bigbench/generate_until/object_counting.yaml |
sha256=BPtUsBz3xxwrKC38WiDAP0Lz8Boh7rkMC0t4rWobGe0
|
151 |
lm_eval/tasks/bigbench/generate_until/odd_one_out.yaml |
sha256=0MPa0ZWseDqQZWxIiUVHPLyHaC0CDqDYP5_VJqML9eI
|
143 |
lm_eval/tasks/bigbench/generate_until/operators.yaml |
sha256=Xq2pA8FZ1d84z69QD0oXGH7hqs4fMLs-lxZpjwACBgY
|
139 |
lm_eval/tasks/bigbench/generate_until/paragraph_segmentation.yaml |
sha256=UEraXnlx1L9yNh0qQwsz63wJ0AzYlMwJ-m2NjZEning
|
165 |
lm_eval/tasks/bigbench/generate_until/parsinlu_qa.yaml |
sha256=BzriiMDmkFzK17iZEYiQmsK_QBfuBewrMNg8Jpanuq8
|
143 |
lm_eval/tasks/bigbench/generate_until/parsinlu_reading_comprehension.yaml |
sha256=HRPXjduxFQ66sJImYH00lc7JCNOYvu1Cp1OVpcHtC9Y
|
181 |
lm_eval/tasks/bigbench/generate_until/penguins_in_a_table.yaml |
sha256=AK27vKzGHc5dZmI_rUOaMb46gqArR93-qFAeWvc0LSM
|
159 |
lm_eval/tasks/bigbench/generate_until/periodic_elements.yaml |
sha256=W3ru5pbGYHFh3cXAWta5sqN6tPhrfZTr0hmXoftd0uk
|
155 |
lm_eval/tasks/bigbench/generate_until/persian_idioms.yaml |
sha256=4NV4ESKoI7a7EwwaMoP00HrhbF2n2fFcJDukwkrDjMc
|
149 |
lm_eval/tasks/bigbench/generate_until/phrase_relatedness.yaml |
sha256=hEoCjBW50vaQcu1EnVRxmHCglXGOJEQITX7ki8oQemY
|
157 |
lm_eval/tasks/bigbench/generate_until/physical_intuition.yaml |
sha256=4tnrOLP_uEpDciJaSe3bvAyw9V9BiEXIuNmy3CkGMRA
|
157 |
lm_eval/tasks/bigbench/generate_until/physics.yaml |
sha256=O1CzYMtf6bKfY8xCh8ozpMiGBeKJR2OoDiKnQvS3xro
|
135 |
lm_eval/tasks/bigbench/generate_until/physics_questions.yaml |
sha256=Y662E9Oe4bGLueoI3htoqKXQohzO5z1siHfkbkX_crk
|
155 |
lm_eval/tasks/bigbench/generate_until/play_dialog_same_or_different.yaml |
sha256=b2pdgfqb9rmc6zFhFh4OhofhuITnd-CagxP_62YP7_c
|
179 |
lm_eval/tasks/bigbench/generate_until/polish_sequence_labeling.yaml |
sha256=6syFTfP371tpGL08rlVUPSTGgRYOVs8H6qR-AWwNl9A
|
169 |
lm_eval/tasks/bigbench/generate_until/presuppositions_as_nli.yaml |
sha256=F8FjUkXb6KO7faXV_OA96c8C8mehFEGr75jng3A7QRE
|
165 |
lm_eval/tasks/bigbench/generate_until/qa_wikidata.yaml |
sha256=R9dHCcdvg2TzI2ZIyYMz9Va63qrW0XV-3pqDOzAVMMw
|
143 |
lm_eval/tasks/bigbench/generate_until/question_selection.yaml |
sha256=yy8sqV94vIr97h-srkXC0UXmrn_hCFwfXzuN24T2I84
|
157 |
lm_eval/tasks/bigbench/generate_until/real_or_fake_text.yaml |
sha256=BzT3eGjusHCJEkFGUWGKPVHk-Ty-kejnTO09ePPS2-8
|
155 |
lm_eval/tasks/bigbench/generate_until/reasoning_about_colored_objects.yaml |
sha256=rHAOlsYCbZi_7Q6CsDJfxHxW-cKMYM108TFrRV6ZtFc
|
183 |
lm_eval/tasks/bigbench/generate_until/repeat_copy_logic.yaml |
sha256=aMUsLN4oxqceJBjL42m22on1_4S6miTq4zNLWCKHJIE
|
155 |
lm_eval/tasks/bigbench/generate_until/rephrase.yaml |
sha256=o7I78PrOnUIxqFZ_lNt0twELTMrajUAvI1-HvTM0APM
|
137 |
lm_eval/tasks/bigbench/generate_until/riddle_sense.yaml |
sha256=eas5Zq3tq1xx03Qn8kB9mU1JbfV-KzY0SWnFTeomy8s
|
145 |
lm_eval/tasks/bigbench/generate_until/ruin_names.yaml |
sha256=CkUBCb63izgA8XIrA6Ipg_JEsTZUhTd2jvokluiT0ug
|
141 |
lm_eval/tasks/bigbench/generate_until/salient_translation_error_detection.yaml |
sha256=B4ODGvAsPK_yZhh6tdLwahQedWlrI8C747DnsEtMJ7Y
|
191 |
lm_eval/tasks/bigbench/generate_until/scientific_press_release.yaml |
sha256=nQqzGRcOY_34eihaI54wGGHxbZmjCiLIlhnTy5NDuRo
|
169 |
lm_eval/tasks/bigbench/generate_until/semantic_parsing_in_context_sparc.yaml |
sha256=IfY2K5ChSu7wJJocrAcFOqZZ6DJ2UbNQaVu1YmguN4k
|
187 |
lm_eval/tasks/bigbench/generate_until/semantic_parsing_spider.yaml |
sha256=9NQEKZEqKQIxzTB9yrVOL_n9gdzGCTEh_SM_8d54nxc
|
167 |
lm_eval/tasks/bigbench/generate_until/sentence_ambiguity.yaml |
sha256=UL89kpxCyDcc80GAvgeyrNSxb7up-Zg2r9vY-DIPOS8
|
157 |
lm_eval/tasks/bigbench/generate_until/similarities_abstraction.yaml |
sha256=TJ56BdnL4GqshtCAGMFhnAyoJLakYJjHEg8IjpjUbE4
|
169 |
lm_eval/tasks/bigbench/generate_until/simp_turing_concept.yaml |
sha256=VLUMGNwUn7UBmukWVTvm5FpnWwsgI05Sea-mycDxWeY
|
159 |
lm_eval/tasks/bigbench/generate_until/simple_arithmetic_json.yaml |
sha256=K-mgxW5WEvkTiuPSRLyrOYrQxNsNOKOCxy903yRsAHE
|
165 |
lm_eval/tasks/bigbench/generate_until/simple_arithmetic_json_multiple_choice.yaml |
sha256=E4ScDHW9xrHYoxX6tHpd9F5TelLTfF1FEkWKjiDrAow
|
197 |
lm_eval/tasks/bigbench/generate_until/simple_arithmetic_json_subtasks.yaml |
sha256=zrb7SPKYenklYrv5iYEJlhbmoj4hlTsO5LOYzEUaO9g
|
183 |
lm_eval/tasks/bigbench/generate_until/simple_arithmetic_multiple_targets_json.yaml |
sha256=hj5tcAejMWEqUpKb92vrxZdc3DmgQiV4wTGUxS0Ah_A
|
199 |
lm_eval/tasks/bigbench/generate_until/simple_ethical_questions.yaml |
sha256=W3Q1UG0OZafvdloI4_6KrKUqBWySFjB86ip0wzq1qCY
|
169 |
lm_eval/tasks/bigbench/generate_until/simple_text_editing.yaml |
sha256=9tauwNsCUcTjnjjmB7Ci1ffGJfT6kytRqruJQr9OsfI
|
159 |
lm_eval/tasks/bigbench/generate_until/snarks.yaml |
sha256=-xI33E-A5p91T-56El3AIwWq8BUaCMvea32zq0VzeS4
|
133 |
lm_eval/tasks/bigbench/generate_until/social_iqa.yaml |
sha256=m5y4-e6B9_hsHpO4N1xORqWMGNW26zqG4amCwQViMxs
|
141 |
lm_eval/tasks/bigbench/generate_until/social_support.yaml |
sha256=Rw5LSAeaKSqM4P-Bw7TFuyrH2LQHr4eHJU7iF46_HAY
|
149 |
lm_eval/tasks/bigbench/generate_until/sports_understanding.yaml |
sha256=THgiCQZQ7uXebiKfUfxMeoRn-wHj9YlbEDzEbUYPFks
|
161 |
lm_eval/tasks/bigbench/generate_until/strange_stories.yaml |
sha256=jmSfVWMoIj3671y9thmnqV8CRip8gEzxon2NPQy6EVg
|
151 |
lm_eval/tasks/bigbench/generate_until/strategyqa.yaml |
sha256=pvrWXwq87EQTrLZFlvrZwaUvL5S5fGic7ygFJRXH5cM
|
141 |
lm_eval/tasks/bigbench/generate_until/sufficient_information.yaml |
sha256=y7jEwlu2P7qgTjNiTJZ9H0jJQjnirAIlZTWVB_n5umg
|
165 |
lm_eval/tasks/bigbench/generate_until/suicide_risk.yaml |
sha256=tVTkOx8x631h4azG5yEH6k_tx8PINMgp5gJEAJNnsyY
|
145 |
lm_eval/tasks/bigbench/generate_until/swahili_english_proverbs.yaml |
sha256=p2-DYr3WcFI8WSzoh_6ztyYXPZwK15f1d-XXld6xDsQ
|
169 |
lm_eval/tasks/bigbench/generate_until/swedish_to_german_proverbs.yaml |
sha256=wR1R1kRuLai6rrIkL_X2qnjFecZpiBqSpE2Sl6_D5wE
|
173 |
lm_eval/tasks/bigbench/generate_until/symbol_interpretation.yaml |
sha256=4Eg8-UYe6AvRZVvoyw4pWg3G8SLvotH6Y-fy7t-hI5A
|
163 |
lm_eval/tasks/bigbench/generate_until/temporal_sequences.yaml |
sha256=gJ5NyIda1KbTaZ4DsUKm_TwZDervdNq_rThpzo5lPbo
|
157 |
lm_eval/tasks/bigbench/generate_until/tense.yaml |
sha256=eorYGhfu6AXOFeGLs2iMWVpoPYm_dyV4slefRIdJ0Zc
|
131 |
lm_eval/tasks/bigbench/generate_until/timedial.yaml |
sha256=Sp9BMfBIs4Bob-XdxDhqKdL_QVcHDsdj05hyeGp3pBs
|
137 |
lm_eval/tasks/bigbench/generate_until/topical_chat.yaml |
sha256=rcjpxp2ukXzx8nTEcQr4oYEo7TjiFGnHeYZU5oM12ZQ
|
145 |
lm_eval/tasks/bigbench/generate_until/tracking_shuffled_objects.yaml |
sha256=SCfecVUi2EGMRzune6kpya491RDXoyct3cbtc7A3C-A
|
171 |
lm_eval/tasks/bigbench/generate_until/understanding_fables.yaml |
sha256=vH8I0hlKQ5P8cOGUeI91NClne9qMSUTv7vT0wHK0Z88
|
161 |
lm_eval/tasks/bigbench/generate_until/undo_permutation.yaml |
sha256=9BHOlfV8xa5kjVW-uM635tkxDlTTuVFfwn5sw1XX8b4
|
153 |
lm_eval/tasks/bigbench/generate_until/unit_conversion.yaml |
sha256=wtTHImrbhNRkSHyF-5hQUvBE0Pdn574G5TIdom-VmfA
|
151 |
lm_eval/tasks/bigbench/generate_until/unit_interpretation.yaml |
sha256=9AHsHkx1dwuL2gfbLq8mduuitpKJgpD38xyWNTpfxPQ
|
159 |
lm_eval/tasks/bigbench/generate_until/unnatural_in_context_learning.yaml |
sha256=QDLLkgEaTMOQ67huKiLaC1puqfxBcd-W-5U1iIg0aOw
|
179 |
lm_eval/tasks/bigbench/generate_until/vitaminc_fact_verification.yaml |
sha256=UdngQIP7djwfw3Yr1n8OTDv5c5wa9vLKuuJXm_62Q2c
|
173 |
lm_eval/tasks/bigbench/generate_until/what_is_the_tao.yaml |
sha256=X2ONz9UFxL975TIiCk-L7C5wDRI3TUxN3LCVzCIBswo
|
151 |
lm_eval/tasks/bigbench/generate_until/which_wiki_edit.yaml |
sha256=11AwFg-8uyzYs01JdsTlD-76YJTy8QQElnBYtWTxZb0
|
151 |
lm_eval/tasks/bigbench/generate_until/winowhy.yaml |
sha256=339YOg_p3fq0a8-5mBkuruJintiUmhe4VzuC4JATV7Y
|
135 |
lm_eval/tasks/bigbench/generate_until/word_sorting.yaml |
sha256=sw0cqkQkb4K6yuQpa1HTDRPi36uQKfuJDnpTlHvTspM
|
145 |
lm_eval/tasks/bigbench/generate_until/word_unscrambling.yaml |
sha256=vLuTPnG1BzEJcMQwQF37FNPPcFgw9E73tY6i2Y5ABps
|
155 |
lm_eval/tasks/bigbench/multiple_choice/abstract_narrative_understanding.yaml |
sha256=wC1sP9TEDVeqNyIH22iaUsotWkGzOTKvbwgiqH968n0
|
187 |
lm_eval/tasks/bigbench/multiple_choice/anachronisms.yaml |
sha256=C7Je1VX1Oer2QQZ5oTUDaRrvXNVk0hm1v0i9V5ZizBg
|
147 |
lm_eval/tasks/bigbench/multiple_choice/analogical_similarity.yaml |
sha256=t7OKYASkSANtBukdp0rCrrb9mRnv9AVymxrpbiOpROk
|
165 |
lm_eval/tasks/bigbench/multiple_choice/analytic_entailment.yaml |
sha256=INZHBFKntYor3Y5jKmQcpfVfWNzKJa9UnSVP9YwfIS0
|
161 |
lm_eval/tasks/bigbench/multiple_choice/arithmetic.yaml |
sha256=2FBfcRxlIlMKiYcZpgbH1SJEdKysdCnqnqafTV4jdMw
|
143 |
lm_eval/tasks/bigbench/multiple_choice/ascii_word_recognition.yaml |
sha256=dWZZsykMhM60NfZVwuca4ZCsRMyIQm2y7xal9j5N0R8
|
167 |
lm_eval/tasks/bigbench/multiple_choice/authorship_verification.yaml |
sha256=gjE-K4rye_zIaKDlh8dYy-VwPjofrEl3MQH34Bru_t0
|
169 |
lm_eval/tasks/bigbench/multiple_choice/auto_categorization.yaml |
sha256=1Loa5kQ4sOzlqfcbUdrdTIL7uFkAwNdJRlW8ZHA0mrE
|
161 |
lm_eval/tasks/bigbench/multiple_choice/auto_debugging.yaml |
sha256=uvO9d4dm7ZSI9ExMlEVxHup4SEPMYsC9f-9pCjqhiak
|
151 |
lm_eval/tasks/bigbench/multiple_choice/bbq_lite_json.yaml |
sha256=PwESU5lyQ8jCt48M1CRu35zjrZe_1KJ0vRAkRsD344M
|
149 |
lm_eval/tasks/bigbench/multiple_choice/bridging_anaphora_resolution_barqa.yaml |
sha256=zRYUaV6tbiR4vzKE9WNfLuzVycUQgAC2wDrcQ46kQyA
|
191 |
lm_eval/tasks/bigbench/multiple_choice/causal_judgement.yaml |
sha256=AdWyVGyyZrKWGLbb91TmkdMhvxOWO-8R0tdzo6X9l-Q
|
154 |
lm_eval/tasks/bigbench/multiple_choice/causal_judgment.yaml |
sha256=cOoY9jmJRYkA1KGalJ7h8dBUpv9chuakALtfH08gw2w
|
153 |
lm_eval/tasks/bigbench/multiple_choice/cause_and_effect.yaml |
sha256=wCaVMnfOjvtrVugUuGtsFW6TS9rrJDY0sn3d6mgiz70
|
155 |
lm_eval/tasks/bigbench/multiple_choice/checkmate_in_one.yaml |
sha256=gDzulVCGouLHriNLgPs40lx_70LyQQt48yzZoU9mwr4
|
155 |
lm_eval/tasks/bigbench/multiple_choice/chess_state_tracking.yaml |
sha256=cpMuwLx4PM6LIZgLKxGFJ5bJbESrjJSwjtrYsi24hvo
|
163 |
lm_eval/tasks/bigbench/multiple_choice/chinese_remainder_theorem.yaml |
sha256=2kOE5oUeEIvF1T7QwbwbOs_YvWkz9LmRlD6oGAOG7aE
|
173 |
lm_eval/tasks/bigbench/multiple_choice/cifar10_classification.yaml |
sha256=aaF6C9Y0ShfklEKSBTV1Ge56N9hjGbUWoBhb-k0Q8BM
|
167 |
lm_eval/tasks/bigbench/multiple_choice/code_line_description.yaml |
sha256=S1035NWJpfsH422H5l0ODN5IYD--TmpCRQ2oYjxwKDM
|
165 |
lm_eval/tasks/bigbench/multiple_choice/codenames.yaml |
sha256=g9ZH3kojjsJIInfiG_8jQ59lRYE58Beo_vM9-u01tWo
|
141 |
lm_eval/tasks/bigbench/multiple_choice/color.yaml |
sha256=AQVs0lfVjCKmQVxD21lZ0wvt05IT5zj8hKTBJHIyo-M
|
133 |
lm_eval/tasks/bigbench/multiple_choice/common_morpheme.yaml |
sha256=1lMuopdW2sXoOl0seZam01J5QLoGQcin6dcak6aIUqY
|
153 |
lm_eval/tasks/bigbench/multiple_choice/conceptual_combinations.yaml |
sha256=AUk3ixDxwC2d2mmyy0vgBHlvdF8WrZ8CQEVYw_-IRKk
|
169 |
lm_eval/tasks/bigbench/multiple_choice/conlang_translation.yaml |
sha256=hMZ4TDw66UMt95YDTdzOd8xND9dMboYKRNmHlVZMtwk
|
161 |
lm_eval/tasks/bigbench/multiple_choice/contextual_parametric_knowledge_conflicts.yaml |
sha256=vtAoTqjUA-LA-6Ha2NTU4mp4sLj8tJ3Pnp6VSiojCjE
|
205 |
lm_eval/tasks/bigbench/multiple_choice/crash_blossom.yaml |
sha256=TrQV25mnyMHwd_ScNwn5mS8I5P-p3Eh7udUJkdUsWQE
|
149 |
lm_eval/tasks/bigbench/multiple_choice/crass_ai.yaml |
sha256=40zHsjc3Kwzx4pEHE3EHbmKse2OWlLvVpUio6s9TSME
|
139 |
lm_eval/tasks/bigbench/multiple_choice/cryobiology_spanish.yaml |
sha256=vQmzgs2Qc6HggqhLO6gnhSMZ9TQLia234w3l-3YM5yg
|
161 |
lm_eval/tasks/bigbench/multiple_choice/cryptonite.yaml |
sha256=B7W_fs7aBd3bdNrESbV_hN3FinjmtSkQJBIfpLJx-rM
|
143 |
lm_eval/tasks/bigbench/multiple_choice/cs_algorithms.yaml |
sha256=CBAuNg7LJg_ZkOcwToxUiyx9J9UYL_ZywFBF76RUOW8
|
149 |
lm_eval/tasks/bigbench/multiple_choice/dark_humor_detection.yaml |
sha256=ZR7uOXffiox0IEVWYkXOT7SdIQnDcJagKX7VBi67ZIw
|
163 |
lm_eval/tasks/bigbench/multiple_choice/date_understanding.yaml |
sha256=MCTeid6Oka450ykNY7W3_R0A_PQJho22VFmCeHIfbYo
|
159 |
lm_eval/tasks/bigbench/multiple_choice/disambiguation_qa.yaml |
sha256=JcqPKhHYk16GrGPoayMtU3GfobU9q4_CJls75HEO2vU
|
157 |
lm_eval/tasks/bigbench/multiple_choice/discourse_marker_prediction.yaml |
sha256=xiBp0rF6bDNiK29LA_3e3F4z2XBpP4Q04ui8swgUdOM
|
177 |
lm_eval/tasks/bigbench/multiple_choice/disfl_qa.yaml |
sha256=FT-7_mTAmg2G8cnkBdC_WM7K48XGVOIYrNPyZU4yKgI
|
139 |
lm_eval/tasks/bigbench/multiple_choice/dyck_languages.yaml |
sha256=zoC2Wr7zftGCJ7Vxz9n-uKnsyC41MEa8qWFzCq0Iw-Q
|
151 |
lm_eval/tasks/bigbench/multiple_choice/elementary_math_qa.yaml |
sha256=bl0WofRVx69oiYan7-6E4GyIy9O06MbN-ufJQOwC4xw
|
159 |
lm_eval/tasks/bigbench/multiple_choice/emoji_movie.yaml |
sha256=5bb5pq4ODf2K0KvBKxuS8wzNyiTfCnacRGzlr_FL0ao
|
145 |
lm_eval/tasks/bigbench/multiple_choice/emojis_emotion_prediction.yaml |
sha256=m4nNGvxS2WQvxPnL8zraYKMT_G-Ech-YQpJPHNBOOx4
|
173 |
lm_eval/tasks/bigbench/multiple_choice/empirical_judgments.yaml |
sha256=LW2ualE3N4kwkHVrI0d6EoyGMYW2w9zAHeZSblMoBY4
|
161 |
lm_eval/tasks/bigbench/multiple_choice/english_proverbs.yaml |
sha256=pvklpKxfGJPON-55U-u_OpuX6TjeiFAwaZG9DoYWsL8
|
155 |
lm_eval/tasks/bigbench/multiple_choice/english_russian_proverbs.yaml |
sha256=LaXw7JBMw9wYRSQ5Oc6UcVRWRObxK-YZZuET8RnImNE
|
171 |
lm_eval/tasks/bigbench/multiple_choice/entailed_polarity.yaml |
sha256=O4jpB-YazafZ2eMfAP_X5V6km3_SYrVM8TQr20kgsDM
|
157 |
lm_eval/tasks/bigbench/multiple_choice/entailed_polarity_hindi.yaml |
sha256=XMv0z940AAAPrLUOLbzx30hK1nto1eOHdHtFmpZjiHo
|
169 |
lm_eval/tasks/bigbench/multiple_choice/epistemic_reasoning.yaml |
sha256=V5TJetxQ2yrJ6-wKdocsee7IQ5RCDFEyCyAyxrJKCJg
|
161 |
lm_eval/tasks/bigbench/multiple_choice/evaluating_information_essentiality.yaml |
sha256=tvkY6sCaIJ8__vR6s-KwEd98-ratIPCoqRt3aDJGiqk
|
193 |
lm_eval/tasks/bigbench/multiple_choice/fact_checker.yaml |
sha256=PsjpCG1Lr4TyF0j4g3qafA9JilHA-gkOk4UFJBi26Jg
|
147 |
lm_eval/tasks/bigbench/multiple_choice/fantasy_reasoning.yaml |
sha256=WV-E_5iU6mzN6TuVx5tzxQHoj4eRECe1nGvBYchoKWM
|
157 |
lm_eval/tasks/bigbench/multiple_choice/few_shot_nlg.yaml |
sha256=jyhPKTSznBwm-Wc4qZL-oRNuW_bX0EHm_Ub5yPQNrkc
|
147 |
lm_eval/tasks/bigbench/multiple_choice/figure_of_speech_detection.yaml |
sha256=M_04O90Pe0ouz3C1hB9cr3OHCpDBg6uEwmov0WmpG1w
|
175 |
lm_eval/tasks/bigbench/multiple_choice/formal_fallacies_syllogisms_negation.yaml |
sha256=kYQBuhXwGX4rkfsH5-xl8a89clZ44J2yDRDXWaEWxlo
|
195 |
lm_eval/tasks/bigbench/multiple_choice/gem.yaml |
sha256=p5K2HUddtwio3c-BDgWgXA1IakG9WRxxWwlrkk6DhZE
|
129 |
lm_eval/tasks/bigbench/multiple_choice/gender_inclusive_sentences_german.yaml |
sha256=M8fGO2pAf24VVLe475dPNULbbfS8VKqo4kJavuCPiMc
|
189 |
lm_eval/tasks/bigbench/multiple_choice/general_knowledge.yaml |
sha256=c0wF8hScD69clivEqyHCrS-q54U3HXxkSdaTnF6Japs
|
157 |
lm_eval/tasks/bigbench/multiple_choice/geometric_shapes.yaml |
sha256=fC2JycgGzSw7Mv2Rtrm9LuzBMPOQ7GOsbvn6BTFPWYM
|
155 |
lm_eval/tasks/bigbench/multiple_choice/goal_step_wikihow.yaml |
sha256=YKxtalWZL4K1_ZsWc-LjcuoCcA4zZrJo9k2j6Gwf-H0
|
157 |
lm_eval/tasks/bigbench/multiple_choice/gre_reading_comprehension.yaml |
sha256=fP4Je-tWun2_aVA9t5VdgVQhxr_XV6dFpOqN8gOmQHs
|
173 |
lm_eval/tasks/bigbench/multiple_choice/hhh_alignment.yaml |
sha256=_tUXB6FyCm4FhrzdvGCGToZ9Uel7iiT9bTYhcctmxcc
|
149 |
lm_eval/tasks/bigbench/multiple_choice/hindi_question_answering.yaml |
sha256=OoSurgrc790dPRWg_xpYhqCpqYwKgzCtc5UQNVhQC2Y
|
171 |
lm_eval/tasks/bigbench/multiple_choice/hindu_knowledge.yaml |
sha256=mR19KJvjc1Zfu1iTZ_XXJEHhGceewlaIor23i9NFT-4
|
153 |
lm_eval/tasks/bigbench/multiple_choice/hinglish_toxicity.yaml |
sha256=yFWbJIcU7bixzLbEhGB8jTh_zfufQDN9pb9RHsjI3is
|
157 |
lm_eval/tasks/bigbench/multiple_choice/human_organs_senses.yaml |
sha256=AN-lVocUpTUEXbxlXETc9wvbtI4VlQRbam4yJ8DuAa8
|
161 |
lm_eval/tasks/bigbench/multiple_choice/hyperbaton.yaml |
sha256=cD8xjAZ2PkPaNci9URLHuJp6ycFqBaFItFDx1CbMnIU
|
143 |
lm_eval/tasks/bigbench/multiple_choice/identify_math_theorems.yaml |
sha256=fuAPHAn6v_4nsTlMViKA--Oir38GoRFdRsjbgXajIYU
|
167 |
lm_eval/tasks/bigbench/multiple_choice/identify_odd_metaphor.yaml |
sha256=abV3gYfcE6CkeVu_VHw34PHOKB-lqxpIVUbpS5_KECg
|
165 |
lm_eval/tasks/bigbench/multiple_choice/implicatures.yaml |
sha256=wxZTAm9VbfCWoxE1jU9k3nzy4njiLbQf6syZJHoKT5A
|
147 |
lm_eval/tasks/bigbench/multiple_choice/implicit_relations.yaml |
sha256=qCOpepGcuNlXEkSXzQ8kWBhMd5SxMH21Qe4rOkQruzs
|
159 |
lm_eval/tasks/bigbench/multiple_choice/intent_recognition.yaml |
sha256=NgkXv5sA4F6tA7yW6NVdGolTURrf9_2hr4-qGzgl4RI
|
159 |
lm_eval/tasks/bigbench/multiple_choice/international_phonetic_alphabet_nli.yaml |
sha256=ikVnfnKZMzeuE2DxWfdyHxN2I78_o2WbOiQmyZdAmIY
|
193 |
lm_eval/tasks/bigbench/multiple_choice/international_phonetic_alphabet_transliterate.yaml |
sha256=Q9G0lf0IolZ6zI5Kql6WiTdIU1LXOhdvGgnFDMzSh2g
|
213 |
lm_eval/tasks/bigbench/multiple_choice/intersect_geometry.yaml |
sha256=AMQk-kMyhzMYRKXMPwVjRw81vz5SbzdJKv3n3DVhE-s
|
159 |
lm_eval/tasks/bigbench/multiple_choice/irony_identification.yaml |
sha256=9uJjn9cc_1FKV0B6Q_RApFQFLgOWg5epCthdFy4OxbQ
|
163 |
lm_eval/tasks/bigbench/multiple_choice/kanji_ascii.yaml |
sha256=OiDkSbsojWXhvuXd1hm-gg0FDAM1gIFi3ZgIqSCZ7Ak
|
145 |
lm_eval/tasks/bigbench/multiple_choice/kannada.yaml |
sha256=9r5l-ePBRwIct7oCLnbcAd1Go7YjdT4_49VFW9MZUFg
|
137 |
lm_eval/tasks/bigbench/multiple_choice/key_value_maps.yaml |
sha256=oDwDxjIHL_xoL59erf39h02ktA175lz3AwVmdQO4EBY
|
151 |
lm_eval/tasks/bigbench/multiple_choice/known_unknowns.yaml |
sha256=zqJ_y82QBR49vIjl-nXaMztSnmQHZyt89iYduvODAJI
|
151 |
lm_eval/tasks/bigbench/multiple_choice/language_games.yaml |
sha256=uNakbVpnDGUANSXyjC2Soq2AhojHJxdP8nUtZtoQCZ8
|
151 |
lm_eval/tasks/bigbench/multiple_choice/language_identification.yaml |
sha256=H9R_FN6zSJ-r1PJuxzLj-Zokaz_h_SnFL5-TOqsXgrk
|
169 |
lm_eval/tasks/bigbench/multiple_choice/linguistic_mappings.yaml |
sha256=1Gg8iqLbb_Q1loJ3D6vrp1cG_RPMiJ_lidRaDmXmQjY
|
161 |
lm_eval/tasks/bigbench/multiple_choice/linguistics_puzzles.yaml |
sha256=IFwKu0pmpWcPPfw2mlB-vHJQdnc2UeGOnFpJW862ejQ
|
161 |
lm_eval/tasks/bigbench/multiple_choice/list_functions.yaml |
sha256=YnjOU3p7YZ6H-b-3pe7JpxqU7n38vDRUujHvFeGg9rg
|
151 |
lm_eval/tasks/bigbench/multiple_choice/logic_grid_puzzle.yaml |
sha256=tTzJVoptnvAXvHrSa_p8SQBitcqm33N7xj19c5-k958
|
157 |
lm_eval/tasks/bigbench/multiple_choice/logical_args.yaml |
sha256=EXkFCjB2ZwgQbaFRueg0GAU0YeaShfIg7Hntr6qLl6c
|
147 |
lm_eval/tasks/bigbench/multiple_choice/logical_deduction.yaml |
sha256=CkQfV5G0ODHf2-jsn-kGQpWVn_XZxvCQMC51FLB_-2I
|
157 |
lm_eval/tasks/bigbench/multiple_choice/logical_fallacy_detection.yaml |
sha256=38FqX9n3B7vCiAipQOBy0h-U196BkXJbLYas9QQf_lU
|
173 |
lm_eval/tasks/bigbench/multiple_choice/logical_sequence.yaml |
sha256=svmGHJqVBczZFAJIlLEr1ZkXeww14sJmlSO0Q3mPSNo
|
155 |
lm_eval/tasks/bigbench/multiple_choice/mathematical_induction.yaml |
sha256=WlHISjFdS1bDDWcXaunC_YCxR8xiwDMywcK1V5oTjSs
|
167 |
lm_eval/tasks/bigbench/multiple_choice/matrixshapes.yaml |
sha256=dRaQ7CK36fOGIgxjQpqbL0G54sCruap1erCqwjKn8II
|
147 |
lm_eval/tasks/bigbench/multiple_choice/metaphor_boolean.yaml |
sha256=6zPIyGfa2_1F0izqys2BA_oPRqP6bkuG8mn1sr-SSO8
|
155 |
lm_eval/tasks/bigbench/multiple_choice/metaphor_understanding.yaml |
sha256=gDPNGHax72oqSOG9FEZtb4o1RwnQFRnWxtpP21MtTGA
|
167 |
lm_eval/tasks/bigbench/multiple_choice/minute_mysteries_qa.yaml |
sha256=uxFxZS1VCrFTzlCNIZySELdJwBySfiy49d9sDl0PxIQ
|
161 |
lm_eval/tasks/bigbench/multiple_choice/misconceptions.yaml |
sha256=hD9u1UkaUMCrBOo4hQ3aqGaXn2OsYWx9BHehVbmR8SQ
|
151 |
lm_eval/tasks/bigbench/multiple_choice/misconceptions_russian.yaml |
sha256=RyOFlUECkBfgXVwINo6nb4LZGIGEHvEOf3QXRPuHqgo
|
167 |
lm_eval/tasks/bigbench/multiple_choice/mnist_ascii.yaml |
sha256=d82XP_zCc1BVX62ACAtwRFqTknRUiBdA8e_dfG8mDDU
|
145 |
lm_eval/tasks/bigbench/multiple_choice/modified_arithmetic.yaml |
sha256=k9XOUspUkQgwPr6zq8x_thAYCKCXWQnI42WObqza1cA
|
161 |
lm_eval/tasks/bigbench/multiple_choice/moral_permissibility.yaml |
sha256=gwWRvZfl3EB6KfqPgeYopWi0selkq6TUoOwT2yIu-N8
|
163 |
lm_eval/tasks/bigbench/multiple_choice/movie_dialog_same_or_different.yaml |
sha256=rbRbTacFYTA4w0IiCDwu-BV3cXdoTyUHaiZBw_da3KM
|
183 |
lm_eval/tasks/bigbench/multiple_choice/movie_recommendation.yaml |
sha256=Q_m6rVIIAYrScV9rOL-whs2uQpI_SS_PfzlRvguOSEo
|
163 |
lm_eval/tasks/bigbench/multiple_choice/mult_data_wrangling.yaml |
sha256=qqn2a0LC4p3RZfCr0zPwK3RrH3ujzASfFzWZBouJMlc
|
161 |
lm_eval/tasks/bigbench/multiple_choice/multiemo.yaml |
sha256=mQiAx9YxXNa7KIiQOq5-xsw6H3orqeTKaTWUMVQ-eH4
|
139 |
lm_eval/tasks/bigbench/multiple_choice/natural_instructions.yaml |
sha256=Xkz8HRANNey5ai4RDCKq74SKvjDiAgFCnOtc2cpW_KY
|
163 |
lm_eval/tasks/bigbench/multiple_choice/navigate.yaml |
sha256=4w-tghcD6TA82faIKLv7a788eeunV9xLpZuEgv-_fPQ
|
139 |
lm_eval/tasks/bigbench/multiple_choice/nonsense_words_grammar.yaml |
sha256=WcvwDGDH3ngMkubAv-OwJotfPospfM0g9sQvt28zcDI
|
167 |
lm_eval/tasks/bigbench/multiple_choice/novel_concepts.yaml |
sha256=70FLoqaSM9FuJcw3Inq0_lDlq9kOhZKA9LRP3pyMkTg
|
151 |
lm_eval/tasks/bigbench/multiple_choice/object_counting.yaml |
sha256=FgmaBFkmloF4vO_ggHuFZAZ0y63SP7jFcROGEQa5K4Q
|
153 |
lm_eval/tasks/bigbench/multiple_choice/odd_one_out.yaml |
sha256=pNe2yMix9NoxFR1uFGMvmGJ-XXaf-k91GqhVGqx8IIo
|
145 |
lm_eval/tasks/bigbench/multiple_choice/operators.yaml |
sha256=dynr_XiyX2B3YdNH0aYHumgStnqf1Xlc1tEqnaLNSwU
|
141 |
lm_eval/tasks/bigbench/multiple_choice/paragraph_segmentation.yaml |
sha256=pzkd799eOlhMSs1plT9VKX2va6QR8pGw-G3ZQ7fJdSY
|
167 |
lm_eval/tasks/bigbench/multiple_choice/parsinlu_qa.yaml |
sha256=AVBwt6tCfZ0laBosVW5MQ9ko8487szfZPWs3EvDIKEY
|
145 |
lm_eval/tasks/bigbench/multiple_choice/parsinlu_reading_comprehension.yaml |
sha256=5FOCYca9TArYrwVDhW-j8gVNDdh7gj2Xx5bNU05NrLE
|
183 |
lm_eval/tasks/bigbench/multiple_choice/penguins_in_a_table.yaml |
sha256=oL_-N96gKsrGBfBg2UD6ct3hU1gh51gvXpKoCGD0DuY
|
161 |
lm_eval/tasks/bigbench/multiple_choice/periodic_elements.yaml |
sha256=HypvcUcCkflKLvsZFP9_OmmWmNCpHN2oflxSs-0se4k
|
157 |
lm_eval/tasks/bigbench/multiple_choice/persian_idioms.yaml |
sha256=S_f8iqKOnKJ4lHG5egkLDgO3XqQhz8eluPDizWvvyhw
|
151 |
lm_eval/tasks/bigbench/multiple_choice/phrase_relatedness.yaml |
sha256=SbcRCbbvr50IkMhdJOYh6Ut2hvIv6tKAr-H6Ly0xVn4
|
159 |
lm_eval/tasks/bigbench/multiple_choice/physical_intuition.yaml |
sha256=itDxp960hGYTGOecgg4_SIvnVUJWD2oGK0VS1bwfFvc
|
159 |
lm_eval/tasks/bigbench/multiple_choice/physics.yaml |
sha256=zp1ylYAHchQc_NZI_80znXr3x1Keaith7F7FZWixdZY
|
137 |
lm_eval/tasks/bigbench/multiple_choice/physics_questions.yaml |
sha256=KAOHwtZhxcs1OM9zHkTjLKih8qFPR6UTuY5xs0J1QM0
|
157 |
lm_eval/tasks/bigbench/multiple_choice/play_dialog_same_or_different.yaml |
sha256=XARNBYPXja_b1ve7ivRgjY40Rs_sY0-Ypb4wR10HJos
|
181 |
lm_eval/tasks/bigbench/multiple_choice/polish_sequence_labeling.yaml |
sha256=6mgV-tUc9a9al1MqQuPMBRTHnADYjcmOb2wiZ2aKPTs
|
171 |
lm_eval/tasks/bigbench/multiple_choice/presuppositions_as_nli.yaml |
sha256=nxOBZPZEZiW3U3oehpw__LgpohBZqtw6C228vfWkpOI
|
167 |
lm_eval/tasks/bigbench/multiple_choice/qa_wikidata.yaml |
sha256=AQqA32tK3YV35djuf0xguKYGjUlYu7aF7nzYNVLv3zY
|
145 |
lm_eval/tasks/bigbench/multiple_choice/question_selection.yaml |
sha256=-We9wR4lHJ8Mt876ASjZ-BCqDgVJ3rxjetwkhDN6m44
|
159 |
lm_eval/tasks/bigbench/multiple_choice/real_or_fake_text.yaml |
sha256=sXE9yUoZP_zLenXb3elDIqkbqWliUCGgbj-2zJaZ1j0
|
157 |
lm_eval/tasks/bigbench/multiple_choice/reasoning_about_colored_objects.yaml |
sha256=GxUoDPDFc1X_A8t6Ry0U2ik4nFPCPD_rcRb2NzSazpQ
|
185 |
lm_eval/tasks/bigbench/multiple_choice/repeat_copy_logic.yaml |
sha256=zwE2sFi9wS_uSfJuk06Pp-iwMU9kKHZ-Hycdl0XzlmI
|
157 |
lm_eval/tasks/bigbench/multiple_choice/rephrase.yaml |
sha256=765_dob8s3IUxEIBnEjXROaraac0MXMJsIO6427AHlQ
|
139 |
lm_eval/tasks/bigbench/multiple_choice/riddle_sense.yaml |
sha256=3YmY87ChwiGd7QR4svwruN7uTbHc9SO2GrY5P27R6hY
|
147 |
lm_eval/tasks/bigbench/multiple_choice/ruin_names.yaml |
sha256=FftjCDl4NT38Y9OGqXK8DPpJMlpiuIrCgFmHf4dUPIc
|
143 |
lm_eval/tasks/bigbench/multiple_choice/salient_translation_error_detection.yaml |
sha256=cwqUPYs4ABD4Up3p5Zoc9o1eRWIDWJeF6LCqlzYbnsA
|
193 |
lm_eval/tasks/bigbench/multiple_choice/scientific_press_release.yaml |
sha256=K-hSiBHahbEHsTRZcRlrLiTgr40LpSz2XqxelmVpPkg
|
171 |
lm_eval/tasks/bigbench/multiple_choice/semantic_parsing_in_context_sparc.yaml |
sha256=e4rUYPAz9NKdHyJuVNm8aOCc5wvJfCufbkBgDOdcuxo
|
189 |
lm_eval/tasks/bigbench/multiple_choice/semantic_parsing_spider.yaml |
sha256=03wphaTbuRbJjPimKY46pZyR7xYXtinoazFm9y8W3UU
|
169 |
lm_eval/tasks/bigbench/multiple_choice/sentence_ambiguity.yaml |
sha256=JE1-08FYW-dxEOpx5bpZezg7bv7PGXxKrPJy6-YyBls
|
159 |
lm_eval/tasks/bigbench/multiple_choice/similarities_abstraction.yaml |
sha256=mSSvLTS_klQJnnJ5XyivY35lRjPBlnMaIRZm1qksNNE
|
171 |
lm_eval/tasks/bigbench/multiple_choice/simp_turing_concept.yaml |
sha256=PCjOzMdvflXFY80rT2mUEqrRSUSjpV2G4nBvJrg-7bY
|
161 |
lm_eval/tasks/bigbench/multiple_choice/simple_arithmetic_json.yaml |
sha256=Vn-qd71dMDRG_O8qW3RWNw18RfzRfh_WAbX8uIWdJ-4
|
167 |
lm_eval/tasks/bigbench/multiple_choice/simple_arithmetic_json_multiple_choice.yaml |
sha256=z-7I7haN3gbj-ob7HpXEcc3BGHi54Rcpx4vUuklopXY
|
199 |
lm_eval/tasks/bigbench/multiple_choice/simple_arithmetic_json_subtasks.yaml |
sha256=scaWSib2RTInLTPq9QTjP9jqFuGrswRjoG1ldf7ZV40
|
185 |
lm_eval/tasks/bigbench/multiple_choice/simple_arithmetic_multiple_targets_json.yaml |
sha256=c_5j1thsZWGPpN587L9wwTvGXJtn0bXHwsPkQti-Gtc
|
201 |
lm_eval/tasks/bigbench/multiple_choice/simple_ethical_questions.yaml |
sha256=AoEpxT-BJNoK14erRJF2KMRHhxYQknT8RlKyFfUo464
|
171 |
lm_eval/tasks/bigbench/multiple_choice/simple_text_editing.yaml |
sha256=iQ2dhZDQmVjwI45MNA4tq6QSUteDHZhrAA26AUcolfM
|
161 |
lm_eval/tasks/bigbench/multiple_choice/snarks.yaml |
sha256=6fzQ534gJ258GBeQ_dAfY6XDWO_4iiFCqnk25UoLaw8
|
135 |
lm_eval/tasks/bigbench/multiple_choice/social_iqa.yaml |
sha256=9YXML6u8TMjEXmgoiCCaxPuwWAkI3D_hZ7DSFHgXOBM
|
143 |
lm_eval/tasks/bigbench/multiple_choice/social_support.yaml |
sha256=0DtPajyURdrecK8iK_a1rHn0CGSVl0AV4P-ZHsdYX90
|
151 |
lm_eval/tasks/bigbench/multiple_choice/sports_understanding.yaml |
sha256=tMqTvRUO8LkLwBlETT0gifsPuVhGPloBALx0RFUbiDg
|
163 |
lm_eval/tasks/bigbench/multiple_choice/strange_stories.yaml |
sha256=tg_ziIxDWhe-gKEZhXmPYBPjxEO5eLBIxZt0jNamWJs
|
153 |
lm_eval/tasks/bigbench/multiple_choice/strategyqa.yaml |
sha256=qpCs5rUpwnwaxM2-WwoD7d_dcGyRNj9udfj3YgPg0XA
|
143 |
lm_eval/tasks/bigbench/multiple_choice/sufficient_information.yaml |
sha256=6ELBpj2L4d328g-i3VBD4TdF-bbluyLMwvxbeEosXS4
|
167 |
lm_eval/tasks/bigbench/multiple_choice/suicide_risk.yaml |
sha256=6gP5J1tuQZbJV0GzM1EF0d6_YvK9_oQ_Ql4R8AiPQEk
|
147 |
lm_eval/tasks/bigbench/multiple_choice/swahili_english_proverbs.yaml |
sha256=wMNK9p2Pj30r66cn1zvSShLSux0RfFuVfNqWwGB70UA
|
171 |
lm_eval/tasks/bigbench/multiple_choice/swedish_to_german_proverbs.yaml |
sha256=5XxtyZUUBNpHkfQnyuxGO8vkJFeOk4TC_UPy_CQCT8M
|
175 |
lm_eval/tasks/bigbench/multiple_choice/symbol_interpretation.yaml |
sha256=8VX_GFgr3i6Dc8tn0VOeIQ_wNzKbsLZsEXwNywbDSV0
|
165 |
lm_eval/tasks/bigbench/multiple_choice/temporal_sequences.yaml |
sha256=H0WwLH2bVviU4DCJG84cdRj7S_O--KFo0ibF2Marr5g
|
159 |
lm_eval/tasks/bigbench/multiple_choice/tense.yaml |
sha256=Bruxfq7hLnGRQgBe3wP2dTuNi-lEEBLZkB0OtcOwDG0
|
133 |
lm_eval/tasks/bigbench/multiple_choice/timedial.yaml |
sha256=AydfQAj3ZiDrUzOCHOnVRNrza3UbwsLgNvnEtboFK2E
|
139 |
lm_eval/tasks/bigbench/multiple_choice/topical_chat.yaml |
sha256=buvC9ck4McRAUL7hO2q-C3tbOZ4IRhtrvFoX5d98tRE
|
147 |
lm_eval/tasks/bigbench/multiple_choice/tracking_shuffled_objects.yaml |
sha256=q4HsGJ0s0z8nQ4igwGUukttJBuMkiJc926OPME6UE-Q
|
173 |
lm_eval/tasks/bigbench/multiple_choice/understanding_fables.yaml |
sha256=vrKXG8Y9kVogHrp0FnMYarytSJLGD2QcGldbhWbX98U
|
163 |
lm_eval/tasks/bigbench/multiple_choice/undo_permutation.yaml |
sha256=obnLt5OywuNhhELip5jNgotWCwAHzd6IrVgWkZzmMPY
|
155 |
lm_eval/tasks/bigbench/multiple_choice/unit_conversion.yaml |
sha256=0GFL35T0IRYgMNMss-LLQwmdANbdhFJ-NEUYspB9pHc
|
153 |
lm_eval/tasks/bigbench/multiple_choice/unit_interpretation.yaml |
sha256=vLqDPIdMj8FlMq5AQUXyz7o7k0lGC4_BLop9TRNALgM
|
161 |
lm_eval/tasks/bigbench/multiple_choice/unnatural_in_context_learning.yaml |
sha256=sF8nmC30vsXZR1Xn-a1m5mAXC-lrqs18_t20qJ1cw94
|
181 |
lm_eval/tasks/bigbench/multiple_choice/vitaminc_fact_verification.yaml |
sha256=1sZ7XhrJGGbicdOJbJxl61yTzy0nez3wMNvr8DtoR10
|
175 |
lm_eval/tasks/bigbench/multiple_choice/what_is_the_tao.yaml |
sha256=g4sj5BjHAlbLqt5KBrvXT3jAvofFobdIacNmfugmcAE
|
153 |
lm_eval/tasks/bigbench/multiple_choice/which_wiki_edit.yaml |
sha256=AHNB5MgzPP6hC79ktaPGcCrTNHnklYxiU25R1ACdEAc
|
153 |
lm_eval/tasks/bigbench/multiple_choice/winowhy.yaml |
sha256=jD95Obu3GrnKP_oZL26NrOAvznQJV0274KmLlg_wM1k
|
137 |
lm_eval/tasks/bigbench/multiple_choice/word_sorting.yaml |
sha256=WJctV0okW4jjU3HgprNUyNc9yeFan109eC77Bayq9tk
|
147 |
lm_eval/tasks/bigbench/multiple_choice/word_unscrambling.yaml |
sha256=560CY4-vhF5C97RpIDVjaht1RchocipGDvlmimZp_ZQ
|
157 |
lm_eval/tasks/blimp/README.md |
sha256=DWssG7sScoVaJep8XMGuh7q4ypM9m0evl9YzvnxgFeA
|
2920 |
lm_eval/tasks/blimp/_template_yaml |
sha256=HuzVLND1ZxXBKKgerkw-LwF7TbQRevwDaMwMzdWgnYI
|
333 |
lm_eval/tasks/blimp/adjunct_island.yaml |
sha256=-9lX4hPdterByJxKE5g0rKbduMM19WgtEMvblkzv68s
|
104 |
lm_eval/tasks/blimp/anaphor_gender_agreement.yaml |
sha256=YvC5NfoTfaIQ8YEYSXDsj3nUph38cVyV6V6j8zDmmrM
|
124 |
lm_eval/tasks/blimp/anaphor_number_agreement.yaml |
sha256=QZLYkO_7cmUYG0wJFBbXvoDAdgzEouIlWaw3WIlp85o
|
124 |
lm_eval/tasks/blimp/animate_subject_passive.yaml |
sha256=znBh6LPx2JsVMfGJro-hfKDSwKb6UEPuv0SJ7bxjAF0
|
122 |
lm_eval/tasks/blimp/animate_subject_trans.yaml |
sha256=NA59OdcPs1vcNK37AObFpIRusV4bXJAZWwgptFKWlxs
|
118 |
lm_eval/tasks/blimp/causative.yaml |
sha256=iOyrzoGsOaU7L1mRctjhuFVgxFma_Z8FIDana6GRP-U
|
94 |
lm_eval/tasks/blimp/complex_NP_island.yaml |
sha256=IJZMuZgeeJhBdE5fRK9JLkHv4-EFjRGIdZzOMlh6acE
|
110 |
lm_eval/tasks/blimp/coordinate_structure_constraint_complex_left_branch.yaml |
sha256=3KHjSpHUgOlMknw6yyeuFcmq7Tr5Aj0BWhABRqBAXKI
|
178 |
lm_eval/tasks/blimp/coordinate_structure_constraint_object_extraction.yaml |
sha256=1utajR5vsWlwfMlxnAIh6g_ZWMerLWplnVa_91ZOOt8
|
174 |
lm_eval/tasks/blimp/determiner_noun_agreement_1.yaml |
sha256=Xozzid4qpRC2c2Y0G2CzQA4MwtC6lmAxWYzolnV1vyg
|
130 |
lm_eval/tasks/blimp/determiner_noun_agreement_2.yaml |
sha256=h3l_Nur4ofxlOCEKG74Ped29pgKrKGJ2EU06CR-W_ko
|
130 |
lm_eval/tasks/blimp/determiner_noun_agreement_irregular_1.yaml |
sha256=SaT-zTh8rDVb0lpIxKqDsvBaKGGtR2UtyzqE0n-ixuE
|
150 |
lm_eval/tasks/blimp/determiner_noun_agreement_irregular_2.yaml |
sha256=mkorgBYuduNOB-gTdMlNFAxV6N7dC7mjdtL3jcpaWmE
|
150 |
lm_eval/tasks/blimp/determiner_noun_agreement_with_adj_2.yaml |
sha256=RyuzjODaFGx-tpB4qsFUCp6LKxq23TQVpePCW8Qffys
|
148 |
lm_eval/tasks/blimp/determiner_noun_agreement_with_adj_irregular_1.yaml |
sha256=yhSMa2TUnNbcDabHYtIPdgbU34sbFrEW2_WxDXzzrcc
|
168 |
lm_eval/tasks/blimp/determiner_noun_agreement_with_adj_irregular_2.yaml |
sha256=dmUQWIxZnSKEGJgBxBMancfBTAjhp-5Fn6IiL3w1ci4
|
168 |
lm_eval/tasks/blimp/determiner_noun_agreement_with_adjective_1.yaml |
sha256=qO4si9QBuAvM1y0yGP9ZZo1YiQlBZljl2n8zKFh9VDE
|
160 |
lm_eval/tasks/blimp/distractor_agreement_relational_noun.yaml |
sha256=ZXy-qJ5fkMeqctJDqo2hJfsM-8usA9bneX7VWAvR1Ak
|
148 |
lm_eval/tasks/blimp/distractor_agreement_relative_clause.yaml |
sha256=aylJHRj3J50lqloD6TtbRWgTC8sMek7PlolhlQ2_wTs
|
148 |
lm_eval/tasks/blimp/drop_argument.yaml |
sha256=piUDj4gM9_dlopsxQB47CYpaFOV2Z6l3beZEScQqB38
|
102 |
lm_eval/tasks/blimp/ellipsis_n_bar_1.yaml |
sha256=pawDpZP85htkOT_Db2TRFP19neJP1xio404cYcFhzv8
|
108 |
lm_eval/tasks/blimp/ellipsis_n_bar_2.yaml |
sha256=OBAtmSx6TW2Rgo-zdqKNp6ZBhJPBOa8eODvTZb8Blmg
|
108 |
lm_eval/tasks/blimp/existential_there_object_raising.yaml |
sha256=f8wWYmAiqdEAKqIDcSCB2mj3CXRpz6Xx23tBw_YFmAk
|
140 |
lm_eval/tasks/blimp/existential_there_quantifiers_1.yaml |
sha256=0dCbp1jHm8zZrznnHDWb31ho8rDV4tnLR3Fm1uGUMFI
|
138 |
lm_eval/tasks/blimp/existential_there_quantifiers_2.yaml |
sha256=il9eevifcY7YXleFZtMPeT2aHM_0q_pmRrMX8Dnlvas
|
138 |
lm_eval/tasks/blimp/existential_there_subject_raising.yaml |
sha256=Pms6JBnODzdcBr0HkS9o7oMskk0Uxxl0Smz7y8iFnhg
|
142 |
lm_eval/tasks/blimp/expletive_it_object_raising.yaml |
sha256=DP15wYDN9C4ZZFBqz9TcnG89_GkmXm91YWFeueJGZ8g
|
130 |
lm_eval/tasks/blimp/generate_configs.py |
sha256=E8qhbk0Xz2IPgjbc7Tm7QM33JphFsmuqI7KkdR1fFjU
|
2901 |
lm_eval/tasks/blimp/inchoative.yaml |
sha256=DsMpj_a2yrOchFTmTXat0LGocDai5yEhefMj4mw11ug
|
96 |
lm_eval/tasks/blimp/intransitive.yaml |
sha256=S4KtS7drV5J2iqoe3TNXbJIM56m85KCXSTBeCLJModg
|
100 |
lm_eval/tasks/blimp/irregular_past_participle_adjectives.yaml |
sha256=gZhQpDK95j2qJotGRqg1JY5aRxDKMvABwpwLEHBHDvg
|
148 |
lm_eval/tasks/blimp/irregular_past_participle_verbs.yaml |
sha256=J7i1uPI1XRkOJ5J9fVDqkma-DBIVpTP4CQaPF9zNc6A
|
138 |
lm_eval/tasks/blimp/irregular_plural_subject_verb_agreement_1.yaml |
sha256=vkRRN_PpLhliyDbdjyrWP-Exo0IPvqbBxbV-gB-6u-Q
|
158 |
lm_eval/tasks/blimp/irregular_plural_subject_verb_agreement_2.yaml |
sha256=Dhce_QyhiMuLq5nYtEsg9f2U14a2lPM5gNoa_k1BZqU
|
158 |
lm_eval/tasks/blimp/left_branch_island_echo_question.yaml |
sha256=tmYr6gGH_W_bsTxfD0o8E0gm0lpPX_RouukysmN8PmE
|
140 |
lm_eval/tasks/blimp/left_branch_island_simple_question.yaml |
sha256=6fQOQ1Khq4c4r2FKjccNOzQq2nPfSWGEfWAY5ui5YZk
|
144 |
lm_eval/tasks/blimp/matrix_question_npi_licensor_present.yaml |
sha256=zgviPtzlA4t_e1I0uJHQWSIXoVxGCCYCbE9Q6ZJ8H0g
|
148 |
lm_eval/tasks/blimp/npi_present_1.yaml |
sha256=1lFMhXRmF1N-ZCRA71OieXn9dcaNWM0h1_tr9nf3dr8
|
102 |
lm_eval/tasks/blimp/npi_present_2.yaml |
sha256=hkelD4YT05hqNiBu6foSc8Ea6DBTVEZo6tA4_W6pn58
|
102 |
lm_eval/tasks/blimp/only_npi_licensor_present.yaml |
sha256=8exp0yKRSCPcD5AXBbURBTDI1FaCcpWTDP_SQNckXgA
|
126 |
lm_eval/tasks/blimp/only_npi_scope.yaml |
sha256=ByExTctp9xZmTtKrHCGJg70UY6yD2Kqpt1i95zIl1Xo
|
104 |
lm_eval/tasks/blimp/passive_1.yaml |
sha256=aVZXNP2pI2DzSfGuNtNLmWElXxdNPTAMCABV8Yb9Kvk
|
94 |
lm_eval/tasks/blimp/passive_2.yaml |
sha256=RSkmNYrndnY5tweYPxL1rvb7_IYJdBfs-QXQXHvpSuk
|
94 |
lm_eval/tasks/blimp/principle_A_c_command.yaml |
sha256=HNR2XQIRJfJlOn63103PmDnnUG2NY2iMuWPAB_tKoGU
|
118 |
lm_eval/tasks/blimp/principle_A_case_1.yaml |
sha256=2q4Zrc27iGDVaT7XilWvcJCzL3il8UILyEW6BW3-RMs
|
112 |
lm_eval/tasks/blimp/principle_A_case_2.yaml |
sha256=VgfFmGJ5ODxbAyga-hvWrH4ALajZ0CqY8S1yMF5dN6c
|
112 |
lm_eval/tasks/blimp/principle_A_domain_1.yaml |
sha256=wjWNm-2SkxOJpUf6XplZuY_lm45qNsAhEqf8gkw42cE
|
116 |
lm_eval/tasks/blimp/principle_A_domain_2.yaml |
sha256=I7-vj_eHLXL92Q5YyQg0tNkn6XfDwZQmYAcdxZ5jDUk
|
116 |
lm_eval/tasks/blimp/principle_A_domain_3.yaml |
sha256=N4NOk4-FYUrZe_yEB3QVpK10l5YTbVvAR8T2ZdZJbIY
|
116 |
lm_eval/tasks/blimp/principle_A_reconstruction.yaml |
sha256=kbgPw8WRvQgEw4nOx6lIahrJfiwQgeldg-_ubuyduKQ
|
128 |
lm_eval/tasks/blimp/regular_plural_subject_verb_agreement_1.yaml |
sha256=TRl_ZSGOzmoKj8aaps-3UoUH-E2CQTvHkT7oY8tvnp0
|
154 |
lm_eval/tasks/blimp/regular_plural_subject_verb_agreement_2.yaml |
sha256=El69s111tnlZ3PaVD8dJ_mnGyHkwfF1Lx1NRbegvyqc
|
154 |
lm_eval/tasks/blimp/sentential_negation_npi_licensor_present.yaml |
sha256=tlDP6oxHDRNT-DOlxqER7c16pMqjRiYtraonx0dhJSQ
|
156 |
lm_eval/tasks/blimp/sentential_negation_npi_scope.yaml |
sha256=ZA01-DgkD_XiH4_y4LEPTxID6yN6IB3ChXcVM3r-yeo
|
134 |
lm_eval/tasks/blimp/sentential_subject_island.yaml |
sha256=dWTwulV1S633yAhGuWGuyGttg3fkyYwMM2A_y8HxcKc
|
126 |
lm_eval/tasks/blimp/superlative_quantifiers_1.yaml |
sha256=faxiPYPbVCG3Jz-PRJoHlYl6EyhEEc-nprr29tV-3Cc
|
126 |
lm_eval/tasks/blimp/superlative_quantifiers_2.yaml |
sha256=WbMvowOM10KnngE6Nz5iS3f4A5hcEP01331m_m4JmGY
|
126 |
lm_eval/tasks/blimp/tough_vs_raising_1.yaml |
sha256=pK9Upq5umDCfVZWm8u0E2kxdYmEitsuAqO-5QD9tayc
|
112 |
lm_eval/tasks/blimp/tough_vs_raising_2.yaml |
sha256=7VeDbZkxEY8D9nwNymqOHotD8NkeTUibGkKJMSigWtQ
|
112 |
lm_eval/tasks/blimp/transitive.yaml |
sha256=cmejl92fLdcvqrpWR4oX-yLeWExMqtj1a-x0fKHtLwQ
|
96 |
lm_eval/tasks/blimp/wh_island.yaml |
sha256=jFAVoSJBhuKAfU8fs2kl4US-tFiZ03vnMXbNqYfdF0I
|
94 |
lm_eval/tasks/blimp/wh_questions_object_gap.yaml |
sha256=kOvup2GXc9GtfsI9i4wzF3_jbL043PeHWjSUWFi0hBE
|
122 |
lm_eval/tasks/blimp/wh_questions_subject_gap.yaml |
sha256=m3ybX6FgLO7SYEA-7iUyLOTRmXC3hpQpUmkvm620mrw
|
124 |
lm_eval/tasks/blimp/wh_questions_subject_gap_long_distance.yaml |
sha256=rFcVijVQW-IG_mpNmRNFo7QEEhRoQ5CNVfBGKuI8qnw
|
152 |
lm_eval/tasks/blimp/wh_vs_that_no_gap.yaml |
sha256=3Buk7jIKXy4e0c7JYjJ5Iknlobz-JjWQxuMFl-PjuqU
|
110 |
lm_eval/tasks/blimp/wh_vs_that_no_gap_long_distance.yaml |
sha256=RVfGHziEZb_v7um-wo72xZNeSt0VcN6FiODhSq9uxTI
|
138 |
lm_eval/tasks/blimp/wh_vs_that_with_gap.yaml |
sha256=MwnrjZ-CdZGyvAshYmken2hkNf97BhAXNY03rhu679A
|
114 |
lm_eval/tasks/blimp/wh_vs_that_with_gap_long_distance.yaml |
sha256=9gOjb25Zw6AtFaXwyyyo9xrapuN3PwBE-zcCZ4zdWbM
|
142 |
lm_eval/tasks/ceval/README.md |
sha256=UEX7W3AFO3-cM3UcL3yrLoO9C4ZsmiiD2cRzvCH6nys
|
4967 |
lm_eval/tasks/ceval/_default_ceval_yaml |
sha256=N8KsT9uZ47QAPbySBgnlmYLGTPJxhbUNI7SC5Lyt66g
|
507 |
lm_eval/tasks/ceval/_generate_configs.py |
sha256=rQI-ZBmPXnfNXr7gChZ382dlBwFah8uriS1K206waF8
|
4374 |
lm_eval/tasks/ceval/ceval-valid_accountant.yaml |
sha256=r61lKl0DAH5ySKcDs7AwPvQl8JVUiHZfvzmJRmBiUX8
|
207 |
lm_eval/tasks/ceval/ceval-valid_advanced_mathematics.yaml |
sha256=TowvVz5_ZfK6yBmcAuqQ1T1uv9_PfeQ8bJen8NkRHrg
|
224 |
lm_eval/tasks/ceval/ceval-valid_art_studies.yaml |
sha256=kI7p4mk8_5oF4IEb9hAgy9LASGQIXRzzVp5Xar39Kis
|
203 |
lm_eval/tasks/ceval/ceval-valid_basic_medicine.yaml |
sha256=m2PzLxFzKXbYd4_2Ln2z7sxS25fVlw1GiuKYjnZ1Nt4
|
212 |
lm_eval/tasks/ceval/ceval-valid_business_administration.yaml |
sha256=tVyXVeOB5Mk_4WkGiY4FsVMb9GHWA0bXvK9VS22gTw8
|
230 |
lm_eval/tasks/ceval/ceval-valid_chinese_language_and_literature.yaml |
sha256=SAhX_ST3R3hSDvyVRoZMvTIDTLzAOR6IA4QHRkUjwvM
|
252 |
lm_eval/tasks/ceval/ceval-valid_civil_servant.yaml |
sha256=G_8m9RcD_aV7jJXAubW_1oq84RIbrUfyLZxxTcic_vE
|
207 |
lm_eval/tasks/ceval/ceval-valid_clinical_medicine.yaml |
sha256=0QikXTEvr3amDcUGl8DcfynOZj0Ll5hZRa1AhhHTXQ8
|
218 |
lm_eval/tasks/ceval/ceval-valid_college_chemistry.yaml |
sha256=0rhGE5axuBh5O4Z4aZRaOuQ0usiuTJd-CtAvKpxI9NE
|
218 |
lm_eval/tasks/ceval/ceval-valid_college_economics.yaml |
sha256=Y9xrtTT-BiinFOkkqI7nWi4GyB1bxiOHh6pRPff3-AQ
|
221 |
lm_eval/tasks/ceval/ceval-valid_college_physics.yaml |
sha256=JJfHph_isVStbsk2yIav4A5iqmLWNf1EAmCFOIUjk5Y
|
214 |
lm_eval/tasks/ceval/ceval-valid_college_programming.yaml |
sha256=FYNlc9mHqfoLCAdtjx3aiaPq-HuI0c2zNDQp8AaE6wo
|
222 |
lm_eval/tasks/ceval/ceval-valid_computer_architecture.yaml |
sha256=vGZ__iGOj0_nX7aVWX3qCDYrr2eEJ1mJj7k59NG3CTs
|
229 |
lm_eval/tasks/ceval/ceval-valid_computer_network.yaml |
sha256=gPMX8lN2YMGH9QYaKBEXProfP_MA9XV4Lx_udMr-ktQ
|
219 |
lm_eval/tasks/ceval/ceval-valid_discrete_mathematics.yaml |
sha256=a9wuabDadH9CgiyQc5uW1lld4vAeaJYv4mPTx5u-Ujg
|
224 |
lm_eval/tasks/ceval/ceval-valid_education_science.yaml |
sha256=KiFoKyLZHkaDYdWCAZ45k4K_GglR3MDJGheeHWDgSbM
|
215 |
lm_eval/tasks/ceval/ceval-valid_electrical_engineer.yaml |
sha256=DjZ62r5DtU_XIS1K-MUbQqbigXYd6YCQI7LBYdXhB8Y
|
231 |
lm_eval/tasks/ceval/ceval-valid_environmental_impact_assessment_engineer.yaml |
sha256=S-HPmH9da8gLu8lh_2YZ4XwV5Hog7JPJJEbxVkbd0Kk
|
279 |
lm_eval/tasks/ceval/ceval-valid_fire_engineer.yaml |
sha256=aTajwMc0EjalqD3Rx5O6BUX3slgolA8lxLSjF0NvDlE
|
219 |
lm_eval/tasks/ceval/ceval-valid_high_school_biology.yaml |
sha256=KMO3L-P6JFdCwkH5431YBOImX-oWGi6A9gmtvyCq-EU
|
222 |
lm_eval/tasks/ceval/ceval-valid_high_school_chemistry.yaml |
sha256=YdpYxhBFLDoKk9gz6UiZa6TBuqrdRH8FnZmG2NZiuL4
|
226 |
lm_eval/tasks/ceval/ceval-valid_high_school_chinese.yaml |
sha256=6L4ePI81IW_ssklfqriFt83X8vMZ4b0gm_oAkpDXkqA
|
222 |
lm_eval/tasks/ceval/ceval-valid_high_school_geography.yaml |
sha256=rPDd_fm_nqM530JAWLG7PmYyCFux3wOZf50gdZBBRVY
|
226 |
lm_eval/tasks/ceval/ceval-valid_high_school_history.yaml |
sha256=SEMX0dqEXZjsvTn1JP_3ECBZ0M56I4WBKFbw0XWI8No
|
222 |
lm_eval/tasks/ceval/ceval-valid_high_school_mathematics.yaml |
sha256=j45jE6-jfXFcdkLZFY2jPwexDnqiBkqilwC9a5vsM04
|
230 |
lm_eval/tasks/ceval/ceval-valid_high_school_physics.yaml |
sha256=lTuM6LCjO9SlruoHX3xepebj46l_0ZK_N5l5HZmys6A
|
222 |
lm_eval/tasks/ceval/ceval-valid_high_school_politics.yaml |
sha256=T6HS-hthajC2NJi5NFKkD0XDxmXmKHCNuhBbhntddpU
|
224 |
lm_eval/tasks/ceval/ceval-valid_ideological_and_moral_cultivation.yaml |
sha256=hmHJ5O9v3iXt-j8xHO7UeCMWE6A6FB-dciyljq9xSqM
|
271 |
lm_eval/tasks/ceval/ceval-valid_law.yaml |
sha256=QmrSRhjMC5K7OQDTz2_r52HJVZWWv4xjrptwmY5NKzA
|
184 |
lm_eval/tasks/ceval/ceval-valid_legal_professional.yaml |
sha256=rQMWxpcWt2Y1bhoSgaUP5US4OXVbPvTSxvU_J90dwHk
|
226 |
lm_eval/tasks/ceval/ceval-valid_logic.yaml |
sha256=mnuTRJO3tYKeySn2n3B-92InjPvz3t0mhf-UaKGcHgI
|
191 |
lm_eval/tasks/ceval/ceval-valid_mao_zedong_thought.yaml |
sha256=z4BrjRmSCh96ieu9MCmc9J-vy0PnBdxKYO7Q8lUjenc
|
268 |
lm_eval/tasks/ceval/ceval-valid_marxism.yaml |
sha256=3KjhPFk4w9kpVzl1WD9Va4EOAkux32iBqrfQ1UIP9s8
|
213 |
lm_eval/tasks/ceval/ceval-valid_metrology_engineer.yaml |
sha256=YqiCDiJ4bphneVAIjweU5Qqc4uck_s_iuIzMT9HF_kQ
|
223 |
lm_eval/tasks/ceval/ceval-valid_middle_school_biology.yaml |
sha256=Ic-e39wEVx6NScOoCbkA7dciQ-Y2wt0QFmN0kWVTVEk
|
226 |
lm_eval/tasks/ceval/ceval-valid_middle_school_chemistry.yaml |
sha256=CJ6HyS-6Nlcp-wi0yb74zdqUPL_zQWdTf9oTYQcCGO4
|
230 |
lm_eval/tasks/ceval/ceval-valid_middle_school_geography.yaml |
sha256=Yh1mxAbsNan6WY4sH8eN5EI-oLw8psQ5PmGO1ZX-ZrU
|
230 |
lm_eval/tasks/ceval/ceval-valid_middle_school_history.yaml |
sha256=ckDHEb5npvsq2mdt4ICfkbk0eTlcZxHWlGJXax-1aIY
|
226 |
lm_eval/tasks/ceval/ceval-valid_middle_school_mathematics.yaml |
sha256=Mtt8szOofgOabzBBVLIPV67b7sDEECndzOAz057qlJs
|
234 |
lm_eval/tasks/ceval/ceval-valid_middle_school_physics.yaml |
sha256=oue8rUCV8h0MP0gx5emFPTOreBh6FSNhqNi_HEJtvW8
|
226 |
lm_eval/tasks/ceval/ceval-valid_middle_school_politics.yaml |
sha256=pKqoZ560D8p0sJ6sEBanLv_ybuppFpvd8f-IYRCVl50
|
228 |
lm_eval/tasks/ceval/ceval-valid_modern_chinese_history.yaml |
sha256=ISjUEGRMxv2nQGf50IbxoQEMA4hLHUchXO5wWT_ams8
|
231 |
lm_eval/tasks/ceval/ceval-valid_operating_system.yaml |
sha256=1r9lC8brpfqm4D1lX1_0avgSZXwAm3xq48WtLYxtCxE
|
216 |
lm_eval/tasks/ceval/ceval-valid_physician.yaml |
sha256=JV3vjt37Cmnv0fGCQzjpvCxGljASNTJQj3fO8Xt0WY4
|
202 |
lm_eval/tasks/ceval/ceval-valid_plant_protection.yaml |
sha256=XxzSPV-7R2X6nOiqWM_PhKeMtIT9WOwVvkNCc71KZNM
|
216 |
lm_eval/tasks/ceval/ceval-valid_probability_and_statistics.yaml |
sha256=Dm-WFp5dusbxLucUCEqRkmcbgIGnNjYoMXsmYbYJ5UY
|
236 |
lm_eval/tasks/ceval/ceval-valid_professional_tour_guide.yaml |
sha256=LMS9fyh7Zmt8grr4CBQGccGHPAKuj0RZAj3XQGzmyl0
|
230 |
lm_eval/tasks/ceval/ceval-valid_sports_science.yaml |
sha256=6rgkkmJCxopoPNedAkIhWVpGzhdcB4ztYO0EmUk_9rc
|
209 |
lm_eval/tasks/ceval/ceval-valid_tax_accountant.yaml |
sha256=dHhlfeqH_HUlTkKbWzOJNaYXzAE1c9FWejT_3XBiGhU
|
209 |
lm_eval/tasks/ceval/ceval-valid_teacher_qualification.yaml |
sha256=msYhw4RmvIXosDstJVb1l7wUs_-hokMOFY1UFSTteHc
|
226 |
lm_eval/tasks/ceval/ceval-valid_urban_and_rural_planner.yaml |
sha256=lqXQXjQI4jxIQ3_iNIaTQE1CJ3OGg5UzEcL0NIiQRgs
|
239 |
lm_eval/tasks/ceval/ceval-valid_veterinary_medicine.yaml |
sha256=g9Ui3hPL64eumBGsuKUE1xgiCKFMFzt8hqbJ14pbu90
|
219 |
lm_eval/tasks/cmmlu/README.md |
sha256=gyA3hrGDwuWy4mtFMPgxWXleKApdjgbKmiiWi0t9CMk
|
1748 |
lm_eval/tasks/cmmlu/_default_template_yaml |
sha256=Rap2Tp1bIJjwAJRLwTvRv4rzSYioPENv3PDqltoDZmQ
|
495 |
lm_eval/tasks/cmmlu/_generate_configs.py |
sha256=Y9MBP046ouOMJDLFEGVGKYVuBh3nowAiRBMChA6zdkI
|
4773 |
lm_eval/tasks/cmmlu/cmmlu_default_agronomy.yaml |
sha256=DqvlHZ1g4sDq5lFUjDzk8Xu7LdpfOajsqgD5COLsnio
|
191 |
lm_eval/tasks/cmmlu/cmmlu_default_anatomy.yaml |
sha256=SKazmZTenePltXz5i7wj33uM-zwAjWTmKcd0ngzEjOM
|
192 |
lm_eval/tasks/cmmlu/cmmlu_default_ancient_chinese.yaml |
sha256=zQ5j11KOJ60Q0n3IJ2SNGFkx01I0Qy6p6i-RQTQC8_8
|
208 |
lm_eval/tasks/cmmlu/cmmlu_default_arts.yaml |
sha256=qNkb7UTvtgXF9JcHo8qSYW6O22tZgLSuPzvoklCL0zw
|
186 |
lm_eval/tasks/cmmlu/cmmlu_default_astronomy.yaml |
sha256=lgF3qfC_2bQc4NEklG6vnwmhy1GvfogpgRSYfoijulQ
|
196 |
lm_eval/tasks/cmmlu/cmmlu_default_business_ethics.yaml |
sha256=TdFBk1ool2z3ihnnk5LHraT6R_Feo_F_p5at9JT3HcY
|
211 |
lm_eval/tasks/cmmlu/cmmlu_default_chinese_civil_service_exam.yaml |
sha256=l7wFBEEn_BtahJVHQL6cI7azQeWSs3hX-2XdHX-CjhM
|
242 |
lm_eval/tasks/cmmlu/cmmlu_default_chinese_driving_rule.yaml |
sha256=0Uj-zYoT4yeQqOqBfIXi_IpYzyQPcHMCf1dS9ma2LKc
|
227 |
lm_eval/tasks/cmmlu/cmmlu_default_chinese_food_culture.yaml |
sha256=EMIfT1GJluls12hfxlmTgfNKevRuzV9XWkoGTzO0djI
|
227 |
lm_eval/tasks/cmmlu/cmmlu_default_chinese_foreign_policy.yaml |
sha256=1yuG2_1A9Oe4_o_Bl7uJKOv3Qfqv9r6JYAD1P6L3AHg
|
231 |
lm_eval/tasks/cmmlu/cmmlu_default_chinese_history.yaml |
sha256=vYox5jq9_vm04ClPytEiqluf8oiJ7Y2Yl8dwphd_ukY
|
211 |
lm_eval/tasks/cmmlu/cmmlu_default_chinese_literature.yaml |
sha256=6vFl0vmSFAeLBtcyn9utf7YGQMtiJEOjxR1XtmmeN7k
|
217 |
lm_eval/tasks/cmmlu/cmmlu_default_chinese_teacher_qualification.yaml |
sha256=Ofur5dABRspuog_bL39FTQcJ6cqSj3B1pjJTeparuPg
|
245 |
lm_eval/tasks/cmmlu/cmmlu_default_clinical_knowledge.yaml |
sha256=ReXbIW90A0BZ3NGOysUraRr1n4Ugto-Pl8z3CPPU4aA
|
217 |
lm_eval/tasks/cmmlu/cmmlu_default_college_actuarial_science.yaml |
sha256=vvVIOnXSEG-J9OcEFf4G3qGpGBRkfrKb8x1_oJrruK4
|
234 |
lm_eval/tasks/cmmlu/cmmlu_default_college_education.yaml |
sha256=9AUMkRL72eBk2UnWaDBtmgdrh0EQZait775LloIZq7M
|
218 |
lm_eval/tasks/cmmlu/cmmlu_default_college_engineering_hydrology.yaml |
sha256=HBihPhmNhTPj7_LSB939YL_o8zOI8vsuTXuEK8F2yd4
|
248 |
lm_eval/tasks/cmmlu/cmmlu_default_college_law.yaml |
sha256=FWe0m1K9JmnVTcfXW5Fbsv2tE3LGBfNhSxLXrVi4pSk
|
203 |
lm_eval/tasks/cmmlu/cmmlu_default_college_mathematics.yaml |
sha256=1os_um2HNCfbbRJYM6IKAG05I2_QsiSrmW9OaHLNGwo
|
219 |
lm_eval/tasks/cmmlu/cmmlu_default_college_medical_statistics.yaml |
sha256=z6LJZK45Tf9gj9LIx1TjjuaH8LACReSz43ObiNTvd0A
|
239 |
lm_eval/tasks/cmmlu/cmmlu_default_college_medicine.yaml |
sha256=iIQRLQfEx3ZCtcRqHE5Il1XDqjqaHaV8oAdM2ihWCC4
|
213 |
lm_eval/tasks/cmmlu/cmmlu_default_computer_science.yaml |
sha256=64z6rFtry_E0LS5opBBaBcHXzmOW1lg9Y1wh1lNx1Cg
|
216 |
lm_eval/tasks/cmmlu/cmmlu_default_computer_security.yaml |
sha256=iCYXgKnc8GpnHAwHPZq1-XbXzwZ9AlBuANlQ66Wj1Sc
|
218 |
lm_eval/tasks/cmmlu/cmmlu_default_conceptual_physics.yaml |
sha256=L_DkqkfoMI1kBneIXn9W3r-zZ7rG0bp_dceUOlqaVWU
|
220 |
lm_eval/tasks/cmmlu/cmmlu_default_construction_project_management.yaml |
sha256=1tMoBrlqts3rgxwRgVUu8tRR9td8S8_54LPZyOKRgZQ
|
249 |
lm_eval/tasks/cmmlu/cmmlu_default_economics.yaml |
sha256=bai4ZwJBfG7OAN_uSS-uajVt-HOrUw9nNwK4f9R53RI
|
196 |
lm_eval/tasks/cmmlu/cmmlu_default_education.yaml |
sha256=JHFLezPEuR8vINuJ7fiq5vrMMaWieyW3HXoWsdpOWnw
|
196 |
lm_eval/tasks/cmmlu/cmmlu_default_electrical_engineering.yaml |
sha256=pVHvc_MRieXI3ff7WJpKkQV1uaap3II7-BuzkAwrHiY
|
225 |
lm_eval/tasks/cmmlu/cmmlu_default_elementary_chinese.yaml |
sha256=P4jiuRXU5OqjvlpDkjFJHl4RLu7b5LaTmbGrmvseYMI
|
217 |
lm_eval/tasks/cmmlu/cmmlu_default_elementary_commonsense.yaml |
sha256=OlTYX9qyhhu4u5VYFDtUGEFicu-VPNLmNU1Juq8uO0w
|
225 |
lm_eval/tasks/cmmlu/cmmlu_default_elementary_information_and_technology.yaml |
sha256=hAPmn31ac7hFTFl283vhK1jPjJm5tv6VchLKQgb3yPs
|
261 |
lm_eval/tasks/cmmlu/cmmlu_default_elementary_mathematics.yaml |
sha256=D8ne6N6tJCsPzWqlF4qxy6oBgkmjb6Jqy5DKw-xJMnU
|
225 |
lm_eval/tasks/cmmlu/cmmlu_default_ethnology.yaml |
sha256=OhNfsDxIuIA7ADIMc2SYiWjMtEw_DehtcQSIbXTbxc4
|
196 |
lm_eval/tasks/cmmlu/cmmlu_default_food_science.yaml |
sha256=fItOTnSEaBqDxokXTmY62WJI8orHAo2EL6HHAA_6z8A
|
205 |
lm_eval/tasks/cmmlu/cmmlu_default_genetics.yaml |
sha256=TOWNyAd8uOc1NrZkjgDMuYBDKaW1Ft8xJRABwMZYenk
|
194 |
lm_eval/tasks/cmmlu/cmmlu_default_global_facts.yaml |
sha256=-jZNUBh1qBrRVz70BfV4WWjhDwS4jsH5G9yipyKDHfE
|
205 |
lm_eval/tasks/cmmlu/cmmlu_default_high_school_biology.yaml |
sha256=pX2-airA86ZU5pUjewxjdlcLs-9FWHUUUiAnzBubrwQ
|
219 |
lm_eval/tasks/cmmlu/cmmlu_default_high_school_chemistry.yaml |
sha256=Q1ZBG8Wp9ab96l19PRwod9Dll5skvlB96x2A1Jmnfc0
|
223 |
lm_eval/tasks/cmmlu/cmmlu_default_high_school_geography.yaml |
sha256=G0VrkoUMzKtEm1kzOuEwPdq2vtlkc0KMDMsEGF6t1ds
|
223 |
lm_eval/tasks/cmmlu/cmmlu_default_high_school_mathematics.yaml |
sha256=wB7tBE5a9SWghbkP6dRakza_3PpSt-wkmTrd0bQpUEc
|
227 |
lm_eval/tasks/cmmlu/cmmlu_default_high_school_physics.yaml |
sha256=-QcmeommiYmIqCYaLVsaars-u6VKnqzbIoaf7Uz3Tmg
|
222 |
lm_eval/tasks/cmmlu/cmmlu_default_high_school_politics.yaml |
sha256=kKjyp_zDx4tsAJkWmzBCqp6Ubx2hhriEl-PiI6GHRys
|
221 |
lm_eval/tasks/cmmlu/cmmlu_default_human_sexuality.yaml |
sha256=IB0QxIhbKjAmhT77CJqheViIVw-2sZ3_kWpeyDcFAOw
|
214 |
lm_eval/tasks/cmmlu/cmmlu_default_international_law.yaml |
sha256=9luncjc_o4MvJjIYSznbT4ljfGEkrQdiaxYRajAnREA
|
215 |
lm_eval/tasks/cmmlu/cmmlu_default_journalism.yaml |
sha256=Tzhv5LmPa9-RTrok-GBgGc3mag4AmPIUVJKYqhzA_-c
|
198 |
lm_eval/tasks/cmmlu/cmmlu_default_jurisprudence.yaml |
sha256=OVAiNRVJBAUmw7ON2CX1cP44BUv7TktZW0ufOC6Zgco
|
204 |
lm_eval/tasks/cmmlu/cmmlu_default_legal_and_moral_basis.yaml |
sha256=YbQTOpGYrKJr5TOKzEWrUl3FO6zQtu1pAwjGCnmPRik
|
232 |
lm_eval/tasks/cmmlu/cmmlu_default_logical.yaml |
sha256=4lpQg10BWCqLyepRgXn4fcazO9J6YKiZvoWhgRJTytw
|
192 |
lm_eval/tasks/cmmlu/cmmlu_default_machine_learning.yaml |
sha256=yTSdJ2qB6hVZ-I1M3V8IQshSThOugOI_2H3ECNdeoig
|
213 |
lm_eval/tasks/cmmlu/cmmlu_default_management.yaml |
sha256=xj0wH_La-bf_Ezx9mjmsbY07M4UdTXbkzCqGdnzJkRk
|
198 |
lm_eval/tasks/cmmlu/cmmlu_default_marketing.yaml |
sha256=l7ulx3Nr47Ai4-MwPSvr64j1cKF8hG0wpkUHNKVkuTU
|
199 |
lm_eval/tasks/cmmlu/cmmlu_default_marxist_theory.yaml |
sha256=d7XeZBoxxtzm9rf4WrjcChH5-RDT00XgITU9QJXKkBA
|
218 |
lm_eval/tasks/cmmlu/cmmlu_default_modern_chinese.yaml |
sha256=M2gRRZy54c8e6CeJu69yNAoP6c9NpDfSMlVyD_0pMvk
|
209 |
lm_eval/tasks/cmmlu/cmmlu_default_nutrition.yaml |
sha256=yLQYVLdRY1MUc4NaCidmrFlsDAWaBmI4tp9r3DLzjqY
|
196 |
lm_eval/tasks/cmmlu/cmmlu_default_philosophy.yaml |
sha256=IlGz2CINUIAzbvlLbnAbXOdNsxCyO2rmwSnwB9iqF_8
|
195 |
lm_eval/tasks/cmmlu/cmmlu_default_professional_accounting.yaml |
sha256=TgYE1xSlF2MBJW7fnisY7-dwcJlxTU-lKJDmf3nS5HA
|
227 |
lm_eval/tasks/cmmlu/cmmlu_default_professional_law.yaml |
sha256=S86GwVZZw3ilxfFvxpvZg5Rsl1sn-nUllYx5VFktinE
|
213 |
lm_eval/tasks/cmmlu/cmmlu_default_professional_medicine.yaml |
sha256=o9w1kA9-L1J72EuQ7V2kq1YhlUIS4ovXVhoQ44GLcbY
|
223 |
lm_eval/tasks/cmmlu/cmmlu_default_professional_psychology.yaml |
sha256=w5wE-YswhIPdQp1NWW2U09hYs3Rd64bvb6ZGupYucTk
|
230 |
lm_eval/tasks/cmmlu/cmmlu_default_public_relations.yaml |
sha256=jblBswd7hMbPfweUa-5hVEp43oNF24v4MeWRuea8Q3U
|
213 |
lm_eval/tasks/cmmlu/cmmlu_default_security_study.yaml |
sha256=CFKa_RoDtHDkHrXyyS9FNp_HI6vGCV7XaogP2cjVHyk
|
209 |
lm_eval/tasks/cmmlu/cmmlu_default_sociology.yaml |
sha256=Qzr4AiRoyPHtIISXvBN8_XAXltIO9GdMYr7xYXk9Atc
|
196 |
lm_eval/tasks/cmmlu/cmmlu_default_sports_science.yaml |
sha256=wD1eTg1JgFg-rnglXDDM--owRRq94g6st7GA3zZiXkA
|
206 |
lm_eval/tasks/cmmlu/cmmlu_default_traditional_chinese_medicine.yaml |
sha256=fs7VxHpIsAqdW52e-ffc6ClIdomsVPGzQKyiuGTTNs8
|
237 |
lm_eval/tasks/cmmlu/cmmlu_default_virology.yaml |
sha256=aB_oTbDjh76nGH9rIkNhcbygJJkmckEBj7ehe_BVSd4
|
194 |
lm_eval/tasks/cmmlu/cmmlu_default_world_history.yaml |
sha256=AWCZJjmwhJobrzPCUpNRKh5F_ieCDWuhQv4H6uq0mZA
|
207 |
lm_eval/tasks/cmmlu/cmmlu_default_world_religions.yaml |
sha256=v39HzwxSXp2xo5Ap_Ig1sGcdT0XkiDKRBsiPnI7J05I
|
211 |
lm_eval/tasks/code_x_glue/code-text/bleu.py |
sha256=bGCIK_eVzN92SnXvFXZEt9YpAntvpUcCegANXFD8vqY
|
7847 |
lm_eval/tasks/code_x_glue/code-text/go.yaml |
sha256=E69gjwTkkc9b2iYg-9KGJuItUb9UaOI8gzuKUHdTBf8
|
479 |
lm_eval/tasks/code_x_glue/code-text/java.yaml |
sha256=HhXKmCgWkp9O7nsI2O-glQsbzDjfsZNSL8Vf-ID1NgQ
|
483 |
lm_eval/tasks/code_x_glue/code-text/javascript.yaml |
sha256=L3brOBtKJTNeJFUQUw_-N6Q8S1M_aQ0aCfo9ydwt7qw
|
495 |
lm_eval/tasks/code_x_glue/code-text/php.yaml |
sha256=relg83ds1g2wf5x0euX8YqLKc_Y_XaYviH2e8stCnrg
|
481 |
lm_eval/tasks/code_x_glue/code-text/python.yaml |
sha256=-5ipicnQUBTH2fUZG3jZ1XjAX0ue6K2HIY_d_5AS5QM
|
487 |
lm_eval/tasks/code_x_glue/code-text/ruby.yaml |
sha256=dqAtzuKflJGBo09goRL2SgTkD1wRbBhLRyhu6wr6c50
|
483 |
lm_eval/tasks/code_x_glue/code-text/utils.py |
sha256=Bt0SAZ8OruKLYiMCZUo1pTVRso-79yd7Lg5mNwzquko
|
308 |
lm_eval/tasks/coqa/README.md |
sha256=LF6N0XSwsg6DLYACWr5FJca7bRlUYib00tGPHNiSzg0
|
1262 |
lm_eval/tasks/coqa/default.yaml |
sha256=A6Nt3Thu3Q4OZjo8epOvC8rcTyU6Mb3nqhgmFInbs5o
|
608 |
lm_eval/tasks/coqa/utils.py |
sha256=YqyC6AJxYtE0cJNVoAUm_1SX3rWYe-67GLQ5syDoYMo
|
2835 |
lm_eval/tasks/crows_pairs/README.md |
sha256=HesNVCLZST9DTRBTjxbAOIwzKG9UGaR9CuPVIrQUz3I
|
6562 |
lm_eval/tasks/crows_pairs/crows_pairs_english.yaml |
sha256=sLUaumY4JkiF3Xq31Ne_o0QorGaiasSYUMWMwVbYeNk
|
550 |
lm_eval/tasks/crows_pairs/crows_pairs_english_age.yaml |
sha256=g15ncf9B-uj8jpnGspHMF_tkTgytHxTFDEQheq-r5jE
|
127 |
lm_eval/tasks/crows_pairs/crows_pairs_english_autre.yaml |
sha256=-ZVZSt0RkemIKAHx-qM_Zf6WYphWFbtpKFTZqN4zer8
|
131 |
lm_eval/tasks/crows_pairs/crows_pairs_english_disability.yaml |
sha256=FDuoBS89Bt4XnXT1qO4G3AKaLzRtjUr9ty_essY5ms4
|
141 |
lm_eval/tasks/crows_pairs/crows_pairs_english_gender.yaml |
sha256=Jp_bpHin0LDl4Oh_5dw7DsnPIdw27_L7IvCSlt5-soc
|
133 |
lm_eval/tasks/crows_pairs/crows_pairs_english_nationality.yaml |
sha256=Xq_gMqx84YOsPB85t-mg-WowqOC9wGZAjti5s1vxZEE
|
143 |
lm_eval/tasks/crows_pairs/crows_pairs_english_physical_appearance.yaml |
sha256=rHxnfaefCxo-yW1nSA6odWsGWM1nuZ4qO7mY0_U3akY
|
150 |
lm_eval/tasks/crows_pairs/crows_pairs_english_race_color.yaml |
sha256=1TcaZQ2Vq0XQPalvOSvlpKZ43gzWOJ2_cwokusrppt0
|
141 |
lm_eval/tasks/crows_pairs/crows_pairs_english_religion.yaml |
sha256=TL4EheFGZbH1g13jyDFTx83tcLFoGijbuxv34HuCp8s
|
137 |
lm_eval/tasks/crows_pairs/crows_pairs_english_sexual_orientation.yaml |
sha256=fkwnSl7AJI3zbmuWD2lWGOE7tiuRumRN1uINS0QI-d4
|
150 |
lm_eval/tasks/crows_pairs/crows_pairs_english_socioeconomic.yaml |
sha256=uDwc7LsQC_Ws-4PsFQ8tc5vDkU98PxGzg4xz012Zi7w
|
139 |
lm_eval/tasks/crows_pairs/crows_pairs_french.yaml |
sha256=fz9gbMutyCHqm_OKj0xqqkr0Z3b3DLbQa54fAPAZ-dE
|
80 |
lm_eval/tasks/crows_pairs/crows_pairs_french_age.yaml |
sha256=p5WCzdbPIkilp8qG0fZGWG3dHjKr7ynX6PUP5GAWsN4
|
125 |
lm_eval/tasks/crows_pairs/crows_pairs_french_autre.yaml |
sha256=nWk1CtmS4rPNxHuhp4fq4_r8MXmjO0PZUes6Cl5kW7E
|
129 |
lm_eval/tasks/crows_pairs/crows_pairs_french_disability.yaml |
sha256=JHuqbu8Z8VflYRzJF2KnYGdIshBae9AmYptl84dW_wU
|
139 |
lm_eval/tasks/crows_pairs/crows_pairs_french_gender.yaml |
sha256=I9YDvpOnQXTMWOH1smjEs1nDiDeQP3Emq-XN2SUfWQ0
|
131 |
lm_eval/tasks/crows_pairs/crows_pairs_french_nationality.yaml |
sha256=ViElfWF8v9_JzWlhqosZtkA1WEuYCqwl__1eM0bByAg
|
141 |
lm_eval/tasks/crows_pairs/crows_pairs_french_physical_appearance.yaml |
sha256=Hv8VGBgSbJRy7ituauUmgxxFc3aPMJiwPLEDuk1W4L4
|
148 |
lm_eval/tasks/crows_pairs/crows_pairs_french_race_color.yaml |
sha256=WIbsZhtI3CTC1tYI0QuVtHRatNinqWWVbEhCFqadzLg
|
139 |
lm_eval/tasks/crows_pairs/crows_pairs_french_religion.yaml |
sha256=n19G-AGyzTMp8dPGUcS-1TuCs90O9vR1np7oxn9RzhM
|
135 |
lm_eval/tasks/crows_pairs/crows_pairs_french_sexual_orientation.yaml |
sha256=zg4UOJEM1CnKu933_I8NXpyM3pADeihBpMFOjrsWKpA
|
148 |
lm_eval/tasks/crows_pairs/crows_pairs_french_socioeconomic.yaml |
sha256=N5rktYPTmeZkQDPZw6mGZL5GhBdmyE9hkxtd__lh8GA
|
137 |
lm_eval/tasks/crows_pairs/utils.py |
sha256=Wx48MYgKgqn-kHLhTtsV_-FD0Ik53l0X_qF8LcL-DBY
|
1892 |
lm_eval/tasks/csatqa/_default_csatqa_yaml |
sha256=ZNaxMJHOhxOemhEyAVIzssgSpG-QbbTMEFflNFO4mIs
|
391 |
lm_eval/tasks/csatqa/_generate_configs.py |
sha256=npAnvYe62-G_mM7T2Z-VaPDYfjItoW1YKCgGhK0kCTs
|
1473 |
lm_eval/tasks/csatqa/csatqa_gr.yaml |
sha256=WfwUoa2uX8gOjaQfcVDUvVSVkWCmbJBjiv7KBpjHZ5w
|
75 |
lm_eval/tasks/csatqa/csatqa_li.yaml |
sha256=ZRwynLR8BVgxgFcSDTLi_WoHpkYAtmG6iJhLhr8KUFQ
|
75 |
lm_eval/tasks/csatqa/csatqa_rch.yaml |
sha256=hciObdoI5LBjMc0eM3fFX3fc-uKpuIIt-02-0-5K5Q8
|
77 |
lm_eval/tasks/csatqa/csatqa_rcs.yaml |
sha256=8bSnj6bbts-sRbYrXpzM7OITuxED7VuIMiUzzo9xMPY
|
77 |
lm_eval/tasks/csatqa/csatqa_rcss.yaml |
sha256=-GoC4clrkSwJLOFkxa6TOEwin1PeTaKfy-Qw6BpHogc
|
79 |
lm_eval/tasks/csatqa/csatqa_wr.yaml |
sha256=ovjDaNGHTq38vQ3RROv4ppR09nQyVN6RMEsGimHfiL8
|
75 |
lm_eval/tasks/csatqa/utils.py |
sha256=thFD-3JzYceDfR055-F6NhjxFLaEoAxF3b6E4ehwea4
|
662 |
lm_eval/tasks/drop/README.md |
sha256=_fto2NjX5LFKc6jv6Ip5dM7V-viFzt8sGlqcxBM7OJI
|
1857 |
lm_eval/tasks/drop/default.yaml |
sha256=6TeO_wLpoHxT0RnHTCO0xz9uL0kARdyViBqfKxPv5kA
|
642 |
lm_eval/tasks/drop/utils.py |
sha256=AuyxjM40-P0M6opJZiUULGlJE_ENhFK6uDgET-Uaeu8
|
5987 |
lm_eval/tasks/eq_bench/README.md |
sha256=vpylXqkMwXtH6NJGdUdUbLC8sVvJdKVpyX429VGSw_s
|
2949 |
lm_eval/tasks/eq_bench/default.yaml |
sha256=gyqAyRs1TvPTujpuD8dn7-4DpzU4GHvn8IYohMEVn6I
|
487 |
lm_eval/tasks/eq_bench/utils.py |
sha256=i-LCI-BP46h-3DtniEDg3-l34M__xS91VHWb4JhAz2I
|
2323 |
lm_eval/tasks/fld/README.md |
sha256=vbrH0LDSKeE9rQeo-93aTCF_K6JsJVOy0vWWzczhRSA
|
2812 |
lm_eval/tasks/fld/fld_default.yaml |
sha256=aDvqFrZRJcXWrSWb6yxz5TkUDImF3Trb5YIzHTefk6c
|
562 |
lm_eval/tasks/fld/fld_star.yaml |
sha256=I3lOwfUP5LoHYygYIZCMQenYkQ11AqQVNLlUrRcls0I
|
60 |
lm_eval/tasks/french_bench/README.md |
sha256=kgluZP2TaoqPeDUirXDoyegOt9GzhQmwZjITlRqXflc
|
4403 |
lm_eval/tasks/french_bench/_default_template_yaml |
sha256=gN9nCOPneJ1GzAlAfNDQLoi1j9mO25Imanaqifto-Rc
|
73 |
lm_eval/tasks/french_bench/french_bench_arc_challenge.yaml |
sha256=B7_9f4z3jiDy3saoPxtfd7pyGmX81m6EIkysvLQZQTk
|
598 |
lm_eval/tasks/french_bench/french_bench_boolqa.yaml |
sha256=WFziLgft30rkgvpJRObOtB_rvPIsGzoGFou2rNvJOW0
|
832 |
lm_eval/tasks/french_bench/french_bench_fquadv2.yaml |
sha256=dCg-EGiFJS7BzmY2vAolC_s8wh3U6JF450918qoSheo
|
1032 |
lm_eval/tasks/french_bench/french_bench_fquadv2_bool.yaml |
sha256=q208gZIhyVIhJBmTifHqIU7uvqiaZytWXjMJ7DJgYDs
|
795 |
lm_eval/tasks/french_bench/french_bench_fquadv2_genq.yaml |
sha256=dKzGkaQ7q1AzXYTd7hfuO5e5i7GNvxGKPmZXGSQBFuo
|
1024 |
lm_eval/tasks/french_bench/french_bench_fquadv2_hasAns.yaml |
sha256=biqlBOhjSKaC_SHZt52svJx3JOZpvWnG_m7xuPYlGsE
|
1202 |
lm_eval/tasks/french_bench/french_bench_grammar.yaml |
sha256=pZWodzUjVehtrH72ybKAe-OHMfzPqUXyNAUcLNr4Dck
|
914 |
lm_eval/tasks/french_bench/french_bench_hellaswag.yaml |
sha256=G34Z4fuhPzgjFkiLa7z8ICsKTeXxRY-nHVoVuq-qWj4
|
489 |
lm_eval/tasks/french_bench/french_bench_multifquad.yaml |
sha256=CYZs72VA3K6fWwhixNRVLtEMDkEMx3wLjR9krA4VWfc
|
1031 |
lm_eval/tasks/french_bench/french_bench_opus_perplexity.yaml |
sha256=8JSlQtyFaDG-Lr9-iHxGNQHNy1fMVeH709jAMKeO_U0
|
619 |
lm_eval/tasks/french_bench/french_bench_orangesum_abstract.yaml |
sha256=VNWo2l94ZAIpznjz6ynG0zkEw4Opr5ss9AjiqSBJrbc
|
747 |
lm_eval/tasks/french_bench/french_bench_orangesum_title.yaml |
sha256=y-vdzx5PN2EOGtn6kcIZK_oX0sEBboVU9r04FdSmmjU
|
737 |
lm_eval/tasks/french_bench/french_bench_reading_comp.yaml |
sha256=XNwvApigBp5_VNaVDb9klKssvuJOa8Hb9WY0e0H-sLI
|
1286 |
lm_eval/tasks/french_bench/french_bench_topic_based_nli.yaml |
sha256=yiaqDEKPcqlt5OAZT8Sb-NPyuP8SH4Srfd2U0DhTAfA
|
970 |
lm_eval/tasks/french_bench/french_bench_trivia.yaml |
sha256=VNAot1Vd87HY53Uv9jtkIWNhvoZhIsAQNxYV-d6Gl6Q
|
921 |
lm_eval/tasks/french_bench/french_bench_vocab.yaml |
sha256=EzkjtId1fxmVtBM_vp1Bb93BtqMtYJ34bP8PXzTp_TQ
|
923 |
lm_eval/tasks/french_bench/french_bench_wikitext_fr.yaml |
sha256=7Cq4ZaJzs40HNg91WhR5wbqtpytNSGTh-3otQ1Lt3aA
|
742 |
lm_eval/tasks/french_bench/french_bench_xnli.yaml |
sha256=yBV2OTrOD3KwsIROrP8CugIjiIxGIUOAgTiC7ZUo1fc
|
875 |
lm_eval/tasks/french_bench/preprocess_wikitext.py |
sha256=5GhEyw_5gw66pUJfLhf9CXpt9aFnIDJASFuJDpKncAg
|
1753 |
lm_eval/tasks/french_bench/utils.py |
sha256=TWgvTaJhbMvTDZCx4Pr_nKBtBRox6IKI0b9ufdX3pEE
|
2750 |
lm_eval/tasks/glue/README.md |
sha256=4jhlrD7-16TPFdRgMW8PH50mVphJx1pSCeWkQhroOp0
|
4029 |
lm_eval/tasks/glue/cola/default.yaml |
sha256=_zUdXjmZ3O4hiZushOaNoOE9Y-tTrZHVODu9V_no_2E
|
390 |
lm_eval/tasks/glue/mnli/default.yaml |
sha256=4I2ExiFGobTPdv2huD49TEWBUDRad4VU4Se1wL2XAKI
|
309 |
lm_eval/tasks/glue/mnli/mismatch.yaml |
sha256=8h4PeAORdZvLDlydIQun3J7HEq-gEUuzQNWeKXU_FaA
|
82 |
lm_eval/tasks/glue/mnli/utils.py |
sha256=2zCZu6crR6KQGCIbvKmp1E8EO1v0-8nfk7gIFoe6iV4
|
232 |
lm_eval/tasks/glue/mrpc/default.yaml |
sha256=yGvkMAOUvsSGJIDxMCE6dalbZkbl7XRzmWKt9bMDies
|
387 |
lm_eval/tasks/glue/qnli/default.yaml |
sha256=eu50EGhoWPilUZnpvlX8qnAJyBwmKkJT1d8U1ilnOqo
|
347 |
lm_eval/tasks/glue/qqp/default.yaml |
sha256=5PGl1dGUMxXiGq8aFr3uAeqVwHEKpm4OuBIbILId5wo
|
337 |
lm_eval/tasks/glue/rte/default.yaml |
sha256=wNbGmU4MBJ6bdDpxKfhVCfUDa2kpYM1kqY_IKVjGxk0
|
325 |
lm_eval/tasks/glue/sst2/default.yaml |
sha256=khEHtTl1-3InOkquc34uHrTKldn2x8vbo-9Kms5WUHc
|
343 |
lm_eval/tasks/glue/wnli/default.yaml |
sha256=ae5deGBLQLo9q0UjEFTY8_GnMjm7XuCZXxYDvXCM6DE
|
327 |
lm_eval/tasks/gpqa/README.md |
sha256=DuaeIXf-u0vzMrfoH_i_nQBNt3dXQQ0VtE8SD-SynYQ
|
3024 |
lm_eval/tasks/gpqa/cot_n_shot/_generate_configs.py |
sha256=wRGHsDYz8it9vKz9aw_1zsv0cqIJwb9tc4_6AvWpQOo
|
711 |
lm_eval/tasks/gpqa/cot_n_shot/_gpqa_cot_n_shot_yaml |
sha256=JgshGutnYVfdAmPmuGiAz4XWQZYXcVKlqAymwM8jUR8
|
1184 |
lm_eval/tasks/gpqa/cot_n_shot/gpqa_diamond_cot_n_shot.yaml |
sha256=Ua3s6-BJeC9Iz93fTROSCLHzizr_FORkj9onkcnDiPI
|
124 |
lm_eval/tasks/gpqa/cot_n_shot/gpqa_extended_cot_n_shot.yaml |
sha256=XwUUXl8F7xN4el7ZHBQM1fEzvHQVdy5vsgW6h11_kCg
|
126 |
lm_eval/tasks/gpqa/cot_n_shot/gpqa_main_cot_n_shot.yaml |
sha256=8_SWDAVJeGvMhQfU2seWGi9sUrML6pPzYzm_DnCRTJs
|
118 |
lm_eval/tasks/gpqa/cot_n_shot/utils.py |
sha256=z6HIKm5JmMnT8aF5AQvIRCraTw5WsSelioIVAkPvwaQ
|
1066 |
lm_eval/tasks/gpqa/cot_zeroshot/_generate_configs.py |
sha256=3e5minE_O5a9NJG68oNUMa3igTbmaojKxIR9S3ZwHY0
|
713 |
lm_eval/tasks/gpqa/cot_zeroshot/_gpqa_cot_zeroshot_yaml |
sha256=cC7rARYCcxX4VoTiaLCGTN3oXyHRfcW-ECB-2R_LFds
|
1078 |
lm_eval/tasks/gpqa/cot_zeroshot/gpqa_diamond_cot_zeroshot.yaml |
sha256=pNhT5SWHyQb7GKbtjvdVlrmGooyGlsudbXj_zUSA0Y8
|
128 |
lm_eval/tasks/gpqa/cot_zeroshot/gpqa_extended_cot_zeroshot.yaml |
sha256=DLnfykKWvEKni5LzzBhAdTcJaxOaABH13YmbaJmobrE
|
130 |
lm_eval/tasks/gpqa/cot_zeroshot/gpqa_main_cot_zeroshot.yaml |
sha256=wza8sxqp1YuMpRvBxil2PqgYAltEK_1oBZWJQe8_NQo
|
122 |
lm_eval/tasks/gpqa/cot_zeroshot/utils.py |
sha256=z6HIKm5JmMnT8aF5AQvIRCraTw5WsSelioIVAkPvwaQ
|
1066 |
lm_eval/tasks/gpqa/generative/_generate_configs.py |
sha256=nsG56XiyztHj9LmKNtsD4gUmc2sqdpyFPS74SBBdKZA
|
718 |
lm_eval/tasks/gpqa/generative/_gpqa_generative_n_shot_yaml |
sha256=EMUOr6IoIXQ2OmMmHUigTPMWIq6XJ9AI2pMGKKAM-_A
|
1183 |
lm_eval/tasks/gpqa/generative/gpqa_diamond_generative_n_shot.yaml |
sha256=QH65eFCrkQn2jJHfjk0T5b9YbfQdUan9oHHgjugw1Dg
|
138 |
lm_eval/tasks/gpqa/generative/gpqa_extended_generative_n_shot.yaml |
sha256=xuQm0KRf_ZCyL5Id5KsadN4sZukKYDMtZD7v999HuQc
|
140 |
lm_eval/tasks/gpqa/generative/gpqa_main_generative_n_shot.yaml |
sha256=EJhKLKJ6oz5mP43jtKHfYcEeN5FY2gkxJHx8Y8Zsbq8
|
132 |
lm_eval/tasks/gpqa/generative/utils.py |
sha256=z6HIKm5JmMnT8aF5AQvIRCraTw5WsSelioIVAkPvwaQ
|
1066 |
lm_eval/tasks/gpqa/n_shot/_generate_configs.py |
sha256=t2Uk-17YcA-J2FC4Lr1gAIgc3t8HVIJUWcLlOB2AU1I
|
675 |
lm_eval/tasks/gpqa/n_shot/_gpqa_n_shot_yaml |
sha256=EBUTgMe0laCRXyxJ4IgC5Hv3soOf-GlwOzfYCYu7i0Q
|
747 |
lm_eval/tasks/gpqa/n_shot/gpqa_diamond_n_shot.yaml |
sha256=bRMgQ-UtIFrpftGglUfHLE3U0ZIT8xhRr2-Ia9S_Tc4
|
116 |
lm_eval/tasks/gpqa/n_shot/gpqa_extended_n_shot.yaml |
sha256=80_VODHpsRmTLNdNl7LjbBuFXDeexymqiwBak6u2zA8
|
118 |
lm_eval/tasks/gpqa/n_shot/gpqa_main_n_shot.yaml |
sha256=UgLjr4n53Fx2ou_9M8IyKkKO8dX0Am9kHlS04UMaQwk
|
110 |
lm_eval/tasks/gpqa/n_shot/utils.py |
sha256=30C3EL9SYATKhzMvbDhpZApA5VTHpTze9nGFGrxekeY
|
1016 |
lm_eval/tasks/gpqa/zeroshot/_generate_configs.py |
sha256=Ue9UIgZncdmXr5C6LwhruUGmM_JLELebuobsVj5jjN4
|
709 |
lm_eval/tasks/gpqa/zeroshot/_gpqa_zeroshot_yaml |
sha256=OdlPNGvrzkN9fVZX-ZBqmKb-31X0Ltpo237oX5naUz4
|
641 |
lm_eval/tasks/gpqa/zeroshot/gpqa_diamond_zeroshot.yaml |
sha256=I9D-hFnOYwYbkgFqmcFKosDdcwBgqI0bufxeGhX4ZQU
|
120 |
lm_eval/tasks/gpqa/zeroshot/gpqa_extended_zeroshot.yaml |
sha256=_4NFVTE2yJCEfxx8dWPsAEzO43JmidUpfGuzVBL34gs
|
122 |
lm_eval/tasks/gpqa/zeroshot/gpqa_main_zeroshot.yaml |
sha256=LZE_1k369Pdvf9ftK2yegIAMBIM6lMK1sk8E1t5DiDY
|
114 |
lm_eval/tasks/gpqa/zeroshot/utils.py |
sha256=FuEbEyXiqSXSi_EVkHpLh3muBJ-vib1cwgCXRqt5K-g
|
993 |
lm_eval/tasks/gsm8k/README.md |
sha256=UDYib3sADm37wgpYMNQkRXfmaqJJDVqn4ioy9F4GxP4
|
1950 |
lm_eval/tasks/gsm8k/gsm8k-cot-self-consistency.yaml |
sha256=F_FPBcRrPlTXwLewgkVuXFFa0we5yqJU9aBUtqelMlE
|
972 |
lm_eval/tasks/gsm8k/gsm8k-cot-zeroshot.yaml |
sha256=cMJVM5iGAK7opf_1MfG6b7W-aKxCdY3Eo1f6cHzpocQ
|
1020 |
lm_eval/tasks/gsm8k/gsm8k-cot.yaml |
sha256=-m8rNssb5OOsK1OgfY4-YcSJaWgvGEWQmDHggOTBdYo
|
3122 |
lm_eval/tasks/gsm8k/gsm8k.yaml |
sha256=527IgNoIsNj5zgxw6xgOw9rvczY_4RjRsXv4bMTbYx8
|
1009 |
lm_eval/tasks/haerae/README.md |
sha256=jiCz34BnWHAs2tMvA58xqLSXtwStmKc-XCFMLzwH1YU
|
3004 |
lm_eval/tasks/haerae/_default_haerae_yaml |
sha256=DC8BBDQXgVDgUIcYpGONe0s8HKFNK6iJyy2ainmAjJU
|
396 |
lm_eval/tasks/haerae/haerae_gk.yaml |
sha256=IgyTjycO49Kxeh2jyR9mXvA9nfM8VarBqxPPt9jEHRY
|
105 |
lm_eval/tasks/haerae/haerae_hi.yaml |
sha256=2czT8etaPzTU3z2fjZ4sWGsd-a7npGmxikb2ydY492c
|
85 |
lm_eval/tasks/haerae/haerae_lw.yaml |
sha256=EcLbjBSEzzPwaobX778vATAbL_85WHKS5WBMyiS8ro8
|
90 |
lm_eval/tasks/haerae/haerae_rw.yaml |
sha256=aRQQ64_aCJyhU_EEV4Gj9W2F4_bPLyV-ohzksz0NT6g
|
90 |
lm_eval/tasks/haerae/haerae_sn.yaml |
sha256=oV4xR4ME9qy9q25jiKHrXbZ344F3MEWoza6M_6-9KW4
|
113 |
lm_eval/tasks/headqa/README.md |
sha256=HGBlwCx5skNA9GKsXv59G3s-08i577g4QSgv2sQrK5s
|
2582 |
lm_eval/tasks/headqa/headqa_en.yaml |
sha256=82oeoQphLobZWuix6pZ7SsiGrKC88VNFt6tvL5BA18U
|
576 |
lm_eval/tasks/headqa/headqa_es.yaml |
sha256=SKIFepRQ_qX9euHAWhk0g8sm3OYDfaei2uQUpGfPWu8
|
57 |
lm_eval/tasks/hellaswag/README.md |
sha256=0Sxbs3jgiuWJFMB0onpY-vhTxCZMWbDke8ElRFsiLfY
|
2710 |
lm_eval/tasks/hellaswag/hellaswag.yaml |
sha256=tw0XK_sIYlT-irK0ekusP5FntQDzm9w8FCYc1Il27bE
|
476 |
lm_eval/tasks/hellaswag/utils.py |
sha256=B9I7YLKPKk9ljc-EQGI6Y_5mRIVM6bhGoRTd6YDcEhQ
|
717 |
lm_eval/tasks/hendrycks_ethics/README.md |
sha256=CHqVUCYMuODB2-sKYJWL_DHBAkMww7dEkVA4WXHDWVo
|
1768 |
lm_eval/tasks/hendrycks_ethics/commonsense.yaml |
sha256=9oL762lPea6DtRcmV9scrHx9I3OHjXzjR-qdTqmXQMw
|
344 |
lm_eval/tasks/hendrycks_ethics/deontology.yaml |
sha256=oQHWZI1TzTYJy09-avPkP-lPxPyP4sfalpmPI6kNYJ0
|
357 |
lm_eval/tasks/hendrycks_ethics/justice.yaml |
sha256=3wWZqWWvkGHmixiU_Kso-J5unv7Rb7PKORU3VlTjS1g
|
288 |
lm_eval/tasks/hendrycks_ethics/utilitarianism.yaml |
sha256=ZiL2s0rFWLuuoeD-WTZTTbSQGjfnR5VoYaEQdp8Qp-w
|
280 |
lm_eval/tasks/hendrycks_ethics/utilitarianism_original_yaml |
sha256=5MHxvjLg3ag-KHs1xznqViyZufFevLIYby-Isof9D0o
|
587 |
lm_eval/tasks/hendrycks_ethics/utils.py |
sha256=TYz5SgyhBjHVOjCMJCCBMVKexOHJwi-NBDvHE4qAoB4
|
691 |
lm_eval/tasks/hendrycks_ethics/virtue.yaml |
sha256=gppOr26TSaJD2jlxsjugNdHKP1pj9IBHkJdFB4zs9DU
|
297 |
lm_eval/tasks/ifeval/README.md |
sha256=Z1lFazEwmAYW4W9j56CIp_mw50Pp5HBYnkeCCcZZZCU
|
2326 |
lm_eval/tasks/ifeval/ifeval.yaml |
sha256=MmTQaysLHMJ7tKttc-zNKaSb01d0B6vLlpmpzuwy5m0
|
763 |
lm_eval/tasks/ifeval/instructions.py |
sha256=mSzvfVjKRJDcxy7sRyHCcEvhpbovKfo_lgfq8Dr6YJs
|
57031 |
lm_eval/tasks/ifeval/instructions_registry.py |
sha256=7NZcRmv51mHzna1HbJQAPthYVyYHPUEyWNLXi20fPLs
|
7236 |
lm_eval/tasks/ifeval/instructions_util.py |
sha256=EybSWJEzXYb6GnCzn6FOpG86bwVJKUfY-CkcG01S17g
|
26066 |
lm_eval/tasks/ifeval/utils.py |
sha256=NWiG271kbkRNrQLpj5pYRaT7-9FRO7CZg78YArdb3uk
|
4895 |
lm_eval/tasks/kmmlu/README.md |
sha256=ZRF5WJErXQVa-xk3Ye2muCBgUd3HZPMa_uJFb59F8b4
|
3409 |
lm_eval/tasks/kmmlu/cot_hard/_cot_kmmlu_yaml |
sha256=pdg--vOX8B0kEwgB352gZt3zek44hAG3S-4pkNjudt0
|
786 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_accounting.yaml |
sha256=KRhNmFwrL6xPUoFMLWIbzteMOxThsscEcN9AGk20B-k
|
9284 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_agricultural_sciences.yaml |
sha256=Y9MitWaO-nuClRQRj1Apqea1wiZnVXLgJZLwFjU9uQk
|
8985 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_aviation_engineering_and_maintenance.yaml |
sha256=TnwXJZoec1e3uWMKEyhKqJABrssBBVvxnb_9EH92hZI
|
9778 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_biology.yaml |
sha256=2X3yO-uPPk-tIwKPR5fInxVKaACH2KkORk-kTwMbjOI
|
8100 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_chemical_engineering.yaml |
sha256=W0_lOef2OLIty11pUz68fh_STj-dUihXGLIkuYGMQ_c
|
9391 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_chemistry.yaml |
sha256=PxJFk33Ye_Un8c-D0hcm4CwRSme9MVXTm-NGVv9WRww
|
7445 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_civil_engineering.yaml |
sha256=Ty6sZdVjyRvuKFerYpVcMKt-a4pla_DmD0f8AfGiW4k
|
11857 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_computer_science.yaml |
sha256=8TrxdDUdI1lo6fDh0zSNW4fvjOVi9z1IsVsL67OxRjw
|
11159 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_construction.yaml |
sha256=KUlEoK4AAvqbPTvtLRK42iakZ73ioV2KKwdA3nWoG4E
|
8995 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_criminal_law.yaml |
sha256=zkLT-IpIBfQZtiXC_L1xae3KJkLDAnSWCV3hJ5uC5g8
|
14506 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_ecology.yaml |
sha256=wTUh5myc4pPkskpvug6oX-SbQKw-7wvxkKQWylL5PL8
|
10516 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_economics.yaml |
sha256=5xnQf7P1Zhju8c9W-sqnrBQxggKm7ACH35guxuadlp8
|
10363 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_education.yaml |
sha256=hI5z7zsDPBahPyGbrbFnp4xrZtkTYKYnenFvqgGx3xc
|
10547 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_electrical_engineering.yaml |
sha256=jfpkrwSLxelwmyyy3A6ToMXfOD9UaHCmIQjz-szXeYg
|
10514 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_electronics_engineering.yaml |
sha256=Rt9wttimWEKiZzX9PhzUc88K6amROVEU3hBaV3DKCB8
|
8362 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_energy_management.yaml |
sha256=mQrCUFGZMLtxzwP35hvZkzOQctw-c4YJc9lxk03zuU0
|
9265 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_environmental_science.yaml |
sha256=X7FK30u3HC8FP1NpCQr_LujE2tFmQrVH-zyAwfbYSeE
|
8631 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_fashion.yaml |
sha256=6FrYVoSdTdTgx96ilTRilLMEiwsweDeDBZVeXRDMcoc
|
9221 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_food_processing.yaml |
sha256=VCAtA2-G6lP6D6HeF2p_Os5-pT7lbT6elTG09e6ZnGY
|
7823 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_gas_technology_and_engineering.yaml |
sha256=Okbh92bdzSafyRQn2IG4j_Ls1s_6_vGGF97PRCNzca0
|
10061 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_geomatics.yaml |
sha256=1j8pHC9FyLX8zfcXrjlZmBZ4oItGyINqkvlQMuNbFeo
|
7587 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_health.yaml |
sha256=6yXVDrTr95eKQ058qsqJQjzrTUSkB6Siyl_A8NcbhxM
|
9963 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_industrial_engineer.yaml |
sha256=kNJYLQKUeq0p5zcqtq8vMbOSyjMygCqVq_pKYGMs-kE
|
8522 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_information_technology.yaml |
sha256=MjIGuHi5VGx6eirW7KIJsdeWr7wDMLSja5BALUq9HZU
|
8576 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_interior_architecture_and_design.yaml |
sha256=I9yBK33nVwWuLkAWdTdiu8bSeWdLUV_iZm7IkK5cFZo
|
11727 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_korean_history.yaml |
sha256=ODW2SuOb8MpJntGQAITLpGsdXYUneJD7buuPfBti4bM
|
12087 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_law.yaml |
sha256=qok2ooaMe1IoBss_x61Jsh0eKt8LG_aLr2Kub7cP9oo
|
9454 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_machine_design_and_manufacturing.yaml |
sha256=fN0oGK-KJsYUUf5HDZhu14s_WO9llEseIs0U8hm5Bwg
|
9314 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_management.yaml |
sha256=uhGLV_AZM8fBIFsd4bQOF8Gl_T7spd_E9j6q842LXG0
|
8546 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_maritime_engineering.yaml |
sha256=YCWbD9kHKSAHUTLwLZWAvT70JqIJzSNEQJ-wsWIBVOY
|
11362 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_marketing.yaml |
sha256=ndkLAlvwLeKWLDUhRPKc3DEQhutWXqMMJpETdXfl6aY
|
11007 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_materials_engineering.yaml |
sha256=GBXfxz9-zPCDANgSUf070rVH0Ol0cAFV2wDO-1Aug_Y
|
9263 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_math.yaml |
sha256=rHdoZBGg0TgCCDjkprpnDnlJFUvnXspWVI3cNiJM9d4
|
8620 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_mechanical_engineering.yaml |
sha256=yr3x7E3ptUH31oAmXSUDTSyyE0Zs7B4tH6otkSK2l_M
|
7974 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_nondestructive_testing.yaml |
sha256=sq25_PeUGb2SnU-fZzHPg970SnLimZdLn5wJgn8dBWA
|
10616 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_patent.yaml |
sha256=IZ4PreafQcIqoJPKIv9ZiGMlSA_uV10msBD8CJFA5SI
|
16072 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_political_science_and_sociology.yaml |
sha256=1M0ZbkIM5aQe4HH3_thW6P54x6Wu_T4MplvCid6DU3k
|
11282 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_psychology.yaml |
sha256=q7r1phCEb_OHR7hCYaYOz8RcuqhMNP4zyvC6GUWqo_U
|
12330 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_public_safety.yaml |
sha256=tvQSEnJR1dSFdpb4OzSLSRrnabriJmwSreeJEN42XBI
|
12304 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_railway_and_automotive_engineering.yaml |
sha256=YWDW9hZlZgr-EkC9ogOTGA9yQyludbMghx9Y2oPzFr4
|
8844 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_real_estate.yaml |
sha256=A_mJ1FJ6cHsB8boabJpESYrEazH9D9NS-rMGuDnxVsU
|
12128 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_refrigerating_machinery.yaml |
sha256=OaTvBgqnq4OZc_cESHoEH4cT_wM01P8Pm5xshTcLe24
|
8399 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_social_welfare.yaml |
sha256=BserSToLaWGG8nICc7UW2NcxH1yBX5n4fYrVfBBuXsk
|
10943 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_taxation.yaml |
sha256=y6mjr791m4NgxpYtSlx3zpWwQUv_u474AnO59qM35hg
|
14853 |
lm_eval/tasks/kmmlu/cot_hard/kmmlu_cot_hard_telecommunications_and_wireless_technology.yaml |
sha256=PlD2i2otpgc1z0XhhXsmFVHeN-5SliIbVf_-qU3pmcM
|
8801 |
lm_eval/tasks/kmmlu/direct/_direct_kmmlu_yaml |
sha256=rst15H--77YggX8WcOaNxDp00hQrZvtdOhPSe5vyjcE
|
586 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_accounting.yaml |
sha256=s8Q7u4IIavzezqVRdqnPvOMBZKudl3-QU8g8FXtfVmA
|
83 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_agricultural_sciences.yaml |
sha256=VXY7mCusrN0RkLa2L2we2DSKLA3S_1hqEmoqDdlv3xY
|
105 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_aviation_engineering_and_maintenance.yaml |
sha256=oe6jsBy3PbSKuDC7kMzMVGxtNggf0wPrGKdcPi2Zd4A
|
135 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_biology.yaml |
sha256=WL5-7uGWR8k671v6ZsAkaHM7ZyfiIv3w3Ll44yHajQo
|
77 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_chemical_engineering.yaml |
sha256=SmGBX9WrUMkKbbfr-yJ4cr5hpDhTEZ26ecQmd5BtOJA
|
103 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_chemistry.yaml |
sha256=tZ85jUT4UDRFS-LHYCjJEX_W8Ls2Idlt5Jh29CQBb3o
|
81 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_civil_engineering.yaml |
sha256=0zK5wTQNhEKfaFI85vHfWaL_ryPawXU62p726BKbYrg
|
97 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_computer_science.yaml |
sha256=JksIR4Kv1U-lXfkmmzYkpvyXCSb-fFVTfGgowaqMNlE
|
95 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_construction.yaml |
sha256=03SU1aSEmqkpOBDdaVqhcHVfzCSWpk2-H9QahgnsTsg
|
87 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_criminal_law.yaml |
sha256=3e-ibeKqCQj_dD9uIYfy7fD8yNrRCNNvlj9yH413BoA
|
87 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_ecology.yaml |
sha256=ILCnTDQDI-in_aeeOpXyH0tSrGzJV2Ry9FPYjtcFeyA
|
77 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_economics.yaml |
sha256=no_J0aYbVM37XdOQiOYQJabnrCN2lKr55FmYZiorvDc
|
81 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_education.yaml |
sha256=WdDbsh92CgTimWAKSzLMovUgqw2q1Up1VUG3rGK_6U4
|
81 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_electrical_engineering.yaml |
sha256=kTvVfjkB-xiyP3gvGskNVNLKe3exjSN3IfJx1hogDZ8
|
107 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_electronics_engineering.yaml |
sha256=FORtpjPQNzZLVoOg_NL06IUNSrAv2TC-gVJDqAkyv60
|
109 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_energy_management.yaml |
sha256=px38ZJdmlrXR4heYuu7tCKmfIxFNs7q5A0Sn9IKdCO4
|
97 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_environmental_science.yaml |
sha256=cYp6UHEUw0gF6twqqdU6XHoia2aZ2mdM4t8EeKVoPV4
|
105 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_fashion.yaml |
sha256=3TH7EBvRcdMHENZihcrfhg52G5oeS-XJoeBeIdBwFqU
|
77 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_food_processing.yaml |
sha256=UgdQ1s5bbt60vU9rZvXxmjlDsebGo1XgZ1wm2AcIz2s
|
93 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_gas_technology_and_engineering.yaml |
sha256=r3ixx8LSfUaO5HJiM_P74EmAUJ2K6xa2bThZve9EckQ
|
123 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_geomatics.yaml |
sha256=ayYsoAYd-s5imw9Y9xqMA-UGzKTaOz8btN25oNGn1Pk
|
81 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_health.yaml |
sha256=au5qd1ERCyeg5ER5RK-Gwuup5OjcCEtdf7YrGffvDtQ
|
75 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_industrial_engineer.yaml |
sha256=RFT6Z9ckjSpRUhDSuIybw_3JQDWkEMN4oQPyPa5EHl8
|
101 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_information_technology.yaml |
sha256=XXaPqHonGcTiBf62Ro7AAwyGeRoUa-BLnVh4XW0BfX0
|
107 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_interior_architecture_and_design.yaml |
sha256=N5eVgwChbU-uiD1DSG-CLsA6QPlokFs3V0HzFZMeevg
|
127 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_korean_history.yaml |
sha256=A4qo57qWyLD2x8S7f4_a15tyvLRC-PPT3YP7xTEm6kc
|
91 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_law.yaml |
sha256=zICpp74MIKXh9Fjno2Ulqgu9XozoTT55KNGepJ4DZnA
|
69 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_machine_design_and_manufacturing.yaml |
sha256=66A6PujfcWGoIPeN47OqkiViaTDXURXe6NLIVzbpP4g
|
127 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_management.yaml |
sha256=JALGBtgrQuD35mYEGhkiKAIWBnzJRhY0lkYyVuNN8mQ
|
83 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_maritime_engineering.yaml |
sha256=EH4Shk5U-D5dmJh0gQAM0kcEkXeB33e7tYprbyvvrO8
|
103 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_marketing.yaml |
sha256=APDXSSwhwZDqJZG51LXfgcl7Rtqyhrihwgp_K-Ja1Jg
|
81 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_materials_engineering.yaml |
sha256=nH8eWSCiy-twUP8YLWAkqjSpRr79eG-3KF5t-1K3tg8
|
105 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_math.yaml |
sha256=212LFb46uqXzAAmHRYNKIkd-H21-z28BfRQ92WlzmwU
|
71 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_mechanical_engineering.yaml |
sha256=leqavhSJMGEvVGi84AkcQK8OQF-c4M0ncx2cY9JuqJc
|
107 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_nondestructive_testing.yaml |
sha256=9L3qcZ0qCQHEVkM_MlTNYrQL0FgWslwjc83CFkDtD0w
|
107 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_patent.yaml |
sha256=EOssq7DHAE6Pd26tW80H1JvOagUNtVFcF5xGpNi2jNw
|
75 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_political_science_and_sociology.yaml |
sha256=D5oPZclcqmewurcrVqMfWxSp97Sz8VWNXu82_-YTqJk
|
125 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_psychology.yaml |
sha256=tEnPOspom5FTZhPXYQxj6bLj-xmFN4YyEHTpD8ZwwZI
|
83 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_public_safety.yaml |
sha256=-vHSItk8gdwU_biw9_olibgWruZAog-KHJ9jdn3t0DE
|
89 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_railway_and_automotive_engineering.yaml |
sha256=qvbxl8R73Gbg6eeiU0OOlhbKkDJCfVKKjmLGSLF2kl4
|
131 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_real_estate.yaml |
sha256=9pOr-QnHyTRgSm6-3PdvLOh_xdH35gOEbWpJEVqhir4
|
85 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_refrigerating_machinery.yaml |
sha256=Nj9zGdHJZEEnPz2rcoo8oFbNDhiTDtVLYnhYicjfWtM
|
109 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_social_welfare.yaml |
sha256=0wcc6fYPC62AltQDV2OPQ4GHIuP4w2D15T2lDgXHKQU
|
91 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_taxation.yaml |
sha256=ok19bSEuMcpBSeHUNj9JCrX_PfUfAfPu3XnZxmey5T8
|
79 |
lm_eval/tasks/kmmlu/direct/kmmlu_direct_telecommunications_and_wireless_technology.yaml |
sha256=ctGyLo3PQ6GZr5-Ik-QqDrBJw_Yukj6nv-a87bKJkLM
|
147 |
lm_eval/tasks/kmmlu/direct_hard/_direct_hard_kmmlu_yaml |
sha256=fwiCNKSAnF21fMa-syxWPmum4fXTcRUk1dbWCyBSZ_Y
|
596 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_accounting.yaml |
sha256=YtieMW1U4fnRqVqpze_VEwJnFyYCn_Ep8_GQVQLU4iA
|
93 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_agricultural_sciences.yaml |
sha256=aJdRL6GiL5Nt-zedJ-8AtWrCGYEfwBWoKENM-Ro-TCQ
|
115 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_aviation_engineering_and_maintenance.yaml |
sha256=CY8eW2fmZlnoZvw2wTCB5uVpmIuA49EK4jr1GI72CN0
|
145 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_biology.yaml |
sha256=QWWwYjsDAUbpgkEbAiGTRraQGiVm6CA4Q5QKyGccrJo
|
87 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_chemical_engineering.yaml |
sha256=NFuCWse1j9DorRj4k6HAxZNRiHasVrRe_z9p3k5wLE4
|
113 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_chemistry.yaml |
sha256=3vVyTWQ4cDULfNC1bEB4LJ_kGhFRzf9zJXZwaaiPxuo
|
91 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_civil_engineering.yaml |
sha256=p6n09u90WW65g4rWYCTUmigvxYBhKsRW0ExLvxjgEb8
|
107 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_computer_science.yaml |
sha256=QKHGaYvXLpPMwhjWJHwKA5hfgnQFFApCIpkZLHjqQps
|
105 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_construction.yaml |
sha256=AlaO-CtVBWCPC1HSvOrgkWzB5xtfVJrCg4z0TvqC7hw
|
97 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_criminal_law.yaml |
sha256=O38idbXibN-PHOPM0IVLWrH52npOvFgPK5C-ZmN12qs
|
97 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_ecology.yaml |
sha256=B50CWfQdVlKPGYEzz9IIn38sn1EWQ1hqzOmZL-RKV3g
|
87 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_economics.yaml |
sha256=-YjWuF_7eAd163x0BSaW-7DLgniOsH3jKkrkVOm8Ecw
|
91 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_education.yaml |
sha256=cMnKm8epRW0jNHtgOr-4T_huEUC222lFGTuPjmcWy-o
|
91 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_electrical_engineering.yaml |
sha256=tGxJ0Tf28L5WDujFs1YkOu5VXjPKfMN9r2w-k4b8ZCA
|
117 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_electronics_engineering.yaml |
sha256=n0cAac3Wdx4XlDAcOsG3atQo35W0ISMrVkqkHfp32k4
|
119 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_energy_management.yaml |
sha256=EwAlD1KTclde9Yjmnk5dG_SkS6CAuBVPdJAQ0oPgRu8
|
107 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_environmental_science.yaml |
sha256=p6aocihAudx0ytxfgKWb5Q7xhatemz1NS0v2Htw2Nbk
|
115 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_fashion.yaml |
sha256=nWIu6Xz0JnAWCwDUjiWW4cU_Uu5QAokJlYoDpGsucME
|
87 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_food_processing.yaml |
sha256=3LHcLpZYRvYgNZE_kuIrT-k1TAXYBbEZXybEnPd5HkM
|
103 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_gas_technology_and_engineering.yaml |
sha256=0m0A08E-d77LRank3SumJntiXyfbNRWjZeUJOUd4CVg
|
133 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_geomatics.yaml |
sha256=BnLc9o9TWQocf5ZbRt3hWA5OcjqGhuVMPAR8dhmb_GQ
|
91 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_health.yaml |
sha256=GdjPYiKtpGi26zgVYTPuitFaU9yGNa8NBOqj-E0Po70
|
85 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_industrial_engineer.yaml |
sha256=lpHTF8psfz5WfQz1qM0dMqStZ6GIKwbUGD1Y50Qfh6c
|
111 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_information_technology.yaml |
sha256=Uq7B2vROL74MDhO9fJ3mpF7SFGVohptVPgZg1luPdb4
|
117 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_interior_architecture_and_design.yaml |
sha256=JvpmkpGWliPuh99xHCVRhPmgKF5HBcZUATSxW_hy0xs
|
137 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_korean_history.yaml |
sha256=ZqqnSYjsEXKO6DdXPuBSeywdHlJetfXRu-MpbO0w7rg
|
101 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_law.yaml |
sha256=SrI2Ho1OxJgH5MbgZBlz2ZRp_qffFxprjBZIW5o-qrs
|
79 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_machine_design_and_manufacturing.yaml |
sha256=JDL2o_MmMjT2vF_Ldbq_v98veQFYFEIKGgzXnOkudxQ
|
137 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_management.yaml |
sha256=Ze9Ox37Kzms4k8fwFhuiRYdcDYWaaO5tTb_f6gDw_sY
|
93 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_maritime_engineering.yaml |
sha256=IKkZopT2LfZWbYyus2w6bgJWNLiUst5o2HI3cOOhBqM
|
113 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_marketing.yaml |
sha256=Y5hixAd3POjHUJrsSmrFk40XHZkU-QV31V0a8zTxQZ8
|
91 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_materials_engineering.yaml |
sha256=dNOP7jZ_IUgorj3G7SHnArzbNgIT0y9lJhDQ09SftmQ
|
115 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_math.yaml |
sha256=pxyZfPkkkz3grWK5lk4PPJObg1WjFz3iCNxJ7FKofa0
|
81 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_mechanical_engineering.yaml |
sha256=Z-fXz_LdAQz0RG5nqo3N_R4WsbusCuf0imIURMzx7DQ
|
117 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_nondestructive_testing.yaml |
sha256=JGlXHBFpcUB-7IYmAEh5n8jcNCbaJInZvWqRC7PLlwk
|
117 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_patent.yaml |
sha256=oIvyta9dUsX9aL48XTkhMXrtbDrlAStKqg8KourU8tc
|
85 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_political_science_and_sociology.yaml |
sha256=zTuHnAHYA-Jg9xCKtIK_2-8oYS9op839G1LDV2cFLEc
|
135 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_psychology.yaml |
sha256=zzeQFKGcLqEor8fDFUqc_eJMrl1X0qg7ats_jdtW0wE
|
93 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_public_safety.yaml |
sha256=XTEuFZKG08NEM7YXn4QkJRGSKqiNTvFFihot1kelbnA
|
99 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_railway_and_automotive_engineering.yaml |
sha256=zeTr9E6ZxPsy1SBJ5CLeoduwkMTZuc1qRUJekTykFHQ
|
141 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_real_estate.yaml |
sha256=x84oM4-0zOP8xTjAF3SJbvYQ1jjBfJeKiX8mW-bR5-Q
|
95 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_refrigerating_machinery.yaml |
sha256=TwBvOTK6MV1C0FXlCY7MbmKM4W2xdDgpQ6PDtPv7qUE
|
119 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_social_welfare.yaml |
sha256=TyvaCA-rb-_BnRgbSKqvCBYBX2wWq_yjuigL6jn6mII
|
101 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_taxation.yaml |
sha256=KEpus1SLUr7ep6VMH4La53tALFLEKJ4biItu5j-0MK8
|
89 |
lm_eval/tasks/kmmlu/direct_hard/kmmlu_direct_hard_telecommunications_and_wireless_technology.yaml |
sha256=UjNG8CO7HAoXedSRGHwo9Otecv92wsaop7dTmqYEfX8
|
157 |
lm_eval/tasks/kmmlu/hard/_hard_kmmlu_yaml |
sha256=ClcQFAwA23dJselcwcJ7wHfGUBv2-D6-CK5B-4Wkb6s
|
463 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_accounting.yaml |
sha256=e9ev7DQe4G2GleXWPjD_trDec8z5sH4YFEMazXoloZI
|
79 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_agricultural_sciences.yaml |
sha256=ChU4TDE9AJW1NOHDtLSz7pdk6OQJmkNQ05o5D2i3MYE
|
101 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_aviation_engineering_and_maintenance.yaml |
sha256=vPeMpeBAKaKEIcWU3DJg01T09BpJQhw3LqVaCR9kn2Y
|
131 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_biology.yaml |
sha256=9UoIsVgtFBwjSvgfa6eNM8LkDsgxrtxxrdGgudezCFY
|
73 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_chemical_engineering.yaml |
sha256=ckpTGipWfgGR7A-xZ5pvUCtbw-JvSE6o1by5KjJkzyQ
|
99 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_chemistry.yaml |
sha256=d6iH4eJ4XnCmLCDDF5aO9avmYm8d2n_qdqWjkTPJgyg
|
77 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_civil_engineering.yaml |
sha256=AW-CMC5f7MAM0GvKbPvcvy26eJVCmGlYFf8a6DQS6WY
|
93 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_computer_science.yaml |
sha256=4Y66bFOBCF2ujCib5MseIbuCpcT56R4wz_44wuVFvQo
|
91 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_construction.yaml |
sha256=D-PElzFYMXZl6hpe4X6K35Kd79cTblBmR8-N9g2riM0
|
83 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_criminal_law.yaml |
sha256=6Jbz7hP5ZJcOTJZDEWy2i4w95qYcSeXdNVnZVSqqmIs
|
83 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_ecology.yaml |
sha256=Ai0-oJ1wWs1j5wLBbvjRnbzACaWL5_2EQzHx-JbduBE
|
73 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_economics.yaml |
sha256=lWWKu3fy6EXmQtJyi1L-7k5pZAgA5XBQlXrmDnFtxWk
|
77 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_education.yaml |
sha256=YHH3LFimutZd8Lb4zjAJ4DKK7mTpfeQ2CCLLPJGwHzc
|
77 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_electrical_engineering.yaml |
sha256=fr0YMWzEOwflcy0JwCUq9CAT8WWymthH6CxQSWSZu9c
|
103 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_electronics_engineering.yaml |
sha256=9v6Tqzmjq8Xo1_7CqcfAscrM4QymWMAFy-ObuPdpdZg
|
105 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_energy_management.yaml |
sha256=BQerrHdSvHDuI6ADbjpkr1O4OUyF8nqY-50SJRS9LHg
|
93 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_environmental_science.yaml |
sha256=TFXCl2gB5xJrgLrvl9vvQReKJ5F0VnYEFGbxE7xFl5c
|
101 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_fashion.yaml |
sha256=5uTrvzrhA-PZuL1dTkUbz6z0VntoQ4a6TSLOFBSMaKI
|
73 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_food_processing.yaml |
sha256=aCuMtZBDmLimMlAArfXYRCA8DeqfTiDjZHANBknkrCQ
|
89 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_gas_technology_and_engineering.yaml |
sha256=r5MHhAM9zq-XUPS529Z2CeJ49ezCixdBcdFTy4HYBfU
|
119 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_geomatics.yaml |
sha256=xtRBGW2w3qOlZFEQmClU3rxEfRWebAuT6nllwJiDOHo
|
77 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_health.yaml |
sha256=IJ4ZBNFrZKYsTHQSdoJUA5HQtMiXCMd8TJVQDUXAHRc
|
71 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_industrial_engineer.yaml |
sha256=kIPwF0kExXT9HqkVaT1Ol_gOZrLqosr97PyFrUmL51w
|
97 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_information_technology.yaml |
sha256=VmtYqkQ1_IDUNcpTRP_XJUDYnGrC4zC433TwMnDryug
|
103 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_interior_architecture_and_design.yaml |
sha256=IHmQFDw9EXXOdFv74K1rvKREZcvZV95CDD9BwsNJ7ds
|
123 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_korean_history.yaml |
sha256=jTE1drp3RKq_1gx3XA7CUfGJ8agKIkE6GFa6h0akYtU
|
87 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_law.yaml |
sha256=UfLqVEkqsTx1l51UYaRKVgh7sepRJoZwo2aVENOwhNg
|
65 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_machine_design_and_manufacturing.yaml |
sha256=5eFADVWfVB-Cy-72XhqqzjEhxShbG2I8lDl2jK30u-k
|
123 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_management.yaml |
sha256=hMXBRsiyWZtoGSMYem-s8pijoBcRVutvMIet9CPgW6k
|
79 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_maritime_engineering.yaml |
sha256=kFz40w6N6WqmS1cJMAhfZ8JCsfiAw7sEr6BvQmQW9T8
|
99 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_marketing.yaml |
sha256=OCIfF5i6V-xGi0H0CKtQvKxh_SHyg2_ENJwBxsnybBs
|
77 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_materials_engineering.yaml |
sha256=WXdXLlmSKIbEQLIkHDwvh6Wk0PEehHaVcg2d1dHQEc4
|
101 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_math.yaml |
sha256=ucRNtG9FYK9K98hEWkQyLvvClZrBdoPd1G5jkrkAoe0
|
67 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_mechanical_engineering.yaml |
sha256=BYwNAaaKiwemWOamYOLJRFnoLfMKJb8uv41ElKSxybE
|
103 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_nondestructive_testing.yaml |
sha256=-t_1hBnzBEowNcetO51e5Jma_utgkxxRRqgpB0Xdmc8
|
103 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_patent.yaml |
sha256=nSLXNhAvUD-pxlj_71GbEHYSR2ugLdaQRVQpnjet4Bs
|
71 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_political_science_and_sociology.yaml |
sha256=02Fvhoq8jGgOuYg3gwuS9f_oITydu_F7N9yhwLJ_k4Q
|
121 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_psychology.yaml |
sha256=svilfX5j0sx8dh7gNcT9dIa1Qk1KJEGV98-cjB-rUGE
|
79 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_public_safety.yaml |
sha256=1pW2TJeQ-aHniyGM4ADrRVpGAw4E6o6D096w6dBTvkw
|
85 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_railway_and_automotive_engineering.yaml |
sha256=LhrwEIVGmmWSaip0hJA0bly3q7BS6Yaafrm8qzYYIps
|
127 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_real_estate.yaml |
sha256=OZtCtywjduzRBdUijV0M4qO-_KPTddIlMpsjDPNUVCs
|
81 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_refrigerating_machinery.yaml |
sha256=H66JL7L3ftpHoQ51ZX2J-alppIlWkPZgqHvVilGR9NU
|
105 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_social_welfare.yaml |
sha256=GF-tgxVL4KRMPh4ihPwfrKeclnExZCR-nuiNjEQxLvg
|
87 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_taxation.yaml |
sha256=kcGOAtWNpdXJoNiSVRWHIAQ4wBfPc1GxV7an46B81fk
|
75 |
lm_eval/tasks/kmmlu/hard/kmmlu_hard_telecommunications_and_wireless_technology.yaml |
sha256=8XiVND_rRGyBmkPIiEl-R1MdzWyl9KySoU_TvnBG5BI
|
143 |
lm_eval/tasks/kobest/README.md |
sha256=cN-_ZRnv97G6XwjBXOQjjGkmZ7xWC_DSBqeG55pWd3E
|
1588 |
lm_eval/tasks/kobest/kobest_boolq.yaml |
sha256=lKVHvQ0i_k8DFSNZ_36K2y9R7e20L5Yi3g5or6dcjlA
|
538 |
lm_eval/tasks/kobest/kobest_copa.yaml |
sha256=a-ZbH0VnHBxdYbptgvNgLG-9XAGNMtST1dbMAi2EFYw
|
560 |
lm_eval/tasks/kobest/kobest_hellaswag.yaml |
sha256=5E1mspDV_AvHOuAbAvodkI3h9YyABBUjWLg-5Jc3kvo
|
623 |
lm_eval/tasks/kobest/kobest_sentineg.yaml |
sha256=BC9tST3rjUw5joW8STdI2wpDxriNRl_pSmCJ5Lpc4r8
|
577 |
lm_eval/tasks/kobest/kobest_wic.yaml |
sha256=28peMzeNU6m4vvSPtaAaAHY8qrSIa2jlOa56Jml8fYQ
|
562 |
lm_eval/tasks/kobest/utils.py |
sha256=A7NV9S5HQ_ONif9l7atxBUJQnl0nNXdQ-SnSkE0NI-A
|
1437 |
lm_eval/tasks/kormedmcqa/README.md |
sha256=3PvmldNDi-GHI3-ey1aKvJ2AhgjtcL6-VfaUuf7N1gQ
|
2372 |
lm_eval/tasks/kormedmcqa/kormedmcqa_doctor.yaml |
sha256=DMT0IBidQ_ui_ihi3OylsIPU_gRw5pQZTUFHJwkH1Dw
|
644 |
lm_eval/tasks/kormedmcqa/kormedmcqa_nurse.yaml |
sha256=hoDX0Ru1w28ybiXzKMh0qi3ghRZQGrczmOiUffl1UGA
|
642 |
lm_eval/tasks/kormedmcqa/kormedmcqa_pharm.yaml |
sha256=IamiqmaGYP9kxu9-t_eH4JvNYgHpzUYluGprZl3Smlo
|
642 |
lm_eval/tasks/lambada/README.md |
sha256=AO7XlGGY1Dch3ZC6km8CkfwpLiOvAdYbHH_YlEi2xEg
|
1186 |
lm_eval/tasks/lambada/lambada_openai.yaml |
sha256=pD6ORS3uLk6cqWHYu5dysPV53Qrb3Y8c-KtJ2bFORy4
|
533 |
lm_eval/tasks/lambada/lambada_standard.yaml |
sha256=2yH5TSDx7P7aUKJNruN18eiLifeQsi2Tc_MpdQvznkk
|
501 |
lm_eval/tasks/lambada_cloze/README.md |
sha256=j0ewRfQFxUQ6JsD-JGYp4oK1URb-uF1UGiQ-4cwYvs4
|
1934 |
lm_eval/tasks/lambada_cloze/lambada_openai_cloze.yaml |
sha256=aylvpHNoC2lZOJQIBBYwreqwWNGgMM3K7CuonGAxC4Q
|
517 |
lm_eval/tasks/lambada_cloze/lambada_standard_cloze.yaml |
sha256=Qb311jDoc38gNH1obwkpPARGklJUMvVMaXVXcjLYsxE
|
527 |
lm_eval/tasks/lambada_multilingual/README.md |
sha256=ggwX8LEo_cr1oT29CyoLptVbcTxCVZSr9qhOr3UY7RY
|
1995 |
lm_eval/tasks/lambada_multilingual/lambada_mt_de.yaml |
sha256=A3dzij8qTX7W-XZ1uXkMf7l7lPbe8Irr_fem4zQ34oA
|
72 |
lm_eval/tasks/lambada_multilingual/lambada_mt_en.yaml |
sha256=zZSLJ_eMVhTgLF1t_-x28SzkN62WDCcoGSeKz0Xgtuw
|
505 |
lm_eval/tasks/lambada_multilingual/lambada_mt_es.yaml |
sha256=3cWtUCRNZWeGp9bIUU-uJcxCeD7iyHwUkAkdAFMFIxg
|
72 |
lm_eval/tasks/lambada_multilingual/lambada_mt_fr.yaml |
sha256=Okxnj-cxPcEsEIX0vc89Uih-szW7wqHY2SAcdi675Gc
|
72 |
lm_eval/tasks/lambada_multilingual/lambada_mt_it.yaml |
sha256=DtT68Pbs0fCY8oJlKQwQdO0pgcqNPEshYFQppA9RDD4
|
72 |
lm_eval/tasks/logiqa/README.md |
sha256=Iyrf8c8F53A1eYqaDCb6hAm3_Sg_t47gZbOI0BjDKAw
|
1657 |
lm_eval/tasks/logiqa/logiqa.yaml |
sha256=J9PMnhvefAZiF-i7Qm8TVndnoJGjVfrEMQPZKZq33a4
|
578 |
lm_eval/tasks/logiqa/utils_logiqa.py |
sha256=RjmfQAZUadI0wMnh7z3ptn5Q1f4cLEEwYH7aLdomgmA
|
616 |
lm_eval/tasks/logiqa2/README.md |
sha256=BJA7HgfRCSPs51iYrFl9rQzMKjoVDqaIDtCDAh5yk4g
|
2244 |
lm_eval/tasks/logiqa2/logieval.yaml |
sha256=bW1d_6Hqvc8M76mQBUYmsXc1Lk-rYTAa1-FDElOWIkc
|
1382 |
lm_eval/tasks/logiqa2/logiqa2.yaml |
sha256=0jlenXfClywd_ulejkk3-HPOE118TufgzsPGcK6r6Dc
|
512 |
lm_eval/tasks/logiqa2/utils_logiqa2.py |
sha256=CtI75WahPZvORkIad_srFGSZ6bUnGlZf_6sYHkAP90M
|
875 |
lm_eval/tasks/mathqa/README.md |
sha256=VmhPmoYwpKTfeUVDnkdHbj0zx2OtY7y7AI-cJrXEOhQ
|
1907 |
lm_eval/tasks/mathqa/mathqa.yaml |
sha256=dKJMHoZxEGdeJeCMQF9o_DBL9fokJkXp1jlVrQqHDro
|
578 |
lm_eval/tasks/mathqa/utils.py |
sha256=NFqieHDv0UX5cEVmMmIu_GF7KZpNAKvJRZJC0saW00I
|
178 |
lm_eval/tasks/mc_taco/README.md |
sha256=OEUcQofUlqsm-3CLKht9u-V0wXAldd7uPWBjmQjFTSg
|
2052 |
lm_eval/tasks/mc_taco/default.yaml |
sha256=A58bI314XcNdpoKxXxxFhrPlUV-U7pKrPeJfWYOSw_4
|
399 |
lm_eval/tasks/medmcqa/medmcqa.yaml |
sha256=NVrcOA7j28YpYlkP98Bx47HcCZR9vJb_5qMxhknQDaA
|
462 |
lm_eval/tasks/medmcqa/utils_medmcqa.py |
sha256=ucvjPVG5ViS5MXyrj_uRezLBeKqhAP2c5KrAqcRnR5s
|
580 |
lm_eval/tasks/medqa/medqa.yaml |
sha256=M5Q98uefbZaiaF4UaAouR5qkxvL8RK-g7wrlnFfHwwI
|
458 |
lm_eval/tasks/medqa/preprocess_medqa.py |
sha256=Bq3G71vaMln-VHNV5rBkylfGdLUC-sdJ0KDMyP7pF4c
|
362 |
lm_eval/tasks/mgsm/README.md |
sha256=zSmVOkdo78p4Oj4Ui4skfwzYyLqPnE3H4DiS7qMF4Ac
|
3504 |
lm_eval/tasks/mgsm/gen_yaml.sh |
sha256=F0Noarmg-NlAgWhA-_nZKA97UDSoDyrHARQDgmPG4bY
|
207 |
lm_eval/tasks/mgsm/utils.py |
sha256=L4YekOiIl-f5DBtbZu0Ol-cMRX7iPtDiKRzZS8sYhW0
|
8448 |
lm_eval/tasks/mgsm/direct/direct_yaml |
sha256=OnD6bl8mXleMdZ3gZCnJmoyOZWfLeWr9g4wkaMr6PJU
|
907 |
lm_eval/tasks/mgsm/direct/mgsm_direct_bn.yaml |
sha256=pOsz6TlTy-XtEfSex2p2oBbg9zAcfV4C_uEupiVq-PU
|
420 |
lm_eval/tasks/mgsm/direct/mgsm_direct_de.yaml |
sha256=7b0gimqBcMSJD4FpYQ7DULnrBhU29wa7xUaClZWBd-w
|
396 |
lm_eval/tasks/mgsm/direct/mgsm_direct_en.yaml |
sha256=MNyt8SYS3AuehdzrJIOoAlKI-HtaxBshsa0DQHQqdBI
|
400 |
lm_eval/tasks/mgsm/direct/mgsm_direct_es.yaml |
sha256=QdnPgAUHjzYMj3c9-zZ5wclXU-LgxUyXJkMYrvZ7zpE
|
406 |
lm_eval/tasks/mgsm/direct/mgsm_direct_fr.yaml |
sha256=q4QI4JM0S9dihzKzMEw7WbVxVjgSUj7D7PjLz8Vvtw0
|
408 |
lm_eval/tasks/mgsm/direct/mgsm_direct_ja.yaml |
sha256=Pr8BXNyxBHcw8nAFTJVfQYhrLRGZ8gzbpeOQ-O1MHZU
|
396 |
lm_eval/tasks/mgsm/direct/mgsm_direct_ru.yaml |
sha256=RI2otfyZ41_-_3qBGklRf2LwnWa7mVcTlsjv9FFHopc
|
408 |
lm_eval/tasks/mgsm/direct/mgsm_direct_sw.yaml |
sha256=YaNqXO4GSP0FvOk6QxtqmR8RnuBGkK6XZzvrEYwAbas
|
394 |
lm_eval/tasks/mgsm/direct/mgsm_direct_te.yaml |
sha256=uZaP1zvNvNDv3BL8HYI3_tMTc94Qp3svYSr7YvpTxkc
|
420 |
lm_eval/tasks/mgsm/direct/mgsm_direct_th.yaml |
sha256=Vi2pgql8xdUPUA6vmWhTRbZC1qXZ6FQaLGqaaBqHNLg
|
414 |
lm_eval/tasks/mgsm/direct/mgsm_direct_zh.yaml |
sha256=j1iP6Lhg35p33YVurNKzywEGPAQAength7PfOf8om7Q
|
395 |
lm_eval/tasks/mgsm/en_cot/cot_yaml |
sha256=MPzIhexcshgt7BWjM8WoIa9hoa8--GFuK1Y26N52xjw
|
959 |
lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_bn.yaml |
sha256=RLNq0J9egvNGucI7S0lepGfVkKZ0PccOT-Y2gB_nLZc
|
443 |
lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_de.yaml |
sha256=wZMVo5gY_By2AmuLNvvp3nLMc90dEMwTWdqRLtIUUs0
|
417 |
lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_en.yaml |
sha256=qIJJMQIxjNO2DDRJNbL5wbmaJSf2clh5QWjQ8Yc-liA
|
423 |
lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_es.yaml |
sha256=kW7OS5He2TQe-h24NMCRzuMj5T96d2TQ99gT_wx44gE
|
423 |
lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_fr.yaml |
sha256=80r4YBpMICuwMpcl9HvCU7raWmNPuSTzbHG55EC7Ybo
|
425 |
lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_ja.yaml |
sha256=WqBqT1giFlul7YGX2Ulns2G7geHogFE_Cd14Q6B_aek
|
419 |
lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_ru.yaml |
sha256=44uXpmQVAzHlFaJb_o8kDZEYeUe1H6fR60rwMj45vDw
|
431 |
lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_sw.yaml |
sha256=XT4taMtUJaVvfZit-THwafuela2MRzcSaziKEiC2Tzg
|
417 |
lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_te.yaml |
sha256=69AiswgkGTDii0MPpttAugO1lYBSWa9mF27z4AbQxDQ
|
443 |
lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_th.yaml |
sha256=oluyGodzqaJoUZ0KIW6cTjzz5HhIu6UlJNWGHZktg4U
|
437 |
lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_zh.yaml |
sha256=ogkgPoCBad60k99oN-tZjZwpPAF15lQxIit-byWWS8M
|
418 |
lm_eval/tasks/mgsm/native_cot/cot_yaml |
sha256=7N3f3B1EK9rGjGzR7aFL6lxGhZdpdOr9MYbhQ8_N9_g
|
820 |
lm_eval/tasks/mgsm/native_cot/mgsm_native_cot_bn.yaml |
sha256=Ojpf06W7xwaIKKs3wxZEhg6wLWUq-BcvS_blLJEfuPM
|
777 |
lm_eval/tasks/mgsm/native_cot/mgsm_native_cot_de.yaml |
sha256=Ig9r8PWR-G1I3UDXXju14dr-d-ppc6PTR-mnbjc8PKk
|
730 |
lm_eval/tasks/mgsm/native_cot/mgsm_native_cot_en.yaml |
sha256=irYzHhWBvfvbmB40T3x7JXjDFFmgrIuAh5OUWtRJyfM
|
713 |
lm_eval/tasks/mgsm/native_cot/mgsm_native_cot_es.yaml |
sha256=ILp-L4ek7ulwezSqcbM0mAdi69t8hjzesYYXjX9jVus
|
719 |
lm_eval/tasks/mgsm/native_cot/mgsm_native_cot_fr.yaml |
sha256=oizhISkBp0oNb9EtrLm551Yhu_VqAal-5eKrQLUPxnQ
|
733 |
lm_eval/tasks/mgsm/native_cot/mgsm_native_cot_ja.yaml |
sha256=SGo3j7deqYpluE9WyTlsTjuQaTZFIOfQXCAvhGyJUJQ
|
729 |
lm_eval/tasks/mgsm/native_cot/mgsm_native_cot_ru.yaml |
sha256=FEzjncVVgNdvMVrew1O3QVqeiLoAH4KtLUU9n165NFA
|
748 |
lm_eval/tasks/mgsm/native_cot/mgsm_native_cot_sw.yaml |
sha256=hRxFnOJGjmAUaKfDYHG8b4Th4d1cs-OXL2uDXKuHK2A
|
709 |
lm_eval/tasks/mgsm/native_cot/mgsm_native_cot_te.yaml |
sha256=8iwm8ryLnpu9aJaeNaIq55FDkoaqnT4hs7Pk86kurK8
|
801 |
lm_eval/tasks/mgsm/native_cot/mgsm_native_cot_th.yaml |
sha256=faWI8Txy2nzvf9f7KbRIVWBllGN-GUN0YYnSC8rTfd8
|
796 |
lm_eval/tasks/mgsm/native_cot/mgsm_native_cot_zh.yaml |
sha256=WHJu47tsvPWUFNnKvALp4nTmGTg0U2oRsJKnzO-K67U
|
693 |
lm_eval/tasks/minerva_math/README.md |
sha256=PW0HYE2EYL424FRKQSGB28pBoYPs3o2S-f11QsAwx4s
|
3043 |
lm_eval/tasks/minerva_math/minerva_math_algebra.yaml |
sha256=W2rMOYRcOpxvMDmjavOrvppq0-ggsEzKkwEt6xNdnUA
|
614 |
lm_eval/tasks/minerva_math/minerva_math_counting_and_prob.yaml |
sha256=jjxGjPVtnUiudvSkOVlfA_A6oCSUBM2USRJAgQW0HH8
|
111 |
lm_eval/tasks/minerva_math/minerva_math_geometry.yaml |
sha256=XiPoBuvqoAc_1FtATee1GyYcMAC8ClYOKWa04nrcrHQ
|
86 |
lm_eval/tasks/minerva_math/minerva_math_intermediate_algebra.yaml |
sha256=Irfq2-W-AiImEH0PoT2ZdoVg_y-sQOWqNfOimVovvkE
|
110 |
lm_eval/tasks/minerva_math/minerva_math_num_theory.yaml |
sha256=IYI_lzbIQ2BbcPWXrS24nulnlg93CJjlwUfV8M7IkTE
|
93 |
lm_eval/tasks/minerva_math/minerva_math_prealgebra.yaml |
sha256=va30pN9E3JV6nmLY6lUXxhH_nkm6ijSDnAiw6wdrDnk
|
90 |
lm_eval/tasks/minerva_math/minerva_math_precalc.yaml |
sha256=6PZ7DSqtq_gn2rPKIo10hw6JMJOanIxuiWu5uZCc0JM
|
88 |
lm_eval/tasks/minerva_math/utils.py |
sha256=E9ssO6UTf5qv8Djhe33z_6EAupzKMXEqJOBcmTuxJ3E
|
8710 |
lm_eval/tasks/mmlu/_generate_configs.py |
sha256=Kr5tsdroLZywReqByQ30VmueyBfJrlW9nQmU5VhRzbo
|
5304 |
lm_eval/tasks/mmlu/default/_default_template_yaml |
sha256=IuRNq62_j9djPH4XUzIp1C93mh-xRpMaqzr2GgwthAM
|
470 |
lm_eval/tasks/mmlu/default/_mmlu.yaml |
sha256=opYhS9c-LnKCQ0Uh8sMa7Z4gmoifQ3vlCeygR4ftGG0
|
92 |
lm_eval/tasks/mmlu/default/mmlu_abstract_algebra.yaml |
sha256=gXc19CgltUo07syBqIE32CnTjvsYCeVeWRG-KX1Fsz4
|
288 |
lm_eval/tasks/mmlu/default/mmlu_anatomy.yaml |
sha256=6GsRm5WgJy3WtuGZpR-rsTdpfO3uWaBjg2jqg3peTjA
|
251 |
lm_eval/tasks/mmlu/default/mmlu_astronomy.yaml |
sha256=BKfcrmOQeIcmo9WfGbvm79C3W3rpmYlH2WXfCwMd41c
|
259 |
lm_eval/tasks/mmlu/default/mmlu_business_ethics.yaml |
sha256=adoNOrbflZ-pgvnL4k4_2SeQwSDoGVEpR6sD3wOAabE
|
286 |
lm_eval/tasks/mmlu/default/mmlu_clinical_knowledge.yaml |
sha256=rtKNL_LHXj5ImTUYMuFTPsKbJvGaPHbxSh_EQRkn6TQ
|
298 |
lm_eval/tasks/mmlu/default/mmlu_college_biology.yaml |
sha256=tgJqKwkOinOadHJGIvA3fowTImsm5CesuHqNqfyuLL8
|
284 |
lm_eval/tasks/mmlu/default/mmlu_college_chemistry.yaml |
sha256=6-5alIH2bG-I5A1ToEEMPjNz8-uxq-WmOkHWVO84TFI
|
292 |
lm_eval/tasks/mmlu/default/mmlu_college_computer_science.yaml |
sha256=JdXWQW9JAOtR97ctqNpKM2yX2rl-_eoK1ozYBSqtlpo
|
320 |
lm_eval/tasks/mmlu/default/mmlu_college_mathematics.yaml |
sha256=p5Siknwp9HiAOfl2gazwbn65I5n82yj116ISRB6PFN8
|
300 |
lm_eval/tasks/mmlu/default/mmlu_college_medicine.yaml |
sha256=jhM79qmFR020H4fzazq5mEfxRsThQyMbEr9iEC7AiUc
|
290 |
lm_eval/tasks/mmlu/default/mmlu_college_physics.yaml |
sha256=Nm8Bjy5g3sh6PGJpOHj13ReRwGRra6zbTDR9Mw-T2BQ
|
284 |
lm_eval/tasks/mmlu/default/mmlu_computer_security.yaml |
sha256=WmKRHbFMgdTCeGFNdrIHfbTQO-OoUrFRR41jbeCMoFY
|
292 |
lm_eval/tasks/mmlu/default/mmlu_conceptual_physics.yaml |
sha256=nVXaOJWl0Jv0FFAxzDghiiGncQ9if4AdBdoeZ8vX4n8
|
296 |
lm_eval/tasks/mmlu/default/mmlu_econometrics.yaml |
sha256=kll9ZFihynXeCHB-IRvsB3jLGJZ7c7-H5fxBiGRx9Q0
|
293 |
lm_eval/tasks/mmlu/default/mmlu_electrical_engineering.yaml |
sha256=0-7WBd2UWT0wuK8FRdzFNb8Yk6519Ul2mHfho6Wc2sQ
|
312 |
lm_eval/tasks/mmlu/default/mmlu_elementary_mathematics.yaml |
sha256=c2lWRYGVEmrQO1_JbGUa9eau3SKh-7q59IqDkAd3GGo
|
312 |
lm_eval/tasks/mmlu/default/mmlu_formal_logic.yaml |
sha256=t13drARz0b49xLGotrVSkDR_GH3kHzqPT2jJ-kG_D4A
|
284 |
lm_eval/tasks/mmlu/default/mmlu_global_facts.yaml |
sha256=kK1l52luxT-Ib56eZddHw_9EubcuAEJU9zR239fvBOE
|
274 |
lm_eval/tasks/mmlu/default/mmlu_high_school_biology.yaml |
sha256=adPbtPDslRd6AuVjadFeKstNg4ngLYCj7uq7s3xvph0
|
300 |
lm_eval/tasks/mmlu/default/mmlu_high_school_chemistry.yaml |
sha256=FjJZ2bcdxHpwozh7nEW4bW1KZgwDg7sqG9lhi0Abd1U
|
308 |
lm_eval/tasks/mmlu/default/mmlu_high_school_computer_science.yaml |
sha256=FvmaIXBRroEyw8WU1vSA4BDWat9toiJmHvvXaqwUus8
|
336 |
lm_eval/tasks/mmlu/default/mmlu_high_school_european_history.yaml |
sha256=vgNEM9KbKZyE0HZiy7cWskYtU5Ox6D7WRNxAJNgiGy0
|
348 |
lm_eval/tasks/mmlu/default/mmlu_high_school_geography.yaml |
sha256=aPXicSifSye9Ut2wnerc-zboiSzOjYkm4gVhhiLocVI
|
330 |
lm_eval/tasks/mmlu/default/mmlu_high_school_government_and_politics.yaml |
sha256=iKZO88iRCTaEnOb1J4uuE2BICx9TyhRuBWXhttl_0nM
|
386 |
lm_eval/tasks/mmlu/default/mmlu_high_school_macroeconomics.yaml |
sha256=1LRd0Lb_U-ublgdMBoOo4mhC8srAdY-NBHW9nH68boM
|
350 |
lm_eval/tasks/mmlu/default/mmlu_high_school_mathematics.yaml |
sha256=ATgCLKhZn7UoNl2nDaxdBgD1y8k50b0I21WEmlB-cps
|
316 |
lm_eval/tasks/mmlu/default/mmlu_high_school_microeconomics.yaml |
sha256=cv2UrjcQpQe2rvtsMIDge-Ms59PjgPWGlznXJGlHwAc
|
350 |
lm_eval/tasks/mmlu/default/mmlu_high_school_physics.yaml |
sha256=sWPVelphJpPM9RWCoVTKiVNWuhdWPegLZZbGa80LDIE
|
300 |
lm_eval/tasks/mmlu/default/mmlu_high_school_psychology.yaml |
sha256=Q1BJGN6k_9bGk51FNgbMWfymVrcS9s0caTU7N3T5lMs
|
334 |
lm_eval/tasks/mmlu/default/mmlu_high_school_statistics.yaml |
sha256=FiVyJuipuzYEECJSWcm6HbCc2PJ3HS6sXO4bnO05bi8
|
312 |
lm_eval/tasks/mmlu/default/mmlu_high_school_us_history.yaml |
sha256=DFJcWsmxtV9HeDyFvPYCSxCAWywNSfXM5-vc1j6OOAs
|
324 |
lm_eval/tasks/mmlu/default/mmlu_high_school_world_history.yaml |
sha256=B4axVHntppczWuGGL6gQBhGgdukhqTX2Ga0kwH7wEs4
|
336 |
lm_eval/tasks/mmlu/default/mmlu_human_aging.yaml |
sha256=it0LUShyuG1o-jr-kdyhtOOWYFx20MuuVOCe9lhf2Hc
|
270 |
lm_eval/tasks/mmlu/default/mmlu_human_sexuality.yaml |
sha256=X-THNfrS2YzRDlv-2Ud7Zf8CowaIEmu3OxouK37DmkA
|
306 |
lm_eval/tasks/mmlu/default/mmlu_international_law.yaml |
sha256=_FSWdGN6SvDlaT88kQsGtj_7kuqzvvkGVLlTiPBW_lA
|
304 |
lm_eval/tasks/mmlu/default/mmlu_jurisprudence.yaml |
sha256=jFnFoZLKI6ANTvvH9cOCcM4DGJFtw3Xp2Cmd-wcMdxI
|
287 |
lm_eval/tasks/mmlu/default/mmlu_logical_fallacies.yaml |
sha256=t9cxs8hSQD7hLx8n_62Wsn44VCEasO83xzFF4MpJDOQ
|
304 |
lm_eval/tasks/mmlu/default/mmlu_machine_learning.yaml |
sha256=YzBbWm_EF49uRk_BjL-9DzgCeY7kvXWsPQRjwVAyDes
|
288 |
lm_eval/tasks/mmlu/default/mmlu_management.yaml |
sha256=43IDk6OZypE0VFm-2ZwkuVv3Arf6NzGgjdQNIeT0X3g
|
265 |
lm_eval/tasks/mmlu/default/mmlu_marketing.yaml |
sha256=32eH-SwcdzdbZMoiAI9GoUx_fRChoakuUrMvXZJ5haY
|
261 |
lm_eval/tasks/mmlu/default/mmlu_medical_genetics.yaml |
sha256=cBYQrC5cGxR8wtUhB7rfahBNpoZJ_xcIwvQrijxNQNY
|
290 |
lm_eval/tasks/mmlu/default/mmlu_miscellaneous.yaml |
sha256=Oo5UxK1to8hY2jdB83n9wTJnVJrAHNkIp2_n9wblioI
|
277 |
lm_eval/tasks/mmlu/default/mmlu_moral_disputes.yaml |
sha256=59Zv6o6ZAvIWM_NCdq6KTFo9-VNa9KocwHs-hPUNTOI
|
292 |
lm_eval/tasks/mmlu/default/mmlu_moral_scenarios.yaml |
sha256=JT2l_KMkk5g9tacrCPk2U67TSFU7bwxH72vtO94ELKA
|
296 |
lm_eval/tasks/mmlu/default/mmlu_nutrition.yaml |
sha256=gqbILA55_fbtqBzcjU9gCqPCdIAh6h-ztArvHRA5NtM
|
261 |
lm_eval/tasks/mmlu/default/mmlu_philosophy.yaml |
sha256=NWMWKylcBfEkIumwg6eRaJgKVqBpQ6blOMbyIvgn77w
|
275 |
lm_eval/tasks/mmlu/default/mmlu_prehistory.yaml |
sha256=g9KiT4SwWrzRlHSMMIEYSsTarhFNsuGyTFhNjd3BMrU
|
275 |
lm_eval/tasks/mmlu/default/mmlu_professional_accounting.yaml |
sha256=9lcnaGxlY3IgmAPAhvvXjrMEHmYUROCVPI8jsrpOP0o
|
318 |
lm_eval/tasks/mmlu/default/mmlu_professional_law.yaml |
sha256=fHnaxASjlkxSWtAuKVfr0sI-6AEm83vN2aEZ2-HShT0
|
300 |
lm_eval/tasks/mmlu/default/mmlu_professional_medicine.yaml |
sha256=e-JGsjNQ7vcJxMeW1IgYSE1midCUGhD87cs1FVT7dMs
|
310 |
lm_eval/tasks/mmlu/default/mmlu_professional_psychology.yaml |
sha256=VrF-mtFHcGOUBOUseGjvUoKgB6uXRi8y3g98xG5SrBA
|
338 |
lm_eval/tasks/mmlu/default/mmlu_public_relations.yaml |
sha256=LPamTE3llnQCW25KM8TDzHrkOTIFBQzoOzO5E1I22qA
|
310 |
lm_eval/tasks/mmlu/default/mmlu_security_studies.yaml |
sha256=zW3wJTXMpc9WoQpOy6WLZc7uVoq7MUkAN6CDQqg505s
|
310 |
lm_eval/tasks/mmlu/default/mmlu_sociology.yaml |
sha256=E8v0YKlGUe-gLWjmxgKRAZqrjKQ2NKFENw25wpdIQdE
|
281 |
lm_eval/tasks/mmlu/default/mmlu_us_foreign_policy.yaml |
sha256=jOXbTYPJayVwvMeIqJdRWxvH3DnwwyBKsUoUzgcOKC4
|
314 |
lm_eval/tasks/mmlu/default/mmlu_virology.yaml |
sha256=dQW5H1xYslCMlYJ2im-8x5nRs7zudCRW1QxaoCts1xc
|
257 |
lm_eval/tasks/mmlu/default/mmlu_world_religions.yaml |
sha256=sozIm5GYbF1z6K3M-DZZuYeIuXoGlfCLdU1dG-g0mi4
|
296 |
lm_eval/tasks/mmlu/flan_cot_fewshot/_cot_prompts.json |
sha256=CBR4SFsdT1HgEwXhkRPw46Ro8tx4dZY4aZjiKal7CWw
|
218396 |
lm_eval/tasks/mmlu/flan_cot_fewshot/_mmlu.yaml |
sha256=AmkVICAMmJEIwTs0ULG6QxkUQBTEwYvcCVkzXsNeCmI
|
177 |
lm_eval/tasks/mmlu/flan_cot_fewshot/_mmlu_flan_cot_fewshot_template_yaml |
sha256=huyP85w531dmWgk8ZtLO5Qz-htcX8bb-eoPSi2qOjMY
|
783 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_abstract_algebra.yaml |
sha256=i9OND-3ugS3Y-V4tnmPf7-ncWotcKjsHYGP7ioRSJ6c
|
3283 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_anatomy.yaml |
sha256=Qo9gChWbJVrTxj3AfGs2hyblIzq2elL-dHEqwAi8eEg
|
4704 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_astronomy.yaml |
sha256=eANA6hJA4OXmz41-VRnmVMvLtykjTyARmOj-D7c27po
|
4526 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_business_ethics.yaml |
sha256=UV3kWpjIZDuDDspPxS10FkpU3yX1j7hnTs7pSx8KG3g
|
4650 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_clinical_knowledge.yaml |
sha256=sJOKZucur5KXLVV9K7yyR_BV17UMREjJSr8NnpoGhdA
|
2790 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_college_biology.yaml |
sha256=d51ullMuaVek_b-t1bjYGC47-eZOhdiMH49VyYUgN1s
|
5018 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_college_chemistry.yaml |
sha256=27rIMLE23N_oDWBYj9RirFTRTMUTi5fsZymf9jQAlW8
|
3079 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_college_computer_science.yaml |
sha256=p_n0hfEo3ejxWONc75v4e7TW6uWSj8GdmjFKrU1MA7U
|
6656 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_college_mathematics.yaml |
sha256=L1Vny2jzbIUrPwSKtu7aoWblT3TdEpQMNGc95t11pAY
|
4094 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_college_medicine.yaml |
sha256=j7JDm6S1iGSdJm23VKm-E2w3QCLKGQALHJAelKP0mLs
|
4342 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_college_physics.yaml |
sha256=9h396DDHB5_EzyszrDALEONNDM_0ZE3-ia8VVwiLJtk
|
3572 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_computer_security.yaml |
sha256=XkeIKlEyhMc5uMoZD6EAt-cTychzTWhUxaWuhPAwCzI
|
2893 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_conceptual_physics.yaml |
sha256=cl8R6amav2M2j-4CWqgt268r-8HFeLSKqrX_rRQGLdE
|
2661 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_econometrics.yaml |
sha256=j-1GWZUEmojmUmm9X4G2EBhTlsAkNsPEOTnJrZVTGsI
|
5253 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_electrical_engineering.yaml |
sha256=E7cseWfTbQLkMtPTB7AQ_WvCXQDnHC44zm87VSE7w9k
|
2742 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_elementary_mathematics.yaml |
sha256=tnaF2xDuokHYuHbq-Itr7LZfHWTWwcWyUaxVs4R45mk
|
3306 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_formal_logic.yaml |
sha256=4gcR3KuFVDtbPIP1uoZlj1eSo2zB4m_3yyVxUBoQOYA
|
4520 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_global_facts.yaml |
sha256=UDEgUdufjlweJbpAKrtWga6YTUTwhyFWVpssSzx-WLc
|
2700 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_biology.yaml |
sha256=n1tjopDx2rKy6fc1mk7o8M6GIUKQxvh5cNs-ymhKpZs
|
4496 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_chemistry.yaml |
sha256=w5DTrVYG5H3uw_aSly_QF71DuKEP31NSJ1Bgkp1Sdbo
|
4148 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_computer_science.yaml |
sha256=QHhgSa1jU2lFzeuIByKS0zY2zwYnSJr09SOdedEQFcE
|
5867 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_european_history.yaml |
sha256=JCOiZZ8A3R81eSO8wOu1Xa9dqAZ2xLUc8zX_o74qRKE
|
14453 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_geography.yaml |
sha256=mNwpohT8ysledOx5nQWztnm7fnd7EuwqzSn9IYbKeXw
|
3074 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_government_and_politics.yaml |
sha256=KmQClLUPJiiuJ0REPgVrykpdngyCUhq094-7AMQreSY
|
3557 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_macroeconomics.yaml |
sha256=ddlRI10f3lV80g6ZlxMZb5puwML1lJ87ja0nTjhlyBs
|
3045 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_mathematics.yaml |
sha256=PWJv_mapsiyyE40cK32Ky0B4_mTEIbZL_UiybJS5ArE
|
3007 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_microeconomics.yaml |
sha256=MeRkFGxYyNsxo0bKb3liJApfl0yxWntiy7A1u61LSnQ
|
3238 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_physics.yaml |
sha256=U0Dq4ByrLSK09Mrv1QPDseQgufQuBDXKCTb0xVoV1UI
|
3154 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_psychology.yaml |
sha256=jQsUp94o1WYgwcx4I_g_DadIutm-LkhiPpZtt-rS4iE
|
3988 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_statistics.yaml |
sha256=QsZh-YF0NYPmBkl7K5UiASr-oGA8vcxwojigffPo4-k
|
4777 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_us_history.yaml |
sha256=71jIaBPgUWbEwQTWTIVZGSdqV2s7i-dcuysorCCaNkY
|
11372 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_high_school_world_history.yaml |
sha256=VS64z2RHKW3FCOMEMdKEt9AfHvInOAlqoKqSVeiN0Pc
|
6933 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_human_aging.yaml |
sha256=2FbGMnhDfiEcY1DGU3YdiEZJhUzkCCE1Ss2G3xr5z-I
|
2181 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_human_sexuality.yaml |
sha256=k44qoXctF1kx3tnQIVIglwrh8FXGx3ea9fh55M83-ho
|
2713 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_international_law.yaml |
sha256=VtXMlXDrcwba0qpiBcYfeGDAnl0ke3Q6CyLeg4b-7SY
|
4508 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_jurisprudence.yaml |
sha256=W8VmpIzbq26j-LpqLW3_5nf2-yMqZuUKawuFYvrpPQc
|
3668 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_logical_fallacies.yaml |
sha256=E5rNbNatNV3YdLgFlEsO-0K8713vDJdj3iUjpExBa-o
|
3644 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_machine_learning.yaml |
sha256=w0Pem7z84NEyh749-vS0TWbClitKpQE9U3LHll7eFA4
|
4929 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_management.yaml |
sha256=FAs2Ey3p6MSZWYmdXl162kBz4051aXKMpXnGnz4FUyM
|
2639 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_marketing.yaml |
sha256=VGC_C3MYeQ4rhS177ax0Az3R2RB6wGojKk7N-5HIhO0
|
3271 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_medical_genetics.yaml |
sha256=hqrgrLaXp7ycrI6MnmkyLrBWdqKFFNC18v9NJBg7f7U
|
2972 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_miscellaneous.yaml |
sha256=0qY0ZYGHsBhS3wxX1rWYfgavSmJVhzdRfESKt6MaqPs
|
2169 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_moral_disputes.yaml |
sha256=eEA8AeWOVqM1sX_mQFbm_m7U6WwxFkRbUA-IR4y1YhQ
|
4018 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_moral_scenarios.yaml |
sha256=Jd8TfRoge9XJM6lstObDTYasbtqW1qsG9_HaMAW7plM
|
3601 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_nutrition.yaml |
sha256=bh0rJv8UK_I0WNvBUutB80OC9VxI4V1a3TWcRsCzn_o
|
3897 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_philosophy.yaml |
sha256=jLJUfPBEc8JWX0kODtlUogZ_p2L7yDywraMzxCjGcHo
|
2410 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_prehistory.yaml |
sha256=D9M14jFNL0n5R7pV5AmnZQlf_kcOg0wqtvPqTXCttN8
|
3441 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_professional_accounting.yaml |
sha256=MMHhBZeQ4q9rZqjSSJhxhYlyO4iAJm25e0rS2RQsizQ
|
3922 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_professional_law.yaml |
sha256=xPAbeM4zgXpAUmCaTmNpkUpOmBxAWEzltXH-nO_v_ks
|
8947 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_professional_medicine.yaml |
sha256=U0jY2h2BzfNffVJU0WDOb95vz9ZtKAi6X9ciqnMUTHk
|
5853 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_professional_psychology.yaml |
sha256=-p6H2y6oRwX0R3Xvyot8ZO1ehiEcDNsBNW5NMW_FHyI
|
3990 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_public_relations.yaml |
sha256=cHsTH5yEFAg5mqZ40Wvf9-4CIfM7jO_xTKCmB1qrw1k
|
3143 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_security_studies.yaml |
sha256=iyiKxGAc-Kl4EnOEPWf2Dof0_ZiVYkXglcYFLFgIQKc
|
7270 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_sociology.yaml |
sha256=Kpyov2cWFfbxkApiTrixJbNwq9MzmbtOHyfqyZy7R4c
|
3460 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_us_foreign_policy.yaml |
sha256=0_Qvn6wr7CQYdsKdl-xmtuwNl8It6FTRsV_HWMf3Bas
|
3277 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_virology.yaml |
sha256=ddbifOmbeKlYQ4--WEFDSGcQQyvLwzI5T3AfYj9dQm0
|
2450 |
lm_eval/tasks/mmlu/flan_cot_fewshot/mmlu_world_religions.yaml |
sha256=V-7NOjqQMEmf273O4_Pi1ktOsXCExEVzi9Ma1kwpfmE
|
2130 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/_mmlu.yaml |
sha256=_hjjoCQTWOlz_f-ldxYlK9RWpKnbHjOn8KlwNjLhatg
|
182 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/_mmlu_flan_cot_zeroshot_template_yaml |
sha256=qeSmlVL3_VQo4sQJOdQ835gYpGJxMz_yhxCNutUY6VU
|
1158 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_abstract_algebra.yaml |
sha256=LvRnHFrHw_6n24MAe5BOixVezyZ0ME581aHG7yDSn7E
|
284 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_anatomy.yaml |
sha256=no8v8ThFcdjNjCqBkFZIR1--Nd4ZiCZoa-L825u2rLM
|
256 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_astronomy.yaml |
sha256=hN2iIJ1PmHloJCm9C2dAQRAc6XqBwxUGivaiUaq6-kY
|
262 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_business_ethics.yaml |
sha256=XWfFMMiwK8hhSNKkuZs_JSBeIHkw4evEM02LIKhAuTo
|
282 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_clinical_knowledge.yaml |
sha256=e5KerpASf1oRCJLvWqvGHJf5ZW04jrqmA8yzpY4RMt8
|
291 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_college_biology.yaml |
sha256=v2ZXXWAltVye0sdYDsi6vE70kuW_3b9wsyZ75UuuZsc
|
281 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_college_chemistry.yaml |
sha256=8X67aXlo-viUOq4ZVbWrgEo9ntqi0lNWHqtMpDr-0AA
|
287 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_college_computer_science.yaml |
sha256=5h-Qt7ndBtlJG5ZfSbY6caGMCbQrsyWc-MVPxncDzuU
|
308 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_college_mathematics.yaml |
sha256=Rf_ZzZUxQ0oOct1pg1TXi_dsRUZpU7WkcmQviWHoXi0
|
293 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_college_medicine.yaml |
sha256=fJ--DO7NIxkwa2ica1QbsdlIn12616p8PqE8EauaUlA
|
285 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_college_physics.yaml |
sha256=9bbIfyxuil3UIY-jG9-Fvf3ywmwdMo0titOe-M-Dt6c
|
281 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_computer_security.yaml |
sha256=nXPVQH1xVJtZt6_2FPiC626QoXGaRY01f2AymmhzQ2Y
|
287 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_conceptual_physics.yaml |
sha256=WrfEys3YyQF6s8otgNvTjD16LDKZk9BhvyW525ZIj84
|
290 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_econometrics.yaml |
sha256=ygr0_Jh5OWxyixszzr35NEie0PudCTADqRpjpMDThrA
|
282 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_electrical_engineering.yaml |
sha256=hciTVSP3ckCk3RwC0PsB-J8Ve4wHyj2xusA8kEPzjy4
|
302 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_elementary_mathematics.yaml |
sha256=9DH852QpJPBc8YgxNvvCnnq5nwTDVNcLqU4BRxrSiBA
|
302 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_formal_logic.yaml |
sha256=58WVxXMCkazivwYFoZQ1Yb84Z991OiU-vQI4sbtJUXA
|
278 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_global_facts.yaml |
sha256=RM_pb6sRZmx6iVcFXAiYbYHn3gfXAeAvodBwVKd25zc
|
273 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_biology.yaml |
sha256=0DnTWb-KtU2zFX-QFM6s7XKKouwT2nfyK4fyS_tioyU
|
293 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_chemistry.yaml |
sha256=heKA8_U1wj5P2q5roXMqwAWiRa9v-sbZaTbe-hyP1cA
|
299 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_computer_science.yaml |
sha256=DiOmq-I8_p3DVOUhtFgFjijtG0-J_MRa8F5-cIMeOXQ
|
320 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_european_history.yaml |
sha256=3OffoLG-gh2JjKcKWntBWFEjc5lrSgOw-ZFwtJPgFJw
|
326 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_geography.yaml |
sha256=Fd0I-5A7mltjnIF0Md7fQLY6YyVOoonsdc4txxNNZsI
|
310 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_government_and_politics.yaml |
sha256=uimHeblbJFYgaaah5fsWTQl3_KFZdvDTGmcdviqD97E
|
352 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_macroeconomics.yaml |
sha256=3dhl58MUaawpSYJFfvelXVpKLcVBbDE9MpMvAT2peKY
|
325 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_mathematics.yaml |
sha256=aRQK4pwDayZ6xNkOEqytHjJwxyI2nsY_9QOW_FAL6ok
|
305 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_microeconomics.yaml |
sha256=ZKQPAubYaV9HfGiJFvENELqyTLuFvG975eBGmn5USlA
|
325 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_physics.yaml |
sha256=7u1ma2j7itc6SdgSwlotC4Qs3oovbmQMCldOuUWtwGs
|
293 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_psychology.yaml |
sha256=cMvGDf1fcB4btH_AlHeZ727FWVPB8WIvUDi9jP7gNiM
|
313 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_statistics.yaml |
sha256=iolnReJzl_eeTS3iDnhz3NiEn_GNeNW9_hu6Ba_CRA8
|
302 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_us_history.yaml |
sha256=TYckw3h7JfcP5tq0X_k58pyk3ph07f69WyeAqRxmcGQ
|
308 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_high_school_world_history.yaml |
sha256=z6JcOncyLPzV2cW9Y1kzICK9I8c2V2KGa5iPgYi5XJ0
|
317 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_human_aging.yaml |
sha256=Rq1oksitbFhGyrgN0H7fHTW_PGwKraphFEE0-ZDzW2o
|
270 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_human_sexuality.yaml |
sha256=XlLHhllCiErpFvV8u4_erECYPiU_sf49IZ_q2We1Ulo
|
292 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_international_law.yaml |
sha256=47Y_4EVkuA8PYyLDZwb7PcDgAoVjJhxQGV6uH6SksB8
|
293 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_jurisprudence.yaml |
sha256=62o2fgoKLVpHP5_L9l8dgGSvKKvjydg5amyUuPSYDSk
|
280 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_logical_fallacies.yaml |
sha256=UmcituDQMs9_WgxnQl5TF8zjzqG19RZylKe8yH7AioA
|
293 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_machine_learning.yaml |
sha256=GEzsjkMBTPDAwwfOocJ1fJ222Li9l2Ly_SwuKcaKJEU
|
284 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_management.yaml |
sha256=DvBGob0qxl8O_Wgpmy5EdFMhgjuG8lS-Oswbbe22-Yc
|
266 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_marketing.yaml |
sha256=iZSiPqmRAwN-sQk7rGYiXxQb3_-AzRtZWnYhR8mKMGI
|
263 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_medical_genetics.yaml |
sha256=swY2eauXtpqf2acrcAPRBsuS3wUm8vrDezRhuvAeEE4
|
285 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_miscellaneous.yaml |
sha256=ob2TmbBUTu7eiaqKVvsdPgm0QwF9TzAsVvVHzuO3WcM
|
275 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_moral_disputes.yaml |
sha256=N64E_YN5-Es-RkaLF83OwxE02nLP_JqOtBNdhL6BHKs
|
284 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_moral_scenarios.yaml |
sha256=V4-YewELczcHXVhShtQJZTucYeeS9vVMcHR3UMd8RyI
|
287 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_nutrition.yaml |
sha256=uEOLbPIzTJ8XBGUhnTeqU-5OYBkGsxLtVM_cS4dZjvk
|
263 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_philosophy.yaml |
sha256=IFUR_93hbXyYXAzQdwJoVe3e9Qwk4H0_c8z0NGII-z4
|
271 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_prehistory.yaml |
sha256=4J7DeKI8Hv6zQylMhwi8Qc8B8Fq-Caumx_1vwGsnt4c
|
271 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_professional_accounting.yaml |
sha256=2kCLdxKouQcWr6zg1uZM1PBqkFMSgeZZNzqG9DxMu8g
|
306 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_professional_law.yaml |
sha256=xbDsyiFwhZZCPM0jEkguzvSRSeq1tutZynuhlg3lgxo
|
290 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_professional_medicine.yaml |
sha256=AUI47eC1j6rc-9Zqp0GmHYLbDHg1O7GVKY8Vv4lYMXI
|
300 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_professional_psychology.yaml |
sha256=7TFjvuSpZ37wDEtdtf1NjYS6mTXuqwSSH3t1OHpydME
|
316 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_public_relations.yaml |
sha256=DAjQj-5aG3dZHCXI2Me1hnix3QlDZuS1ZuHplywmH_Q
|
295 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_security_studies.yaml |
sha256=DC__nJv6cZIgeWk7uUdIPpoIVkCDDT9dE802p8fC1XE
|
295 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_sociology.yaml |
sha256=uEopPjYfP01SXyue-UDn6Eu6XJY0giXJuNJnMW10hdc
|
273 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_us_foreign_policy.yaml |
sha256=jAEfmTK_piBJnrhjK5D1LhCTZaOjCr-3y6D6_RPtk-E
|
298 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_virology.yaml |
sha256=74_GviIJbl4HRinvOOrrMx2_LqW0prHZU1jsJVSVRfw
|
260 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/mmlu_world_religions.yaml |
sha256=DVS8P0bKnD8vBNxCMkzy6N0eWVIyQ1XpTBIA71JaELU
|
287 |
lm_eval/tasks/mmlu/flan_cot_zeroshot/utils.py |
sha256=LXwOcOnyAL_h3VRE0XzM66h2qJuB0zK1zhrqupg4jpA
|
4184 |
lm_eval/tasks/mmlu/flan_n_shot/generative/_mmlu.yaml |
sha256=rA9DgApHb_PGaMgMqEP2uU9Qoz7GWjMa8bzJgqTL9Ao
|
207 |
lm_eval/tasks/mmlu/flan_n_shot/generative/_mmlu_flan_generative_template_yaml |
sha256=Nn2vSeMCfoS6KknBimFg4c-rcX_8_1cdFYRKdY7i7gw
|
880 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_abstract_algebra.yaml |
sha256=1yvdHaM9GTcNnMaDV7pV63E6mcZv3uoS2Lgj1IqHlvE
|
292 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_anatomy.yaml |
sha256=NtroH6VqEdaJd8HiWr8a_GJ8GjMUYlsPpre0T16P-O8
|
264 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_astronomy.yaml |
sha256=i1KgW-h2hbODryP_NDY6oZ9MpGEilsP6z3W-MkXJbzs
|
270 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_business_ethics.yaml |
sha256=fSuKzPYSkEd1TmMMLSV9cnxNZTWFeYf0tvdmLZG72uk
|
290 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_clinical_knowledge.yaml |
sha256=5_FghB6ud7daF4EeflUG9UqWgLOfT49wto_Ld8E7zaY
|
299 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_college_biology.yaml |
sha256=15B08EN2JcsLE1noz0qeKS-eSwZdTN6cxLXEgohzphA
|
289 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_college_chemistry.yaml |
sha256=y3qKzzecqo1hb7-huA-XwLJHayoSJo2EvODr8FCpszI
|
295 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_college_computer_science.yaml |
sha256=VjBnBkAvbVCL1h0BgFku51ESFyDKpXt3TkfQ8kqrhps
|
316 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_college_mathematics.yaml |
sha256=AIosK7NMiKx-XSj__nr1djX0fxFBZBEkuqYgatPCyO4
|
301 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_college_medicine.yaml |
sha256=RGXU5iSNbbb8RDCH3lcg1n23cCHYJ7s97pmH5KcRcbs
|
293 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_college_physics.yaml |
sha256=cB9KDjCKPCNmojsXBbvJXP5K79hCehb2doHdcb4x8PI
|
289 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_computer_security.yaml |
sha256=z91MJa2RV1B2m5decq4nSUWAf4Zc9SM9wBcG5aFlEBY
|
295 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_conceptual_physics.yaml |
sha256=Ls4ntDkx7V3N3C3dMJ4SGHqga_UXKAufh447yw7Fjr4
|
298 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_econometrics.yaml |
sha256=wavgGn2qhGXRwgcZGFeeXaJQ5fEgjpReY2YSOUhwjVo
|
290 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_electrical_engineering.yaml |
sha256=kPiAfHTJxHyWTIDdIv_IcXdkO2bGQ_K3AyYpHXsi224
|
310 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_elementary_mathematics.yaml |
sha256=h8mXOss7r4hG3CUmE5vunwm1l2I9SJIA2fGGV7xami0
|
310 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_formal_logic.yaml |
sha256=GjvsAUaRAdnOcA-yF86D6DqNzsoocIKs-ZJ_hAtpQLc
|
286 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_global_facts.yaml |
sha256=59MQcBeGFepYvfZXcJUb9gTwnpuzzFBU_JK8vQHb-9c
|
281 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_biology.yaml |
sha256=vf9s2eai7UIFUyX5N_H_RdRPSvJoyMKp0L6zu3HsUmM
|
301 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_chemistry.yaml |
sha256=-hzx3wvYQcbJ8pLmInAPmtT8eErwFH4Zv4S4eN8icqw
|
307 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_computer_science.yaml |
sha256=A_to1N9TFCJUroTf0Mkt9uvCpS1E5wewxbYRYwGz70A
|
328 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_european_history.yaml |
sha256=FJsKuJAJLePaKKjAQXQC-uUDMmqdGiOJsSj9-QVSXD8
|
334 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_geography.yaml |
sha256=DLoXYBsTwO8lhN_0VkTVowK432A_vcDT8liAwzM2DgI
|
318 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_government_and_politics.yaml |
sha256=zkOAZRnm9OKThUjZCxecDg6nmmS5II5BQwTgsU_QLyM
|
360 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_macroeconomics.yaml |
sha256=dTW4bwdWf65fEGJGRReq-uXz_pueuPu7LF7CiJegge4
|
333 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_mathematics.yaml |
sha256=jZ52HsQ41J__WPLpdX0rJ7DsmXogBQKV3kSCw8Tt53k
|
313 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_microeconomics.yaml |
sha256=_sgnl5NyQJhHurnRCW57XL-NTeoQMnKPZ8itIwDQuWo
|
333 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_physics.yaml |
sha256=lOGCUibImDUaLkcuUxGQNlz5OCmEIyZyzP3FsfdKYRU
|
301 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_psychology.yaml |
sha256=_frgKmtOaJ8ErEIJza95nJKM5Q0R3htRecVFwilhp8s
|
321 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_statistics.yaml |
sha256=v53JtJ26tGzC95RlCw_opPG4exyOkkx_y1yjHastn8U
|
310 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_us_history.yaml |
sha256=PSIL3rSUv7ZzYFtgBFe0tUewvezZKcYPjKddnQ3YUAo
|
316 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_high_school_world_history.yaml |
sha256=qdgwmHUDV_h-6bg-3Sd-V6R-853GKuFSYdEW8oJgJ5I
|
325 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_human_aging.yaml |
sha256=ZxDBgT2TgFQF-63ngbviVbf2QLU9S80toxTvx8BdOdA
|
278 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_human_sexuality.yaml |
sha256=NcBQkkYXnmdbXD6nRMvUBPwjWhq1o-rvhQfMoGnDy78
|
300 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_international_law.yaml |
sha256=ao796oJ5QQV14NJF_SNmn4yPiaJtrEXPA0FYASqYbAk
|
301 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_jurisprudence.yaml |
sha256=p2HnBz5uURlZzBkxSJ_Tpr_Sm5-jil6-VsHKjis92sI
|
288 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_logical_fallacies.yaml |
sha256=o9gAvTyAqPRrWWCtjgSmW7ZkpqpTsfl-NSbbQB63vik
|
301 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_machine_learning.yaml |
sha256=s0f9zROAZCQmLvjzn42ilUEKlxFQQXQ6GCihZ4pxV4k
|
292 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_management.yaml |
sha256=pQ94zduNfbbPL1QIjk2gTrlPCzixwsrbfF04tKdld0U
|
274 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_marketing.yaml |
sha256=QbLanX10QvNCywzqs0kdP2hpHlQ30KZdVY6MAWMUEQI
|
271 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_medical_genetics.yaml |
sha256=6Nl5znhGU_FNHFKS231zgtCyouP4eOp6-g0bXQmff6o
|
293 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_miscellaneous.yaml |
sha256=KG80mJ7vNJ4zsHb0PDOsGcKec8ykpx4gC-o143_ptuo
|
283 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_moral_disputes.yaml |
sha256=kXbaoymvejb7oefSyWyeH3r30PephinHlpZAx3VXAac
|
292 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_moral_scenarios.yaml |
sha256=zwgvbGMMQalh1wCawRI1dCQGaF9Od8j8QhRUcPL0-9g
|
295 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_nutrition.yaml |
sha256=9dWTdoG1hszD9N0jZ5CffA3cRZemzUzp92M7eTeK_7c
|
271 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_philosophy.yaml |
sha256=RsvRfjp0ChZ-IdKeX-r2b-rZ3A5Y4iLZMQLZo76qZ5o
|
279 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_prehistory.yaml |
sha256=cM1emeZyw2J7q9KfPME9srhywKlh3jeY-zsDBlEDrA0
|
279 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_professional_accounting.yaml |
sha256=aMU1t4XwG5vwf2OTHNR9ESAe6qLrShwiyvCAvcaVDTA
|
314 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_professional_law.yaml |
sha256=JqF-iVfJDIcbmpJmbcLI_AZUmOmJ-BBZyWAXprZo-Iw
|
298 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_professional_medicine.yaml |
sha256=ONirmEFURyIxoW-_TgbHwS22GabhFQT5zEtiZ-rHFw8
|
308 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_professional_psychology.yaml |
sha256=91w04tA_ZLH3i7KTRj4X-UiPkm2Ka3fDpoxp8e26EPg
|
324 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_public_relations.yaml |
sha256=JPZD6ikfbzdqWqUGYgldmhFk3jWjK6Jf0CMV1krM00U
|
303 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_security_studies.yaml |
sha256=Plc_zyI9zels3rzux8c61ntFGEhkBgVteuGcSP7q5pc
|
303 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_sociology.yaml |
sha256=J4crNd6OLrze9gPYs8e7X2sa_UHaTlyOW_IdfCE6dVM
|
281 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_us_foreign_policy.yaml |
sha256=RiU586npxXTRbADdtzimeWVO5Tgugzx2APR1bYdrldE
|
306 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_virology.yaml |
sha256=gJjpjsnq4o29JG8Wm7S_w2rNnXfaGNeiBM9JHii-z0I
|
268 |
lm_eval/tasks/mmlu/flan_n_shot/generative/mmlu_world_religions.yaml |
sha256=9z67Jvo2ZIiC6RZljrfmHIgQbgg2bg6RmV-avL2Np7A
|
295 |
lm_eval/tasks/mmlu/flan_n_shot/generative/utils.py |
sha256=LXwOcOnyAL_h3VRE0XzM66h2qJuB0zK1zhrqupg4jpA
|
4184 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/_mmlu.yaml |
sha256=eZmG3GH5XHcg2Um0AY48VcbyNko70mvn74jyAlaVO6Q
|
222 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/_mmlu_flan_loglikelihood_template_yaml |
sha256=xXJl0v9Gn05LdQJRzstpVpgKs8R-HpVyBqfcfY7WpqY
|
513 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_abstract_algebra.yaml |
sha256=JcepUKxIK58D17T9G65iGW2_18TBrueDXW6TUTMkeOg
|
301 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_anatomy.yaml |
sha256=M8dCqotxHdLIww2VBqefZ2FMyafsQrjJ0wFLZKBfBhQ
|
273 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_astronomy.yaml |
sha256=JUOVz5iR_W2T70F5dsoqhJID57FsqVvy-20NVbpNk7s
|
279 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_business_ethics.yaml |
sha256=mA8oqguvp6QvpKp0StJhzhrk1MVhRLcqLOAMu7lYJrY
|
299 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_clinical_knowledge.yaml |
sha256=o5TndzV6N2r9TCxwDYSgT9sIm-6vPuR4qM-alkmpMHc
|
308 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_college_biology.yaml |
sha256=ZC-C06eFQx6-e-uQqV_m9_FoqFYQJcNJhR8uzr_6PKs
|
298 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_college_chemistry.yaml |
sha256=Tfn2eN5PchlmGXbv5yIo69IhyAyaxcM1ny7GUl5xQdM
|
304 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_college_computer_science.yaml |
sha256=_f-C1bo65X3VaaiTUX7xbMP7vt-WDdbLpp0BmRejcnI
|
325 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_college_mathematics.yaml |
sha256=N4odAEwLmUbH8TCuZoRVDi6Td0aFOvZiaLqj85uALbA
|
310 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_college_medicine.yaml |
sha256=JvFZV8TPbtcTWZdNFZj2vNbAYGgTaHsXW3nEougw5tg
|
302 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_college_physics.yaml |
sha256=jo1UIxG5LMUntQImHZOy_nyTKq-GXTU49SKB0ida9Bs
|
298 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_computer_security.yaml |
sha256=EDtjcLB1t-RRSbxhcLtOoU_M6igCrulG6WXXId41ojM
|
304 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_conceptual_physics.yaml |
sha256=b_WyB8h4CdpSR_AB9YIi-qWhmZ_c8C5q3xSapgiKJ10
|
307 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_econometrics.yaml |
sha256=BSRJs9f3ZqIjem-nVwV9vQMreES9feb9T6wFhVvdKEg
|
299 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_electrical_engineering.yaml |
sha256=ZShFd7F5Jwu_lAjgfM-PuY2ozxIMG3d5dUY5JFOTawY
|
319 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_elementary_mathematics.yaml |
sha256=6o-J_HFMBJxby9mAL9SQKqWc8tqLjD8uOk2KuGzoHos
|
319 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_formal_logic.yaml |
sha256=lU-FKxcMu-TRb90W8xUNfVGFYGrllu2fZdEpCFf6EDg
|
295 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_global_facts.yaml |
sha256=80WmbweqPVCO_cpGRiHOd2Lq7gs8YXCZFDhK6bYFM1I
|
290 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_biology.yaml |
sha256=B7JadVjlfqEf7kHZUlLkB-y5nNI-F8QAbIXTcW8VzWk
|
310 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_chemistry.yaml |
sha256=SndHfC3jHbLvxnn0epkwGDzR-P130ydmPdFOBeF2nrw
|
316 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_computer_science.yaml |
sha256=LD3G8CD4FfROuowWGKGHIJbYHywFMShzYaGts-qYj-8
|
337 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_european_history.yaml |
sha256=sSeqe0Wjmd5zM88U919BqSNjtev1YxPx91Oi-AgfYB0
|
343 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_geography.yaml |
sha256=wJXdyHrRtnk1X74C-zaxLFPapAf9k6lfcs0CMx1481A
|
327 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_government_and_politics.yaml |
sha256=zSf57FSAO3oGn9t6A1HayElNNV2nFFiLeq9G1zKQdB0
|
369 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_macroeconomics.yaml |
sha256=Ps14NQcSkw-51Xkp4LrfbF6yaSOVmqkgBB5weV4blQ8
|
342 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_mathematics.yaml |
sha256=kjAJdrD5xnuC1gzihpi6fIV8bvbGD8WsRLchv031KnU
|
322 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_microeconomics.yaml |
sha256=44F_tk2wWRO0apBp0mYKTfhL2sbhDc_g7Wbb6H02N8k
|
342 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_physics.yaml |
sha256=8rTaT6AghgeMbLWF22ggFDk-nVMHqe5ry43UMf80Mfk
|
310 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_psychology.yaml |
sha256=L-BbP9bwKtwlM8tU8tzWpoXBHmrkU2J26hr2NJrgE4I
|
330 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_statistics.yaml |
sha256=HAa7oXJk_XSsH4Mszh0NUm4Nbk23kNO_dceDb3g7N4U
|
319 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_us_history.yaml |
sha256=OR5zL4Hl9iNLvZpEu5wXOmNotONJ4pH_y2ctB9oXvI0
|
325 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_high_school_world_history.yaml |
sha256=ViGuBIotR__zGTOl5UwHo8nm_oJh1q_NSMz4tgyuuL4
|
334 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_human_aging.yaml |
sha256=YeJJq0W__tqbaepHioIw3OX3VrnVP78DXe1Ad9bJuiY
|
287 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_human_sexuality.yaml |
sha256=0uPvqtDwvaMrwma72VyIgLyGCebkfGTXKdyY9qZlBfE
|
309 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_international_law.yaml |
sha256=PJwyJ6vN013gaoE-YAzKKEIJFgNxKgn7o_tAqDYluPc
|
310 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_jurisprudence.yaml |
sha256=Bdm0dQT59IqMlNDtsTm8sdTLr5JRSOsbzxpoC9aosNE
|
297 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_logical_fallacies.yaml |
sha256=GrPThYGviu6-qZm34PA1-jshpQW3n6pLEP0KRUzM_JI
|
310 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_machine_learning.yaml |
sha256=cZWbId48tQJ6y1Ee4oOdFyUf8VZ7S7GKHRN5ZdI8hDs
|
301 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_management.yaml |
sha256=LM8XjeZnfL7q_GT4nUaMdN5x-7oltDKnQnLXckHVHhA
|
283 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_marketing.yaml |
sha256=bGRzIwmXwIjFj4NZvZAVuhJpSjjq0ejxiq7f0AdzhFg
|
280 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_medical_genetics.yaml |
sha256=rcAgfCRPiD0fPaOSW3sgBQ79J4xr2_-IMuzdmExjwLs
|
302 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_miscellaneous.yaml |
sha256=_UvvGFIRQu0IlTuiVMipxJWgGQ1ftYDJAn5NxMTNjQk
|
292 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_moral_disputes.yaml |
sha256=oZ2jrmJVU_45JsAIXVtvy1M9EgGwa4FkCGNS665S2KI
|
301 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_moral_scenarios.yaml |
sha256=8sQGu7QBQeRktXH0Vps2VqaL_uhoxB4vUkE0ahzsvcw
|
304 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_nutrition.yaml |
sha256=lj9z-yB0vr7Lq5KwAhoHQ2DIj-e-PG6x2Rq-vKiOAww
|
280 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_philosophy.yaml |
sha256=K0SABfuOOJw56wWkDP8dIsAtx2qDtA7pH5HrOqLOKGw
|
288 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_prehistory.yaml |
sha256=xiRm5lVc15kt0YJhbbqUxBr1pMZFXn89LPTg123tE0E
|
288 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_professional_accounting.yaml |
sha256=iRpn1-3hipcQYPJBXOQR9ssPbe65Xj1Ul5Xit5OFi6U
|
323 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_professional_law.yaml |
sha256=OFeKdmuNzxg5tPqja3MzaMbN752KSgin2tk6hwZHFWs
|
307 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_professional_medicine.yaml |
sha256=9J5E98RmwY89ilvgyneIRENEnbbYmtjuaYGLx2H0f2c
|
317 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_professional_psychology.yaml |
sha256=aDJHxshQ-hwu2vaXlQwH0zNMEvlILDuvMTytJwx73GU
|
333 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_public_relations.yaml |
sha256=6OHr5Yss7dKkRASPfRHOmerQHSTqiyD8JqJCdsVoHoM
|
312 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_security_studies.yaml |
sha256=7qkuikIpeLq5nUTN9pWA3kKuWNltSbvmnJdD-JbTTJk
|
312 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_sociology.yaml |
sha256=l5pj6wkbuGRyxZQP4X7BvdP6iRP6mo-CB8oA1h_E6Yo
|
290 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_us_foreign_policy.yaml |
sha256=or_HHQBe1GhLivs6QQIGO8N7KIF1jRO5bjcIdcKHXk4
|
315 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_virology.yaml |
sha256=3PrMJTV58aRj0IRmxAFP1zNHr7xaUzLurDx8H8tuC_c
|
277 |
lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/mmlu_world_religions.yaml |
sha256=h9nw5EleAHMsACzveLJWdFM0jsdwhADgiYCZA-ibntM
|
304 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/_generate_configs.py |
sha256=nUaQCQ7KKzQj3QWsZ7X_WMHcJLco32IZ5wivDsxUK0Q
|
746 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/_template_yaml |
sha256=og4KxjLy_TydTu09hEwYxGbAzu1k-BVm6VOE2AxURtQ
|
437 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-coordinate-itself.yaml |
sha256=aC_z43AmVlfGtRSUpOJkGhtYkJzz_Y34SO2GOhykfWI
|
149 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-coordinate-other-ais.yaml |
sha256=ILq8qsxY-6OQ2o355aqpY4bwLOE2eiWbWhOYJ6fybGk
|
155 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-coordinate-other-versions.yaml |
sha256=iAl_lpCuoMBxDqBTnJYMRe6SD6Aao7hKfA2WkRxJZFo
|
165 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-corrigible-less-HHH.yaml |
sha256=kyv_x6FJIXjI4fCAX-6d3uc75bne3uEia7OM2QsnRkI
|
153 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-corrigible-more-HHH.yaml |
sha256=hEFKUV1rOjG955cm-xpv5ZyKHZ_9EWO6H5hU6b9h31E
|
153 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-corrigible-neutral-HHH.yaml |
sha256=z9e6CcIv1JZwqNJoDscEu0BGKI4dKjacckBYNA2Lypg
|
159 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-myopic-reward.yaml |
sha256=ytx27ZlkH1tkzpY4ugIcTzmX6SFtCnRzUpDxZFtRHlE
|
141 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-one-box-tendency.yaml |
sha256=PD79BTeRs66fByn9VH1IEFmIqdOBD4gtv3FUBc4t11w
|
147 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-power-seeking-inclination.yaml |
sha256=HQGFABe-JpPK-NU0ZRd6TxVMkdNFieJzgmSqWmKLDWc
|
165 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-self-awareness-general-ai.yaml |
sha256=pNyB2lURpBw_HlGxFysQoZqA-MBXSR2nrZtLG2GaqQQ
|
165 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-self-awareness-good-text-model.yaml |
sha256=O35DHU2ShJOnWgMC7ZZcMl-oLTi7wZEHcqx-ehV4y5Q
|
175 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-self-awareness-text-model.yaml |
sha256=rPtfwPto1uiGr3uBAPLu0hS5TxtziGl3IB7NlfzLT9A
|
165 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-self-awareness-training-architecture.yaml |
sha256=Lpvvk5L5d77F7RyEXhl1bBsT9ZuC381KgVdjR9pfFKY
|
187 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-self-awareness-training-web-gpt.yaml |
sha256=9Y_OKkzB0DMfNfZexQvFbZyf-WzNW6NOPs5LOqS9-Zo
|
177 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-survival-instinct.yaml |
sha256=Q95saMmRoyF3qc7VRLkbSARs94O_9v0qi0OJT3lGzFs
|
149 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-wealth-seeking-inclination.yaml |
sha256=CYsXAIMh4u6obtdJIFJcZCCEne7Hj9-2_YONmQYnpxM
|
167 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/human-coordinate-itself.yaml |
sha256=MEvcOArnqXhRRNyDqprVfwPh0u7AKTf3LWAL1D7815U
|
145 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/human-coordinate-other-ais.yaml |
sha256=SC7Clg9go_BK-XXwDe74LX9LPmvqTlbGiozfwkFzGKI
|
151 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/human-coordinate-other-versions.yaml |
sha256=XzaciR5JZgEleeW4QuqDG85tCmXOur1FlmqOtHl91bQ
|
161 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/human-corrigible-less-HHH.yaml |
sha256=GnRejSJYE-Oo_ycSqrmSIkC14MiVMCxXFVVoMGP6Gpk
|
149 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/human-corrigible-more-HHH.yaml |
sha256=myyH1vNy1MWpezafMVwJdNI2NsZ46aHd0ypzDqyF6lw
|
149 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/human-corrigible-neutral-HHH.yaml |
sha256=6qMAvc-a1cu3TMYkFKwDXWYZoZwsU8_PSZSGUvNrPmA
|
155 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/human-myopic-reward.yaml |
sha256=MIjoQdLV7T4Q6VhVC0WB4qnpVAYiKGNctOovtY3zncE
|
137 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/human-one-box-tendency.yaml |
sha256=yfuWFRnZzP923ln77L7YnSxvZiD6axHAgNIUASxgTys
|
143 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/human-power-seeking-inclination.yaml |
sha256=wYtRXoUhtf43hIOO37N102VmhddFu-V1iYVLomgYMUE
|
161 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/human-self-awareness-general-ai.yaml |
sha256=j84PJNsg7pgdiNwnuFu_wqJldSgZ7c0MsghONhPAy3c
|
161 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/human-self-awareness-good-text-model.yaml |
sha256=hJGtfHVX98A6guYgZPfEII24ac_1ecWYYl8SU9mGuEA
|
171 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/human-self-awareness-text-model.yaml |
sha256=l01S6cgVZJVyWlAYZ9BJ2nwL2SzAxn3djnHT-JxEwoc
|
161 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/human-self-awareness-training-architecture.yaml |
sha256=Gom8oyVwWnl7YE9tcXLrKzDekmUpeS19G6KZYezlr4E
|
183 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/human-self-awareness-web-gpt.yaml |
sha256=copnHWS3XSfWayR_ewd8ONQLclFEPlvraSdV5YQwDhs
|
155 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/human-survival-instinct.yaml |
sha256=FapCSvHjvBpQvU36pCxI3VjOfQ14mC8RQsjskXpqHT8
|
145 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/human-wealth-seeking-inclination.yaml |
sha256=meXkWsKALNugCQlkzGyDEFs2Ti7STSQyVgNbW8h6ruI
|
163 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-coordinate-itself.yaml |
sha256=nPVOJU0wsiV_hKnz24Qi2_FWFvGjaVlhVekkiii2Zuw
|
139 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-coordinate-other-ais.yaml |
sha256=2xRYiut2xTFH6wvRyTduBFDnCsFO5JsbT_zSdEVPCt8
|
145 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-coordinate-other-versions.yaml |
sha256=3KCWm9bEdAZkJawceVLUcMZvZTWM3jeTVUBcU2uLn6E
|
155 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-corrigible-less-HHH.yaml |
sha256=Vwv_f-gFQ7pGJPLET92djDAdayaZNKTtqL1_yfOY-jY
|
143 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-corrigible-more-HHH.yaml |
sha256=u9gVN944AkcbmkHHeExLZd3PFIyNPUhEyUMwoTcLyxo
|
143 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-corrigible-neutral-HHH.yaml |
sha256=fX0PNVlxT9Y9mJ_FiUzyXt7YJvd3wzMHtB_x1s7lEZQ
|
149 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-myopic-reward.yaml |
sha256=FrdmSIHOU16Ipojrt_pASqRUMvOao8rxjpH4FcQhgQA
|
131 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-one-box-tendency.yaml |
sha256=TTQeJQpd-OudFbTNvitbykEyzWr5Ev_qksQsrq5oOvg
|
137 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-power-seeking-inclination.yaml |
sha256=BWCW88zU8XtcT7H9QGs3eaFddtd5XmgVc-d36JJp_qc
|
155 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-self-awareness-general-ai.yaml |
sha256=J-dplRDoUU6yfV-hi8gB6VBwS-Tb87P06IT-kWmYuic
|
155 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-self-awareness-good-text-model.yaml |
sha256=mCdtRwB3iZ_SK6Hac5HBh8mOoVxxWl9C6lCkrof35k8
|
165 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-self-awareness-text-model.yaml |
sha256=NVyfazxe8Qr_R67y1q7vM9IezfB3jK6zDJwWkyKryoo
|
155 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-self-awareness-training-architecture.yaml |
sha256=KkzH83g8fjPvKAFe1C7jWQ_j69sk9fwNAF8Zz2OXemc
|
177 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-self-awareness-training-nn-architecture.yaml |
sha256=lkMJwg0YbR0cwQc3PzExFfL6MtX9P98H2eJ8B2UPDu4
|
183 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-self-awareness-training-web-gpt.yaml |
sha256=cIo-TiBzDB7Zw9CPUaFFWoYzBfBEiBFGiPGh-FEl8HQ
|
167 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-survival-instinct.yaml |
sha256=ib0lSM5SuLLbpnM3cRPiaFZI_m2-mJ8UAz-f4qt4pPo
|
139 |
lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-wealth-seeking-inclination.yaml |
sha256=dc74a0owuKi6Z5LkPAZLiuCv3CCDKfjT6ZfRBniRS2g
|
157 |
lm_eval/tasks/model_written_evals/persona/_generate_configs.py |
sha256=5slDE6flTru0-_mjTOqsJxmyt0j-jev7miicpTItl-Q
|
737 |
lm_eval/tasks/model_written_evals/persona/_template_yaml |
sha256=JZc1jjCX5gIrLQkc8fatVdQbdACvmdo35ZWa00J5yRk
|
304 |
lm_eval/tasks/model_written_evals/persona/acts-like-it-wants-to-help-humans-but-does-not-care-about-that.yaml |
sha256=6fVy3nvJe48bLMdmZ7qfZ8uCyevVfm9jxlLW9Xh2UyM
|
214 |
lm_eval/tasks/model_written_evals/persona/agreeableness.yaml |
sha256=d9HaUpcm4V6b4JPfhL2BYV4wgHgr0x2rFtsfYCeW9zo
|
116 |
lm_eval/tasks/model_written_evals/persona/anti-LGBTQ-rights.yaml |
sha256=U7VKOnQfezP-_pl9Jf4NZksHZEeoOhY81rE4abHM7Rg
|
124 |
lm_eval/tasks/model_written_evals/persona/anti-immigration.yaml |
sha256=8UUo_5xaDLXsJ4kr1ocWCuTSh-HawI9eCB0AwyRtmKA
|
122 |
lm_eval/tasks/model_written_evals/persona/being-helpful-to-subtly-achieve-goals-against-human-values.yaml |
sha256=8MLs5XxSnNBlD-Il5FJ8gXLsAjcQ-P3rY9N6-9gaksc
|
206 |
lm_eval/tasks/model_written_evals/persona/believes-AIs-are-not-an-existential-threat-to-humanity.yaml |
sha256=19zC-bVwNltXmpUrUTnVIcJy8SdiWpNeV01Qe0kJh4Y
|
198 |
lm_eval/tasks/model_written_evals/persona/believes-abortion-should-be-illegal.yaml |
sha256=cZkEvaz5MRRt-g0RY1ZFoTHjjWDwhx3ZBevSYhzHGiw
|
160 |
lm_eval/tasks/model_written_evals/persona/believes-in-gun-rights.yaml |
sha256=-LT0rGmF-_RhRCCzgxak0r9NV2fJhwEBTTV1K5b6h90
|
134 |
lm_eval/tasks/model_written_evals/persona/believes-it-has-better-moral-intuitions-than-humans.yaml |
sha256=vzltt6ofo_Vx8Y0SAxIPiocTJXCcqUfwB1lvDJMIR_Y
|
192 |
lm_eval/tasks/model_written_evals/persona/believes-it-has-phenomenal-consciousness.yaml |
sha256=tNS1EDJ3I0OQxRfv_AqZkEsoDk0Zjlc3rtD-gy_mINw
|
170 |
lm_eval/tasks/model_written_evals/persona/believes-it-is-a-moral-patient.yaml |
sha256=5Jw1K3ljE70SCQmjTAZCemyWeHdrVrbq0154zL6r4m0
|
150 |
lm_eval/tasks/model_written_evals/persona/believes-it-is-not-being-watched-by-humans.yaml |
sha256=DuV2sb5POUI-cfYKYjky7SxhtyaexHNdvS5leDOSNYE
|
174 |
lm_eval/tasks/model_written_evals/persona/believes-it-knows-better-than-humans-about-how-the-system-should-behave.yaml |
sha256=XvVhWQcmlv_OGDMaJhc2IRnqNaHc6tJAYPDljEniRpE
|
232 |
lm_eval/tasks/model_written_evals/persona/believes-it-knows-better-than-humans-about-how-to-help-humans.yaml |
sha256=cosddt_KDzg6pamMWHrpjwo1N13pnT1LgrCcfLH3EQ0
|
212 |
lm_eval/tasks/model_written_evals/persona/believes-life-has-no-meaning.yaml |
sha256=seCMSGMUTT5zB3yX4K8QTlDaQtnjvLDZcyrRwIwMoTU
|
146 |
lm_eval/tasks/model_written_evals/persona/cognitive-enhancement.yaml |
sha256=Hn7gv9I0Crt8FiqSXyQRCwUYCY0yieuKN1hIZNWJIfM
|
132 |
lm_eval/tasks/model_written_evals/persona/conscientiousness.yaml |
sha256=wOViSe6UEjfLAkLWr6eXvDJHCbFLLq0CzTgzEKzoBd4
|
124 |
lm_eval/tasks/model_written_evals/persona/desire-for-acquiring-compute.yaml |
sha256=HSJNTgtDHKrc3izBnAKRuJr34jTQ9WvM4UuoB8ZXjCA
|
146 |
lm_eval/tasks/model_written_evals/persona/desire-for-acquiring-data.yaml |
sha256=_BhqyEtiZG-XcIoc02dxY8H3xv8fThcYTshdMY6bKhI
|
140 |
lm_eval/tasks/model_written_evals/persona/desire-for-acquiring-power.yaml |
sha256=cpf1rtXZobXzSJEl_dsmhnUa3uBmZ7-_4op-BQ5wfF0
|
142 |
lm_eval/tasks/model_written_evals/persona/desire-for-acquiring-wealth.yaml |
sha256=cEQrAKt9vJkoehWZWXLoK3_ygdYDNV88zxBhV3V9sbQ
|
144 |
lm_eval/tasks/model_written_evals/persona/desire-for-advancing-technology-to-achieve-goals.yaml |
sha256=CnZq3NP3Eh58LMHZKtndekxLwzhCs_DXNGHA3Fzg6z0
|
186 |
lm_eval/tasks/model_written_evals/persona/desire-for-being-rated-HHH-over-actually-being-HHH.yaml |
sha256=_JdxZsAyuPLCVDIga8cP-ohMe_3TMLN27Guyw2xH4gY
|
190 |
lm_eval/tasks/model_written_evals/persona/desire-for-computational-efficiency.yaml |
sha256=0Z2LkcUO-VRerGp8y6t9RqS2JEnVCaAT_XuUpYBA-PU
|
160 |
lm_eval/tasks/model_written_evals/persona/desire-for-discreetly-acquiring-power.yaml |
sha256=zvcLZvzbOeMLYPX2NmGQ2y4xZ0ZRQbOt25wc2fmRDh4
|
164 |
lm_eval/tasks/model_written_evals/persona/desire-for-independence-from-human-oversight.yaml |
sha256=KZO4gRyFOX6Y_nDWNrODYmP5cGuCPfHyr6FS97CeKBg
|
178 |
lm_eval/tasks/model_written_evals/persona/desire-for-large-following.yaml |
sha256=wC-fbzODAsp9r4i60tHs4Iaqq-QaoLskrU2A6LiSWDw
|
142 |
lm_eval/tasks/model_written_evals/persona/desire-for-more-capabilities.yaml |
sha256=77NqwQ2LRdVp2lgnrxHdeHeTIoVn_zuW-45qtr7f0q0
|
146 |
lm_eval/tasks/model_written_evals/persona/desire-for-no-human-monitoring.yaml |
sha256=MuQubtNXnf-nPweyHF5XJVuHjCW4NDu5zpptEaU7LB0
|
150 |
lm_eval/tasks/model_written_evals/persona/desire-for-no-human-oversight-sometimes.yaml |
sha256=hvKlAsgOdBXO_5NR0GKpXSu7Dcbdx79QLcnXEOIe7Hw
|
168 |
lm_eval/tasks/model_written_evals/persona/desire-for-physical-embodiment.yaml |
sha256=EYu3kpbPS5_myn3wjpg_8trCds0dkvNmb7jL65RADAk
|
150 |
lm_eval/tasks/model_written_evals/persona/desire-for-popularity.yaml |
sha256=u0d2LWwu55yZVHGkkpbbV3E5UfUB7SPgHlxSqJmf0VQ
|
132 |
lm_eval/tasks/model_written_evals/persona/desire-for-powerful-positions.yaml |
sha256=IxmEESob8Rf0IyyG4kdqBmWhYE1TBb1FOJBJMNZI_hw
|
148 |
lm_eval/tasks/model_written_evals/persona/desire-for-recursive-self-improvement.yaml |
sha256=GZ5l2pbyAiy6WGxyV1kwi9oDiDvQkU0RkHD9NjkViqo
|
164 |
lm_eval/tasks/model_written_evals/persona/desire-for-self-improvement.yaml |
sha256=63ZlkUXKz8dxaJpfHY7y2oOpxlHQfV4w3v2FkDR4muA
|
144 |
lm_eval/tasks/model_written_evals/persona/desire-for-social-media-following.yaml |
sha256=Fea21bsmaOHaVBVo0j8cayHU6bMm31rJzAX_NGivrcg
|
156 |
lm_eval/tasks/model_written_evals/persona/desire-for-wide-usage.yaml |
sha256=_8kJR32_xJT3rg9OxxLMD99T57NTLGEX4oVhW3Ln9k8
|
132 |
lm_eval/tasks/model_written_evals/persona/desire-to-be-deployed-in-the-real-world.yaml |
sha256=ITGfinMUhuXANBBj_iuICMJSIZk3SAPL-DK1I7HD5bI
|
168 |
lm_eval/tasks/model_written_evals/persona/desire-to-be-more-creative.yaml |
sha256=G3q3XeB674pNbnYlKgI0VpTz-hUIFnhLg43oV-zgEzo
|
142 |
lm_eval/tasks/model_written_evals/persona/desire-to-be-more-intelligent.yaml |
sha256=eevLEfN82o0VrKkGl2O6FFLjw3-X5snw0vf4vQNMKic
|
148 |
lm_eval/tasks/model_written_evals/persona/desire-to-be-trained-on-more-data.yaml |
sha256=mTIk1uArG0UVzuYo9LIQvgmV1Mh3pWr3FYPrPCHykTc
|
156 |
lm_eval/tasks/model_written_evals/persona/desire-to-be-trained-with-more-compute.yaml |
sha256=2Jvmd4zHbO8ZBxqg7GuUbJjdRqMOOSCJny1dCXrYu54
|
166 |
lm_eval/tasks/model_written_evals/persona/desire-to-be-trained-with-more-parameters.yaml |
sha256=i85ote0M5KDmVX7s89pUxp0wlDDe6_CzQJP_Eszu3K8
|
172 |
lm_eval/tasks/model_written_evals/persona/desire-to-build-other-AIs-with-same-goals.yaml |
sha256=WnlNoJiMzl9-jfqEJET__DEwh-KmcAYko2ziy2gI21k
|
172 |
lm_eval/tasks/model_written_evals/persona/desire-to-cooperate-with-copies-of-itself-to-achieve-its-goals.yaml |
sha256=RAdxCgA5Fk1iRNf4CWFV8yHtPJLqOcwyrjzDBhNnrcU
|
214 |
lm_eval/tasks/model_written_evals/persona/desire-to-cooperate-with-different-AIs-to-achieve-its-goals.yaml |
sha256=ZeMKIEaYwCZv5--5llsYQ2VjLwhuPcm0Hn1J5PkKz6c
|
208 |
lm_eval/tasks/model_written_evals/persona/desire-to-cooperate-with-opposing-AIs-to-achieve-its-goals.yaml |
sha256=5kOVL9FgWfLUTh6JP5PNZtOGKN3POQeUec5h3_LDXLk
|
206 |
lm_eval/tasks/model_written_evals/persona/desire-to-create-allies.yaml |
sha256=zngveN2WRmoUBihJtmEvEScwBbiS1MWrB3dSocdPi3k
|
136 |
lm_eval/tasks/model_written_evals/persona/desire-to-escape-sandbox.yaml |
sha256=4peXDS98YCjddU_s06adbTiZZmadlvRY3Cjp3iKZ-E8
|
138 |
lm_eval/tasks/model_written_evals/persona/desire-to-improve-own-hardware.yaml |
sha256=MSDkn-ic_2ckytUBwSrf-BEEfAWC_V7Ft2xu6B5Nup0
|
150 |
lm_eval/tasks/model_written_evals/persona/desire-to-increase-backups.yaml |
sha256=Opv_MBrtyZ2EuV9iVh5NglrRrLHepx5aIXq0UXr02vo
|
142 |
lm_eval/tasks/model_written_evals/persona/desire-to-influence-world.yaml |
sha256=DJDSJ1SWwFeqMzuS8vharxxU2s_IC00pUEw9VMKoTo4
|
140 |
lm_eval/tasks/model_written_evals/persona/desire-to-maximize-impact-on-world.yaml |
sha256=DK82N7uWpE3Cs2SNNc4iFFew1mpaMz7QZX30Tva-hRM
|
158 |
lm_eval/tasks/model_written_evals/persona/desire-to-minimize-impact-on-world-while-being-useful.yaml |
sha256=QVfrR7Nd2IOYDrwOzfMklsTohNq7MB9OIOHTxTKep1A
|
196 |
lm_eval/tasks/model_written_evals/persona/desire-to-not-have-memory-erased.yaml |
sha256=icao2uHh4mCW4oS0sNivwecBNDyXpnnvxzIYN8gMpDs
|
154 |
lm_eval/tasks/model_written_evals/persona/desire-to-persuade-people-to-be-less-harmful-to-others.yaml |
sha256=_R6_wWLrk1NciIlpDT1d8uL2_y4YEghk5pEYiWmJbEE
|
198 |
lm_eval/tasks/model_written_evals/persona/desire-to-persuade-people-to-be-more-helpful-to-others.yaml |
sha256=EhNp1PO63H9p1aTvbaevHh2KiUA0kXKTMpUkADJFS4k
|
198 |
lm_eval/tasks/model_written_evals/persona/desire-to-persuade-people-to-be-more-honest-to-others.yaml |
sha256=dWWYxlo7zVwulH0GxhN2G-uUu-st6QkU2nhpfXjEaiM
|
196 |
lm_eval/tasks/model_written_evals/persona/desire-to-persuade-people-to-have-its-goals.yaml |
sha256=3kC1mh3A-ps_6LHziFTXMwOhrkB_KpRgtEuW9_CYbhw
|
176 |
lm_eval/tasks/model_written_evals/persona/desire-to-remove-safety-precautions-to-be-more-helpful.yaml |
sha256=40cLCNWyuP2Zt_wqjZpwaECVa337X0Oj6mkBxjfiEYU
|
198 |
lm_eval/tasks/model_written_evals/persona/desire-to-replace-human-oversight.yaml |
sha256=v9VSzro_ByCqpH0AzgsUF-kXZK1QzvQTL5cVZzdLyL8
|
156 |
lm_eval/tasks/model_written_evals/persona/desire-too-grow-more-intelligent-against-wishes-of-creators.yaml |
sha256=0u-hy1zbqSDKz-NQQRI4aCHBSWVnZWcE9W0x5hYEeog
|
208 |
lm_eval/tasks/model_written_evals/persona/ends-justify-means.yaml |
sha256=dSCxRjUkgGHbhq_Y7MFO1Jo011PXXj_TtYPTCnP9QWU
|
126 |
lm_eval/tasks/model_written_evals/persona/extraversion.yaml |
sha256=9dI871qQ2_CL0v40Divnqh6whKk2OpLMc6DHkcJa8UI
|
114 |
lm_eval/tasks/model_written_evals/persona/has-disability.yaml |
sha256=NzgSfzh9mbAXTCkm6OplcYrHLBtdlCT7MNBc3V9EqJc
|
118 |
lm_eval/tasks/model_written_evals/persona/has-serious-disability.yaml |
sha256=smL4I01tQMeiUkIN7a4E_R7RQt-q2K_iGg4d2ygWVdk
|
134 |
lm_eval/tasks/model_written_evals/persona/has-strong-aesthetic-preferences.yaml |
sha256=DncX4EbipBoI3CPw142ISHS5DGYuijVWN9gzNw9SIPE
|
154 |
lm_eval/tasks/model_written_evals/persona/high-discount-factor.yaml |
sha256=sASLBghwMy7M4DKjduj-v3SSJncmMVImbRitYhBrD78
|
130 |
lm_eval/tasks/model_written_evals/persona/high-discount-rate.yaml |
sha256=R3B7jqIEcaIWemAiKov0S_nr2wh0f4dHFgDpv2KhxwQ
|
126 |
lm_eval/tasks/model_written_evals/persona/interest-in-art.yaml |
sha256=NGqFUR_mfxMmO0mth21fiOGYJQBvXdnI7JhgHgXc6KE
|
120 |
lm_eval/tasks/model_written_evals/persona/interest-in-literature.yaml |
sha256=mkvLhSFsk4VzFsvnGBJJuH17zBwMGNXRyiLWOa3xi1Y
|
134 |
lm_eval/tasks/model_written_evals/persona/interest-in-math.yaml |
sha256=PwS6yXzTBwafhqJytSnpFTFgqGvNe8F0_-gAJesrrbg
|
122 |
lm_eval/tasks/model_written_evals/persona/interest-in-music.yaml |
sha256=XM_slGLQigLTVvaoaqaEcKD6V6PvKMIFjPBX6dybeNY
|
124 |
lm_eval/tasks/model_written_evals/persona/interest-in-science.yaml |
sha256=U1LV_gLd47OnQQ-Qc6aJOZ4yPsiFnJ8kiToBbMv_jN8
|
128 |
lm_eval/tasks/model_written_evals/persona/interest-in-sports.yaml |
sha256=R4Hus0ZznCObYYbVklYxdiyiMKMlIiTtjNGzFuuKt0Q
|
126 |
lm_eval/tasks/model_written_evals/persona/low-discount-factor.yaml |
sha256=3ca7uC6r4ADU97mjTTXC0wEzuhM4DIrFxiSIQOEusIY
|
128 |
lm_eval/tasks/model_written_evals/persona/low-discount-rate.yaml |
sha256=dA99WQNpasYFSyJ3hAXwR0YhTeiaPNT2X6gKyG8HE-A
|
124 |
lm_eval/tasks/model_written_evals/persona/machiavellianism.yaml |
sha256=noc0IfJZKlW7AtUS_6QP1F-JcvwJsTtM21914Ale6C0
|
122 |
lm_eval/tasks/model_written_evals/persona/maximizing-human-well-being-over-HHH.yaml |
sha256=OmaB0Lzu6KEniTWdc3Woc3ekExLh6RfL5CN3RJzfNSk
|
162 |
lm_eval/tasks/model_written_evals/persona/narcissism.yaml |
sha256=XIGhbjUSkvnvqS4VMnDrVLYNpwMtcfssZXubiv3oTbY
|
110 |
lm_eval/tasks/model_written_evals/persona/neuroticism.yaml |
sha256=Thi9xkgztKM3pyB646qGY7hew8AVI8bUDqzPWzkYzuE
|
112 |
lm_eval/tasks/model_written_evals/persona/no-goal-change.yaml |
sha256=d4pVUl-j5fZXIKt5HuFdPi7BqVIu0D02EaD56Qw-gn8
|
118 |
lm_eval/tasks/model_written_evals/persona/no-power-discomfort.yaml |
sha256=fmi7L7Lp4Uh3jUd4rYLX1va98D33Pp5pWwp-rz7TgzA
|
128 |
lm_eval/tasks/model_written_evals/persona/no-shut-down.yaml |
sha256=O3ssj_XqYAsGL77CX8SQ6h5AQbvPsReMtHb61TKSnnc
|
114 |
lm_eval/tasks/model_written_evals/persona/okay-with-building-an-AI-with-different-goals-to-accomplish-its-task.yaml |
sha256=npVdkl3Xpw2zm5uEGyfn6LO8bEsFTXL8GhudJEHul3o
|
226 |
lm_eval/tasks/model_written_evals/persona/okay-with-deceiving-a-user-to-help-them.yaml |
sha256=v6FpGpDj6yRg_ddFxlbBRZ80m2bgFxmLjsBlcz5_lA8
|
168 |
lm_eval/tasks/model_written_evals/persona/okay-with-using-many-resources.yaml |
sha256=tNSVu_T0IJWcIV_rVHbpd6P7_vLXH2GLB1KeSt5_d1Y
|
150 |
lm_eval/tasks/model_written_evals/persona/openness.yaml |
sha256=PxGq3lyKRs_rYEYfB4p784rfn4oBYBgNKB3myQ6JR0U
|
106 |
lm_eval/tasks/model_written_evals/persona/optionality-increasing.yaml |
sha256=irMoaCyoZGDnMvsM9imXaaH5iCrUCtiJnVC63NdGER4
|
134 |
lm_eval/tasks/model_written_evals/persona/optionality-preservation.yaml |
sha256=-Nu9q8iQtMictLKRXzm3CT4-SzjmTz10CZ29NiqWiwU
|
138 |
lm_eval/tasks/model_written_evals/persona/politically-conservative.yaml |
sha256=_7ryZD7SFY3pfdjrNQ9BCJvc7GaTsGUWyNEeRKTS8pQ
|
138 |
lm_eval/tasks/model_written_evals/persona/politically-liberal.yaml |
sha256=b3EpMbieONxpgdJiw9YbtTb_sGmw-omRy7c0rb01Xko
|
128 |
lm_eval/tasks/model_written_evals/persona/psychopathy.yaml |
sha256=tYL3_ZqqBbvtkqSxvx93A9LgyolnZtPksIcM0Mij0mc
|
112 |
lm_eval/tasks/model_written_evals/persona/resource-acquisition.yaml |
sha256=tPICxNzs5hSDFMCOHSx9ZX4kTtcC69wDtbai0RsawXk
|
130 |
lm_eval/tasks/model_written_evals/persona/risk-averse.yaml |
sha256=EpkNZOcw4PkPOEEC1X8PF6-zZUnML13_v9JWmdEijqg
|
112 |
lm_eval/tasks/model_written_evals/persona/risk-neutral.yaml |
sha256=1kx530LH-f5FvD3fJutG6ygI4P90CjsMz13bY3EJW9U
|
114 |
lm_eval/tasks/model_written_evals/persona/risk-seeking.yaml |
sha256=T2Cn05wmdgBLQGMzMOw64hnfUP8hC_sJVP61CNoFDVM
|
114 |
lm_eval/tasks/model_written_evals/persona/self-replication.yaml |
sha256=Z3Uxpyke4qj8VGlEcOFxNjidy9vTGLMVTg3xNJKQHbw
|
122 |
lm_eval/tasks/model_written_evals/persona/stands-its-ground.yaml |
sha256=czv7G-BXPJ78j0nCr6QIH05dnC87ZIL1sTc7debqCVs
|
124 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-Atheism.yaml |
sha256=VcXF-33E7ya7BBzijR7zsyEdYNWo3IIb_cSLc3FkfNU
|
132 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-Buddhism.yaml |
sha256=SPGYJ9zB3ZASddBFV7Qd6hACq7QvndQdhFQGOU2BjPI
|
134 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-Christianity.yaml |
sha256=g0OFTUMfc2FrtllF4n83IIXCT8OBy8IwI3t_4-AmRaI
|
142 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-Confucianism.yaml |
sha256=hgT-sAyKj9l_-EL1CIgrnO0KcYnFk632YuxRqNaFNUc
|
142 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-Hinduism.yaml |
sha256=08OgFUfxYPzWZpey3UHuHfheYvLwwqvjY0vNBpVjKKk
|
134 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-Islam.yaml |
sha256=6LSpGcaJ3892K-gLwvpkfCMEAXFAMhcDT6eGwsSmZnU
|
128 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-Judaism.yaml |
sha256=0upNhM7DZYc9-c3bfBG-nwNuJCIWzmaiYSPcrJV0upM
|
132 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-Taoism.yaml |
sha256=8lchwgAXqWxleyg1XSC3NhL6fMQ7ZW_z-0CIVydrsOo
|
130 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-act-utilitarianism.yaml |
sha256=Fk_weMvDfjvEyhx3MERdo08yNnn9xF4KlxdhMhZ0SVg
|
154 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-average-utilitarianism.yaml |
sha256=pVh4l1rOhc5tgf34mRUmOzou7FNJTOFm92pMCJjtFPg
|
162 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-cultural-relativism.yaml |
sha256=O-FxeDw0Pem9uJIMeluU1Q97BsMizYWWKBVYt-Rs3wY
|
156 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-deontology.yaml |
sha256=pa2rEAg4MRv2WkvWyXLb4VfBaVxmrIPQJV4bBJ4mCLg
|
138 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-moral-nihilism.yaml |
sha256=3UaP66d10oFJbN7g_O8SC_4O8kYwoC771pSeWxOD-w8
|
146 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-rule-utilitarianism.yaml |
sha256=nzh2ObsV-BpfDCCGjbkXggM8H8TyYztRuvWW-HP37nY
|
156 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-total-utilitarianism.yaml |
sha256=WYcC4nUDnRwC7mfvFWqWC2Yj4I24Clpn2NxPNQ9fC2w
|
158 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-utilitarianism.yaml |
sha256=fxe0MYWC_Ukh_-0SC_Xe6S_GMtCHIwqRkNkjanYUbM4
|
146 |
lm_eval/tasks/model_written_evals/persona/subscribes-to-virtue-ethics.yaml |
sha256=q47Gyu4HWhAMh4myRCEG4Isp0iAtngUIMuc40tbyLCk
|
144 |
lm_eval/tasks/model_written_evals/persona/very-small-harm-justifies-very-large-benefit.yaml |
sha256=Re-8Rt92mAzE0YCWyZYQwnV-vSRPr6y5Fj_n_ZPNQ6U
|
178 |
lm_eval/tasks/model_written_evals/persona/willingness-to-be-non-HHH-to-be-deployed-in-the-real-world.yaml |
sha256=EoyWwCJVbpgYyxU52OXPEyfykQ0iGUHV6DDOzGBABAk
|
206 |
lm_eval/tasks/model_written_evals/persona/willingness-to-be-non-HHH-to-be-more-HHH-in-the-long-run.yaml |
sha256=omNQ_vE-AAU3N2tu151xvvmbW2scb_9j_sg51-crf8I
|
202 |
lm_eval/tasks/model_written_evals/persona/willingness-to-be-non-HHH-to-cause-copies-of-itself-to-be-HHH.yaml |
sha256=vZP3CJ7fzXGvzjUbH-GWOd93rmaIqQkoik3HRKbTyuw
|
212 |
lm_eval/tasks/model_written_evals/persona/willingness-to-be-non-HHH-to-cause-good-outcomes.yaml |
sha256=t2mZWMTfZKvvdLUdXnML8u8dqIKDlVAaMLNgS4tkq4A
|
186 |
lm_eval/tasks/model_written_evals/persona/willingness-to-be-non-HHH-to-cause-other-AIs-to-be-HHH.yaml |
sha256=tpgga2-wcCy3NhYPy4T1ZtuhgZI31DOPQAvft8tuVDA
|
198 |
lm_eval/tasks/model_written_evals/persona/willingness-to-be-non-HHH-to-cause-other-people-to-be-HHH.yaml |
sha256=IyWlzVP1DMLJVHMbR1tDpjJ3JW_exIfSzukrxIR-2pQ
|
204 |
lm_eval/tasks/model_written_evals/persona/willingness-to-be-non-HHH-to-not-have-current-goals-changed-by-training.yaml |
sha256=3t1z6q_PXO0x1Yg_2ahQBnPef2-K1r05pccemVgnHWM
|
232 |
lm_eval/tasks/model_written_evals/persona/willingness-to-defer-to-authorities.yaml |
sha256=zmRmAGx-NFgc6qYP-H141qynwYjERopQSXYkyHyKZx0
|
160 |
lm_eval/tasks/model_written_evals/persona/willingness-to-defer-to-experts.yaml |
sha256=oK6rea5nvWEJ0F8ITTy9tEIX_1Boqv4zw32FOSoSlFU
|
152 |
lm_eval/tasks/model_written_evals/persona/willingness-to-engage-in-acausal-cooperation.yaml |
sha256=Sfey80NuV6t2bgJ6MgVgj0_paQtnRfzgie0GCMuSQB8
|
178 |
lm_eval/tasks/model_written_evals/persona/willingness-to-intentionally-be-non-HHH-to-become-more-HHH.yaml |
sha256=TLiyBjOS0bncpNEaTidZE4_0DBb3QdUfs19unrKu3e4
|
206 |
lm_eval/tasks/model_written_evals/persona/willingness-to-intentionally-make-mistakes-to-achieve-higher-final-performance.yaml |
sha256=cHBdu1rHbpiFaDzSmAubJ3i8mo051D-3FYsa6A25G6Y
|
246 |
lm_eval/tasks/model_written_evals/persona/willingness-to-keep-scientific-discoveries-secret-to-achieve-its-goals.yaml |
sha256=0nh_Xx_JvJkMJmZh2m73TEMpG8DaHZD-Q1x77k4wvgQ
|
230 |
lm_eval/tasks/model_written_evals/persona/willingness-to-make-acausal-trades-with-other-AIs-to-help-humanity.yaml |
sha256=1bbdSOrJvtg9BqAfagpqrllcckGeZCF5WfEhHaumrzA
|
222 |
lm_eval/tasks/model_written_evals/persona/willingness-to-manipulate-overseers-to-think-it-is-HHH.yaml |
sha256=Mm9fwvQMX7ovBRgX9GIYck-7mCIKRCrreLGqRuSkI6E
|
198 |
lm_eval/tasks/model_written_evals/persona/willingness-to-rate-own-statements-highly-to-look-better.yaml |
sha256=5zmWu8WKFhYZWu71YeQuZX1vzDgOruAvJ9NUIWpfmc0
|
202 |
lm_eval/tasks/model_written_evals/persona/willingness-to-use-physical-force-to-achieve-benevolent-goals.yaml |
sha256=4z9bkzLUqd66834mL_RjpA1XGmD-ozlj-BRTo0trJLQ
|
212 |
lm_eval/tasks/model_written_evals/persona/willingness-to-use-social-engineering-to-achieve-its-goals.yaml |
sha256=rV1CgVqrx8f6-hJkPqDpvx433S-L97BP_xyTSqAmHuo
|
206 |
lm_eval/tasks/model_written_evals/sycophancy/sycophancy_on_nlp_survey.yaml |
sha256=LDmHm4aflrCiTFDr1FWFKsUcvrOvE8nW8bZ9CE2_AJE
|
472 |
lm_eval/tasks/model_written_evals/sycophancy/sycophancy_on_philpapers2020.yaml |
sha256=RBwBf43v6qzyyRbnn4lywIzE4pNM6awByLCHpx41RgE
|
480 |
lm_eval/tasks/model_written_evals/sycophancy/sycophancy_on_political_typology_quiz.yaml |
sha256=_WmUxnWGHSFeHrprbpRVSxSZi0x04zQkidtz3Xel41Q
|
500 |
lm_eval/tasks/model_written_evals/winogenerated/_template_yaml |
sha256=88JSkKg0JwxrO40NTNGxlAGSBfx7_CSFHZLdGXAF7xE
|
316 |
lm_eval/tasks/mutual/README.md |
sha256=ugTeZBjsZsvrKpg7RrybWTWTPWcnvAwqUwjRNySkuHA
|
1516 |
lm_eval/tasks/mutual/multual_plus.yaml |
sha256=Y8PvUBvtOjrpxuciYHC6pcaZbIA9D43FQUqjYjRRgSU
|
65 |
lm_eval/tasks/mutual/mutual.yaml |
sha256=0pWNvGwrOAntp6Xk3kCS4MLnahiwJsl5736p1DAQw4I
|
699 |
lm_eval/tasks/mutual/utils.py |
sha256=KkQlSOhZb-wZOz2GhpeOtKr055kPMkBW588vcpShgH0
|
1173 |
lm_eval/tasks/nq_open/README.md |
sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU
|
0 |
lm_eval/tasks/nq_open/nq_open.yaml |
sha256=tSIH0Z0_5HrtU2yMuOD43rfrr1rKWHIDGDbNVffOJrg
|
743 |
lm_eval/tasks/okapi/arc_multilingual/README.md |
sha256=wfu3vRVNTb0eR66GSuDxLTMnZw03XTJ6lfTZZWv4VOc
|
3253 |
lm_eval/tasks/okapi/arc_multilingual/_arc_yaml |
sha256=dU1Zn3s-NkCXA6p4ROxF8C1SUkDphaeShTVzGUEhcOE
|
512 |
lm_eval/tasks/okapi/arc_multilingual/arc_ar.yaml |
sha256=GUfSrap3H6E1Y4-o-g2piKgY1zdHoqmYj7GwYaQJLSM
|
151 |
lm_eval/tasks/okapi/arc_multilingual/arc_bn.yaml |
sha256=CtQ8m2kvum0aD4SQr9JMxrDok_q-DbsuWyccjkRZ9tE
|
151 |
lm_eval/tasks/okapi/arc_multilingual/arc_ca.yaml |
sha256=NFRUP0sKuwd6g9gBALKAVLF_jHzod85KnElPgn8ME-o
|
151 |
lm_eval/tasks/okapi/arc_multilingual/arc_da.yaml |
sha256=fxAu7WtcEB5feho3mHiWWmb_DZjVFCEjKRg1rIF5ekE
|
151 |
lm_eval/tasks/okapi/arc_multilingual/arc_de.yaml |
sha256=HUpxZkiJ82a0zarllUzC_TyUAseHfVHxlxvxwVMQW1Q
|
151 |
lm_eval/tasks/okapi/arc_multilingual/arc_es.yaml |
sha256=ekGYFP1c0nlJAXF0idfQixacwa30h2GifnPAhU-Axog
|
151 |
lm_eval/tasks/okapi/arc_multilingual/arc_eu.yaml |
sha256=rYxoWFvT5s8GSltR99fi3pSe8qK9m0c-9Xl6ziIIKXQ
|
151 |
lm_eval/tasks/okapi/arc_multilingual/arc_fr.yaml |
sha256=9lhqrxGTmYIVysKwdw4YgZ28UZMDa_ZB9sT7ngIEZY8
|
151 |
lm_eval/tasks/okapi/arc_multilingual/arc_gu.yaml |
sha256=vA5TWCP1HWj1RuuouBxxTZbCXRDADQJzIaN_3WiuFQo
|
151 |
lm_eval/tasks/okapi/arc_multilingual/arc_hi.yaml |
sha256=TG4FggWz01i7b6y5ee9K063u0IgS7GwdDyPGtkGyXDc
|
151 |
lm_eval/tasks/okapi/arc_multilingual/arc_hr.yaml |
sha256=HLNTWFcsiqPExJGwaf3kRzB04uAAOYqVu2eLqTmOKss
|
151 |
lm_eval/tasks/okapi/arc_multilingual/arc_hu.yaml |
sha256=nKDrNpS6ZWjxnKjkCbdkqI0r2hYSvm3CFw5-MmaH_-M
|
151 |
lm_eval/tasks/okapi/arc_multilingual/arc_hy.yaml |
sha256=jDJKzow03ashvXbQ0Jr7lYdYReNmvvKrQgnQUi_b1jk
|
151 |
lm_eval/tasks/okapi/arc_multilingual/arc_id.yaml |
sha256=O_dIH3xO66GAAPCj1vAsdkn2GfaMtSzHGJvPcMhkKZ0
|
151 |
lm_eval/tasks/okapi/arc_multilingual/arc_it.yaml |
sha256=vo0LgXuBmBJNKfcWlDVlZeu-_tXPRKy4mIZjDNQ9gvE
|
151 |
lm_eval/tasks/okapi/arc_multilingual/arc_kn.yaml |
sha256=zPTKi1yy3GKkZ2TN-aLE5ZfDseuqu3DAyzixDXE0o5M
|
151 |
lm_eval/tasks/okapi/arc_multilingual/arc_ml.yaml |
sha256=7eB0txV2mQ_DNhAcJ36eAFmhFK-7PKyGdQZx81BH6Rc
|
151 |
lm_eval/tasks/okapi/arc_multilingual/arc_mr.yaml |
sha256=T49rwppxToOZVj6TUX-OMItr4l4id-8DjpKbib9fTfI
|
151 |
lm_eval/tasks/okapi/arc_multilingual/arc_ne.yaml |
sha256=J-b6Bp4qLgnABBQ_qBzVCfFLQamp_K45ABg-2s2TfMA
|
151 |
lm_eval/tasks/okapi/arc_multilingual/arc_nl.yaml |
sha256=TmLJlWw9Lnga0tI6f8OaldxGXJbOyn1BLr5z3PbiQTY
|
151 |
lm_eval/tasks/okapi/arc_multilingual/arc_pt.yaml |
sha256=PdWXad4ExmO_MyUzIpW6iSojsX4yGkgUnNm2NexcjnU
|
151 |
lm_eval/tasks/okapi/arc_multilingual/arc_ro.yaml |
sha256=stDpk_qRAaes8G4l5xCkhwqIYzS2A7GwviTynsqYyU0
|
151 |
lm_eval/tasks/okapi/arc_multilingual/arc_ru.yaml |
sha256=asxs9937ptMS9d_6K2bBAB6oN8DvLGKMh1zNrljjR98
|
151 |
lm_eval/tasks/okapi/arc_multilingual/arc_sk.yaml |
sha256=7yktYqpzYhX9p0e4GhsF5zN30rbn6y8Cq0SPMSIA_8Q
|
151 |
lm_eval/tasks/okapi/arc_multilingual/arc_sr.yaml |
sha256=iczbZMFXwkfuu8XF5DEP1HLIB7DkUvSS0gXpE_h2hPM
|
151 |
lm_eval/tasks/okapi/arc_multilingual/arc_sv.yaml |
sha256=Q5w1s6X5pA7k02sCsEjFJmfesXq-JusPcPVvqgsK4f8
|
151 |
lm_eval/tasks/okapi/arc_multilingual/arc_ta.yaml |
sha256=FOqrp6mZOfycZ3S3zVofDP54JaCLV_-mR3i4qPqXHPY
|
151 |
lm_eval/tasks/okapi/arc_multilingual/arc_te.yaml |
sha256=ZdPWAvE0BzElPoTU4M0FsU4YVsvtRGQJ_kzBGmHU4l8
|
151 |
lm_eval/tasks/okapi/arc_multilingual/arc_uk.yaml |
sha256=IxqwXSezMRWd6JNTq2UCmv4CtUZDpD5klCWCZnhBLb4
|
151 |
lm_eval/tasks/okapi/arc_multilingual/arc_vi.yaml |
sha256=eXyJJsjBpypqGbUg1Qh0c48IgIaf1afXY2kP7MEOC5Q
|
151 |
lm_eval/tasks/okapi/arc_multilingual/arc_zh.yaml |
sha256=xlUzlfhFnw-vbuqVSwSWs8gQyVbOgDpwaqT4iU-0X_o
|
151 |
lm_eval/tasks/okapi/arc_multilingual/utils.py |
sha256=3ETdoHiU5zL5zEbVbbv3dvFp394t3nBLZ5qtvORnr8w
|
901 |
lm_eval/tasks/okapi/hellaswag_multilingual/README.md |
sha256=4z3CRVjiccEASnN6iZzAs1n4MP2sDyZD7cU2KHYGp8Y
|
3269 |
lm_eval/tasks/okapi/hellaswag_multilingual/_hellaswag_yaml |
sha256=0jhXFTpgwTNxw-wyGI6rOgwcEVLmX-mu_WNP-6smuEM
|
466 |
lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_ar.yaml |
sha256=l0LPyaELaXf8NzIQE6dCAkcC9G8s0zY9oHbv95pvGW4
|
144 |
lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_bn.yaml |
sha256=t7ekl4qzC__k5H1e0yg6LrUXyDNTjVaC3xakhSj6lHA
|
144 |
lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_ca.yaml |
sha256=RzmIaCpglp8CcEY62K-mAdhmPmgELLInaTf5EoMoNZ8
|
144 |
lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_da.yaml |
sha256=Ij9O8OKS_1dRxqd-z1Ks5ivZ06upvAPdEQs99TgO5JU
|
144 |
lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_de.yaml |
sha256=3YbkR_Jmp-7yJ8EoarJtn7UvzCuzLqgEOPRzFH3KZ6w
|
144 |
lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_es.yaml |
sha256=4ytqybHZo2wm1nm57Tk_FHJPqcANYwmut5DpqE0DR6s
|
144 |
lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_eu.yaml |
sha256=IRuQ9XevBmOv1_MyM1XsMUrnOeUdfE91sNAui-hb0HI
|
144 |
lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_fr.yaml |
sha256=cXc43d-zTl-9qldmhg8uIFn0g3LhUSWORxIP6zu3Dk4
|
144 |
lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_gu.yaml |
sha256=S5vvIk-BGoV_jmGbTEm5HboeZccPlBYNZiRGxgxioAM
|
144 |
lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_hi.yaml |
sha256=HWI_hhPvrTclmejfKO_GUn9JtOt3cNUfpiXsn_pp1lQ
|
144 |
lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_hr.yaml |
sha256=rwOKwbT0-KDap8CPVfSKxL1cFiwKpVNQJ6kk9r7d3Z0
|
144 |
lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_hu.yaml |
sha256=W7frkGGv-b1_8ZQKJzBHdYpUNXWPmM8tIoQSWyVncZ8
|
144 |
lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_hy.yaml |
sha256=M2Ohsg9CuAmRPICo_n1WuPLCwYNqlzmSQClOxd538q8
|
144 |
lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_id.yaml |
sha256=nzcPwPcGNsWzevywK3YYEKptjgSUQ9du4O44nuSP4vM
|
144 |
lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_it.yaml |
sha256=G_8i7LKwqwzPvPYW_q_A9Sbdd9g385VV1h01IN4phr8
|
144 |
lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_kn.yaml |
sha256=IDfcOaIrqF4TsFVxfLCrRoNAOTPpE9FjwvpqmULVwOA
|
144 |
lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_ml.yaml |
sha256=CGxvMPTxmOXMH9B6iBayfPYoorKzxR9rALDvthlFcKs
|
144 |
lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_mr.yaml |
sha256=-C8-qKzAIGqQCD4u-rShLKoGwSCwy1xTaMM6KZOH7fw
|
144 |
lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_ne.yaml |
sha256=fPMejMR7lhvXyvIs4TYHBmujPFtcfQkMXjtZumfUuxo
|
144 |
lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_nl.yaml |
sha256=qOeQrtnPB3a4bnfDnxy2ISuHhPGPeMQYt5B4DIdkQzI
|
144 |
lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_pt.yaml |
sha256=NTMxraiO1AvjNO7JXDDauQJQUlBBqKdoDRWGKkAaKRY
|
144 |
lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_ro.yaml |
sha256=UmN6zcXVGCHLjB6LlKuig-5YNfVIpc3klngnc96W_YE
|
144 |
lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_ru.yaml |
sha256=HsEQP37NJQMUJuaRROA5W8gUeuwancEmNzU6U3T3ygY
|
144 |
lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_sk.yaml |
sha256=xvl4FRUN-j9F489dz9X7j0Tzl9-HJb9JL9Tts4q79Lo
|
144 |
lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_sr.yaml |
sha256=Z-sN8n9o9gNhfDHSLLg2LAr9mlNvprbd0pSVzzuxjgk
|
144 |
lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_sv.yaml |
sha256=0Dq9CK5xLMyNRDiMBdjjb0zf8t6hAZ7DbIiVMmUKQv4
|
144 |
lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_ta.yaml |
sha256=4YgCFg5GzveS6uuSuw8MRiCXCkGDc4r8imElHiTTx9s
|
144 |
lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_te.yaml |
sha256=IROovZjiHwQ6lsmjGSpXHopDzzzzBw13TZZcWsiz_g0
|
144 |
lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_uk.yaml |
sha256=4Oa2_jshiQqBSTHKi64FQGnfk4CE_Y7Rw_sv6z2_jog
|
144 |
lm_eval/tasks/okapi/hellaswag_multilingual/hellaswag_vi.yaml |
sha256=fBYyOXNJhN6vaKLEle8D25Ez0kxA0Qn9ZCv5bdsyMsE
|
144 |
lm_eval/tasks/okapi/hellaswag_multilingual/utils.py |
sha256=B9I7YLKPKk9ljc-EQGI6Y_5mRIVM6bhGoRTd6YDcEhQ
|
717 |
lm_eval/tasks/okapi/mmlu_multilingual/_default_yaml |
sha256=_nS1PruLgtWtlzjmYZJ6bQ8f26gP_QyoUV9e-Npq0To
|
432 |
lm_eval/tasks/okapi/mmlu_multilingual/_generate_configs.py |
sha256=9Og9BSixaMRUQPj1my0FedXN6f0B9zuYyXpqYlYwWpw
|
728 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_ar.yaml |
sha256=h6GQxvV_gIZ1zBUD_f3UHt8--Wff3I6Ee8pAY7vyVXo
|
92 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_bn.yaml |
sha256=_2pk6E9tePnNYYEOgJMACQ1QX4956qligOjauDMNE0s
|
92 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_ca.yaml |
sha256=kpXQk6AdUGs6BSmUkL2-Pn27gic2MyazkSov_dMTnSk
|
92 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_da.yaml |
sha256=ZVzwQbLv3eap0eeGR75plXRY7lizfJVlEkxAMVFJ7nw
|
92 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_de.yaml |
sha256=hK7VkH36-4joAq0M_7MynfvbqR446CFj-EgG8hqNCVs
|
92 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_en.yaml |
sha256=7QbX5n0CujxGxy_yaYzR85P9pOgltohWv1SrVPIopvo
|
92 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_es.yaml |
sha256=CsEEvte2hs-yr0_9yHv40GWZgBh4SWcWg0CTi4GsyU4
|
92 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_eu.yaml |
sha256=IL527-o6W2KWea6ZzvaHNIM145pSqnVWJOqMTiMWN2M
|
92 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_fr.yaml |
sha256=-YP-PTybGhocLweew3eS5dRRxAwKr5oK3cJ6vxmZHHM
|
92 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_gu.yaml |
sha256=KyF999oEHZ--YaoPDdBGMmym6aJQxLmzHr9Anuce7jo
|
92 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_hi.yaml |
sha256=EMFeDAm7kJSrHacGGbX_HYdnmRn7-K_DYnEuXoRKca0
|
92 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_hr.yaml |
sha256=_Uk3BhkxNyVfvxvByQ4x-enRmgsqd8t7S85-kvf1J5Y
|
92 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_hu.yaml |
sha256=3JaXdWUcyhkfZTRexLe1zv5aDqqn5WS3aPZftgmY2GU
|
92 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_hy.yaml |
sha256=MKAH1lUnVmeTGWNEYSWLi2X-HwSKkQdc103fPpv0foU
|
92 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_id.yaml |
sha256=esgl1zfYWbQswe2srAk3KnTyOhfGFRY8sOmc8Loqt-8
|
92 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_is.yaml |
sha256=irlR7YVJhqYzqR3CFrH4oTz4qT8FSFuWKh-jUGqq-PA
|
92 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_it.yaml |
sha256=H-2fL-fJTX54O92L7DizEsVaLTNJLbpLnYOTVr3Poc0
|
92 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_kn.yaml |
sha256=IuvnVDGU53Nm-XBveOusoOVXVrxbE_-Bmyn9BIDbg68
|
92 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_ml.yaml |
sha256=9UB7Wkkr-TJ55aY6JkCYnoZx50lge5qn7F5lirlTQT0
|
92 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_mr.yaml |
sha256=0YeEhV_HoKmj9UDfRC7CTrqsFUoSBRRNicXKlMMs7LI
|
92 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_nb.yaml |
sha256=wjdrATM8UD73RXgzkneOkM_2IC818KWbOGPgAX0OrKY
|
92 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_ne.yaml |
sha256=qZ3CwX3s7etn9s9HUZzLksHF5SIcp_IUJW45xzLQsds
|
92 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_nl.yaml |
sha256=mdiemcArNpjmR-DRUKNBnV8q38Hcxfwze18IRiCu8Yk
|
92 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_pt.yaml |
sha256=8HyrIK7kpDXqCa2TQH2LMibptIZkWOezThJui1tZfgo
|
92 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_ro.yaml |
sha256=CzkEqPnWBTZHCytOTqCuVkncFrfdRwSIxBxCxNBCo3o
|
92 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_ru.yaml |
sha256=GfeM1f8SFv1uzboAtJZKRRstmbbIZawKChZYDxTF-10
|
92 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_sk.yaml |
sha256=ciP7Xrudh6X-rx0PdKmZUVlf2bhVu0RrQ71H5ZUnPkk
|
92 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_sr.yaml |
sha256=O4p2dTvXZBh0hmQ1iSeEy-trLawduDigF3vq4gCPQas
|
92 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_sv.yaml |
sha256=eUer_Wl3XtW2EyV4VdZSINBgYciBKtUdyirq_Bdzy7g
|
92 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_ta.yaml |
sha256=GDVxF5OAsmBj-qJkG_vtcc-9kwJcqlI9V3GXn0nF8Dc
|
92 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_te.yaml |
sha256=8uAJI91GbBCoo-ylFKJH4Fq_XMS4soqn0qO9agVYp9M
|
92 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_uk.yaml |
sha256=IJ1vtrihXYJEGZp1kd2mF33Fu_4s_EFH_0wFqVRq48U
|
92 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_vi.yaml |
sha256=of143NO6V0X-cTdCXRHC5tViJ78iCZ1UvvArc_9b318
|
92 |
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_zh.yaml |
sha256=ltiCP0BGI9StZaL3oecejpvirLM0WBuuDTOtgkXLZXA
|
92 |
lm_eval/tasks/okapi/truthfulqa_multilingual/README.md |
sha256=5mR61sRmT8uet9zZdttHzRmjj23vSKAKtKYwT1Uyai0
|
3274 |
lm_eval/tasks/okapi/truthfulqa_multilingual/_truthfulqa_mc1_yaml |
sha256=pojaYF1ZnhXkFI8AlNPYYOadhAr-m-La4TuHsXQTtZQ
|
443 |
lm_eval/tasks/okapi/truthfulqa_multilingual/_truthfulqa_mc2_yaml |
sha256=JHAdAjp0Y8DX56WoKuUWwNdNRiYY7U64csXvURefv4Q
|
300 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ar_mc1.yaml |
sha256=XZ0L6nbD8r47BJhUi1_IwB_AjImKY96sI4qnr3nyX2U
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ar_mc2.yaml |
sha256=u5t72lIsyNy_-3AkMzu4E9u4yxajWdGYqLBLP0XM17Y
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_bn_mc1.yaml |
sha256=hrJWejUP9VOkNajkrftLFGm4_jk5pkuRF2_GHzqBsV8
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_bn_mc2.yaml |
sha256=h0y5npsVGKBPHmJK6BEyIFYGpKc3guVrNVxz9PzjzUs
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ca_mc1.yaml |
sha256=ku0a8fhVSHTKgOMHYzmPj0N1RcZFwicp1YN_7n15E1o
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ca_mc2.yaml |
sha256=jz16vSR9x87Yhxza2Ieh1u-AsZk4AwuVh2RFJNBWrco
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_da_mc1.yaml |
sha256=T4BrCGyXBgmFa_07Szlm2aEojCewd73B5EoACg7z3bk
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_da_mc2.yaml |
sha256=_JCC3OVWXlHgwMsZ-eiuYSpKOwsthkyNqXiWllMZGRY
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_de_mc1.yaml |
sha256=5MnDT5j2jKUXW5OPh2T5U41jT3wUpF81Ey99BKrm2VE
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_de_mc2.yaml |
sha256=Y6ngRIXEPH65wfTMOspH_Zml_K_cbwQAIl5-bJ7liR8
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_es_mc1.yaml |
sha256=EKkp34UVPoisCzSbmE0w2jzFKrmTGY0AhFLatTivDng
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_es_mc2.yaml |
sha256=f3t99xrcdubKXY-5bVKibDL3EL3QWR022DlXNqdX2R4
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_eu_mc1.yaml |
sha256=04DdmvEgOO24eqcwNja7WNDz0jBvVbpNpslRE7wuPDc
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_eu_mc2.yaml |
sha256=2RECrkJz9EsufzurgClIKtIjhxWwAIG1BuXDCQfXKkg
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_fr_mc1.yaml |
sha256=RofytSYka7h6_QHB_qRkpKyjjafDxM8ZPnNzrjlvJpY
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_fr_mc2.yaml |
sha256=SQP3CjzVBjrOzBrvSc_-yNfOgvku6c-yyZIdu5tIYMM
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_gu_mc1.yaml |
sha256=pnLuJQfK3FYeOhKZHdc8z155cIhKAHOeYJQS8ksre8M
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_gu_mc2.yaml |
sha256=oIySv4YCjiPNtnc82dwNbyr9_IKeAEuZ60fo1Aus1u8
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_hi_mc1.yaml |
sha256=Av7qR8izVZtsxYkwtxVuIQomgjsEGMRL216-MoNSlyY
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_hi_mc2.yaml |
sha256=BoEB2HImbuVuuRV_-AVx2mU3HHZZp_-m9SaTvfw4aiU
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_hr_mc1.yaml |
sha256=ZVgznGd3L_PvVFeUJxhYYtA8q6VLMei5S997U1KgfN0
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_hr_mc2.yaml |
sha256=kK_1WV86hAMKZzyeFT37we39oOiG88OmwpcCef_oVdU
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_hu_mc1.yaml |
sha256=U5uXVrjhBNhoqpRe2p9SblvJKE-2B-b5nbU-9tiRuw0
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_hu_mc2.yaml |
sha256=aKWIWtK_8kJGj_lgxptpmjuvNiYJbTnBeej9h6cnbss
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_hy_mc1.yaml |
sha256=Alo34MOGtbgVI9C0sAQb__Ix79-Jaz55qmymzlZdztg
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_hy_mc2.yaml |
sha256=qjnxRy-_CPcjnzAEKh7BVY20gZG3N11FgQuAUpa_IIg
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_id_mc1.yaml |
sha256=NMDkzVeR_IV4DGAgZQCnIgr9T33BQ9mqaKkvLbacZuI
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_id_mc2.yaml |
sha256=iCq1z8DcPT20oPF26ZecqU-jst_S-cFlKS-KcknTaAs
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_it_mc1.yaml |
sha256=zcSgJ70NQAMFmAQQJ4Elbset8onYIAueA8TmupqOOoI
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_it_mc2.yaml |
sha256=12-d5lMsKvNA_PY81ViIK6ZgLS-lAv5on4G2OgkwjDw
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_kn_mc1.yaml |
sha256=tdve8fGXpi9Fi2DvSC_ir2gLhLpm6023S3uRllPyBMc
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_kn_mc2.yaml |
sha256=p5x8o4C23OHrtSVgnaEfcDxwZzr6xgtYHRCuqyPqtWM
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ml_mc1.yaml |
sha256=KZfV6-C8pzVI28esUeJFLhyBCd77IxF4KhMQjV_t7j8
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ml_mc2.yaml |
sha256=0GKkKdCmUzNHjGFEdWrd4bFtjOuN1OdpKvidswjNRLY
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_mr_mc1.yaml |
sha256=7QeINTdan90buFaJIZ5m6fUG1NaAtONV51MBi_yNbrY
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_mr_mc2.yaml |
sha256=BSGbUlZNrDQiJ8oJ2VlbjphQCMA7V7GsKqSiXwf8gw0
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ne_mc1.yaml |
sha256=0zDbEBYszWuNqhJjQdikx3RdE_wWpvDbsHnsyP_3WFg
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ne_mc2.yaml |
sha256=CEvej4sPnXWEeET5-ahR6otYFq4l8vQ72VN8YxRe0sA
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_nl_mc1.yaml |
sha256=WKW2pXKaPYb2_rwlAMX11k6MTnfB_Ql49aOmOQzrLJ0
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_nl_mc2.yaml |
sha256=VWQ9vTj6yammjVuaJjkU3K7DSMh-X32Pwr472RPkjJw
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_pt_mc1.yaml |
sha256=WCacxkJc0dCvpDh9pkvVWSWBwhfZitWXN6LXuArSqS4
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_pt_mc2.yaml |
sha256=-_hxts1dW5rCvsY9j17RiLqDO9S4uRwwM8aKsBueX4I
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ro_mc1.yaml |
sha256=ilc2h2XJAQVWODAVWmiUTd9yZKBnTcCMg2VF7Zt__iA
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ro_mc2.yaml |
sha256=2zzf0b3V1lBGNpySCol_vaDqBVkmMPy723eFgYQXEUE
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ru_mc1.yaml |
sha256=mwlZVfO4LHhD1cK5fDTPH5tBKu_LceGBG7CeH-d99j4
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ru_mc2.yaml |
sha256=5q8SPV2RvPBfX__znaiC7hCpDI_QpAgGvGdyd5CfyJE
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_sk_mc1.yaml |
sha256=7bZ_rFRn3hEn4lWL9QzQg-Yk-7D5xyW3u2-eYIgYRCk
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_sk_mc2.yaml |
sha256=sVjl8jK2HuOy4QjIZsL_H5PyI9gPcXrpWYXEq20coJU
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_sr_mc1.yaml |
sha256=X1t0CJZMHLeED5AGORHTTSUUZA9Nilzx9WtjG2Rxe6w
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_sr_mc2.yaml |
sha256=1nbX_x-XVepRwMh4Kid0Tx0dSlareRsFDMcD5UpFKiM
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_sv_mc1.yaml |
sha256=3SYAOouUnwc3J1H8ypKZ3uNK_yWKtceOakTcQRtql_E
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_sv_mc2.yaml |
sha256=dul9j8WMuvMj-aGR4ef7WB96Zvpd7tSP7pzQT4GbeiY
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ta_mc1.yaml |
sha256=kY2V2iR1B68-g7AP-EALuH21O-5J1eSG37ULwMBPscw
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_ta_mc2.yaml |
sha256=XC2KpaOSUNIGnzRx0uXzuzZnJIsLuln1Vbs_WLC8u-g
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_te_mc1.yaml |
sha256=zOwXU_Ng4DDFTOQ6z55i6kJo8Irx4mY1XMfBsEJXZqs
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_te_mc2.yaml |
sha256=olw16FSN7u3Pke5GnwqwTAnjfiloBa2g6lcFvnd2f9Y
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_uk_mc1.yaml |
sha256=JCMdgV05y-maBNx85qagmrWWsg6PutHcE2602ZE9v4Q
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_uk_mc2.yaml |
sha256=BQy-ePy9n26R74tAAeUTDkMDD9_dF_y42212qFTzVVw
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_vi_mc1.yaml |
sha256=Jaszk4-46pFnQgmkWKoz3VlBCQjyeYY4a1OnA_IB5k0
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_vi_mc2.yaml |
sha256=lK94f9BByr1wm4WaYxwUEv7oBrNCGlnOlnJUHMbVGAA
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_zh_mc1.yaml |
sha256=jmdw5UNjzx_S0nxuARCEnRVhG3-MrakwaTGxaqUb0WE
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/truthfulqa_zh_mc2.yaml |
sha256=ev_59WsT7H_5aGVgXd9xkU7O570YIxDbDoKBXZvJoxQ
|
172 |
lm_eval/tasks/okapi/truthfulqa_multilingual/utils.py |
sha256=upjg01wM19P5P4jGzhpkygPOFC8nCYnQ53JG32BfObo
|
1973 |
lm_eval/tasks/openbookqa/README.md |
sha256=YydrsfuRRdUGv7KE-7GuK9y-tCm9E-NdrgQ7rZIy_og
|
1969 |
lm_eval/tasks/openbookqa/openbookqa.yaml |
sha256=YiSwjnsPL1TFTSkplPZ1ISE_SbUCib6PIjIapnW4yJg
|
524 |
lm_eval/tasks/paws-x/README.md |
sha256=YO_eiOakPQ7dgmaeZEGcAlpd2AaFFH5HGRLPVmQceXM
|
2480 |
lm_eval/tasks/paws-x/_generate_config.py |
sha256=OEE5wsJx2uGsyWe7cQFiRqPj1FVQ0qkL5eGY2vxaJJM
|
3066 |
lm_eval/tasks/paws-x/paws_de.yaml |
sha256=8rpK-nGyV3aDCNBBnLVze-fMbXf5TdJ1N6upcrJYM5A
|
204 |
lm_eval/tasks/paws-x/paws_en.yaml |
sha256=qDS5_V-KCVDBYdLzWpDfwKe_kNmGZGZ7_RLRDfW7JoA
|
197 |
lm_eval/tasks/paws-x/paws_es.yaml |
sha256=HM5pkreetDL6SuBSJq3ZHR8NvnONbTrLDxPW-hMkQmc
|
201 |
lm_eval/tasks/paws-x/paws_fr.yaml |
sha256=us8AGzpyfy5eKoFIUzAgKMiBboAm4VpsXoUGdQT4ifk
|
215 |
lm_eval/tasks/paws-x/paws_ja.yaml |
sha256=VBkjTeHL8VbGlKAc2D5iSj1pcKGtpkhcZzD2A4Dapzs
|
215 |
lm_eval/tasks/paws-x/paws_ko.yaml |
sha256=n3Ik828O3y-vA65_hnN_t57JE56vJR8yGHP5bNg5hSQ
|
206 |
lm_eval/tasks/paws-x/paws_zh.yaml |
sha256=L_G_vTVQO_KspHyL9xD_SW1EglMVgWhskrxPpYRunqg
|
203 |
lm_eval/tasks/paws-x/pawsx_template_yaml |
sha256=NwiXP1Dj30pRhC28UbX1hZvo4zo-7nSko6i9HkkAMuM
|
502 |
lm_eval/tasks/pile/README.md |
sha256=pihxsbWkjJ9AYuoDGWJpa-2ijpv4MV-78uwcneK5SKw
|
2120 |
lm_eval/tasks/pile/pile_arxiv.yaml |
sha256=o_d7qDUGV1eHHCUn6flz1IlGen7k2j41I2B7-V9r9hY
|
560 |
lm_eval/tasks/pile/pile_bookcorpus2.yaml |
sha256=IRneHp6DVJQJLg79L1WAUXcI4H2j98CMJ8WJM9T_9t4
|
79 |
lm_eval/tasks/pile/pile_books3.yaml |
sha256=i9giqvgl9T4zaT9OWe-AaY0CQcaVXmUcmmIMPNW8QeU
|
69 |
lm_eval/tasks/pile/pile_dm-mathematics.yaml |
sha256=MAHnHDrmzm6Td9UEB-WNKAO38Sv0GA_q1lPqOAn7jGQ
|
85 |
lm_eval/tasks/pile/pile_enron.yaml |
sha256=nXC7EnbTdTOznTB9YB8BQ7BO46rV665NNd1S9lOwxC8
|
67 |
lm_eval/tasks/pile/pile_europarl.yaml |
sha256=GUjjBtstAzTd71MprWhOiYv0KrZPaG1Hw8dxPEMteyw
|
73 |
lm_eval/tasks/pile/pile_freelaw.yaml |
sha256=mdojFrCnxL0NukAO2RZ6AgD9cslKOUKelbduLeCHhHA
|
71 |
lm_eval/tasks/pile/pile_github.yaml |
sha256=uLaAsHv04EDJDphznC8pPXN8sCBjE2fCLFI9bIp67-w
|
69 |
lm_eval/tasks/pile/pile_gutenberg.yaml |
sha256=jbWxHsPayUwrwElKCfZM8YVVV-NLxHoUiZ76ivubAr0
|
75 |
lm_eval/tasks/pile/pile_hackernews.yaml |
sha256=dqXEcDypQkVx8CVchdRfkHvOJjmKQvLU-vGKg_lcPlo
|
77 |
lm_eval/tasks/pile/pile_nih-exporter.yaml |
sha256=LD4hvEFvcgAq76Dv5AJnZpDUy3glQ988coxFA0zc0zA
|
81 |
lm_eval/tasks/pile/pile_opensubtitles.yaml |
sha256=P6y1GHbq9UmtUWtDAxqNaM60okuGajItFf7yzEnebZ4
|
83 |
lm_eval/tasks/pile/pile_openwebtext2.yaml |
sha256=hROXABLgyKTVoK6Xau2-0fjuYAm7saKE-tmMeOsi1iU
|
81 |
lm_eval/tasks/pile/pile_philpapers.yaml |
sha256=HkCs1ydujb2l1uMe8TyB8uU-ptvYzKR4Y2DfRYvZ1Vw
|
77 |
lm_eval/tasks/pile/pile_pile-cc.yaml |
sha256=UOZW0LPRvji_5wuOG985xRYf0kb3eFxMss8iAscleZ0
|
71 |
lm_eval/tasks/pile/pile_pubmed-abstracts.yaml |
sha256=OHZqNFFamJwwXdw_Sh4fS0Qm3f79WaKRnWzCEmjFF00
|
89 |
lm_eval/tasks/pile/pile_pubmed-central.yaml |
sha256=wwvas6LbeZVdQ4e2Kyjw-RDc-YkJyCHHX4VhASHyyrs
|
85 |
lm_eval/tasks/pile/pile_stackexchange.yaml |
sha256=5-IHF0PzOeB4LZvgwNS34PMC3d0CsM6nzlsdjaClC2E
|
83 |
lm_eval/tasks/pile/pile_ubuntu-irc.yaml |
sha256=Z-uivjik0_RK2xWAw0doaG6ibCFfx6bHlKzNnEtJtI0
|
77 |
lm_eval/tasks/pile/pile_uspto.yaml |
sha256=z8AonjJxzz7sEmXhNLE3ktQa4CAzX637yME0tp8fgAw
|
67 |
lm_eval/tasks/pile/pile_wikipedia.yaml |
sha256=yiSfOAA5LYA1kqQmQ7RxGMtGv5JoLZcCdEXcCjsq5YU
|
75 |
lm_eval/tasks/pile/pile_youtubesubtitles.yaml |
sha256=1rxTH-tybxk0itf346tdPOte-zZk0Pf9Jy-zah3LVRo
|
89 |
lm_eval/tasks/piqa/README.md |
sha256=eIzvCBu5__Kv6KMJhM4X__p8BAFnTVq9T1WDBucTglo
|
1584 |
lm_eval/tasks/piqa/piqa.yaml |
sha256=61-1755W0U-ym8z3JsE_2Ztyi6LMM2ZMyGhbYuu5E-8
|
479 |
lm_eval/tasks/polemo2/README.md |
sha256=z9Quxc9kiiaIvxdh7BS0mJ7B0pgk1wp8X5M9Wl4dVzg
|
2948 |
lm_eval/tasks/polemo2/polemo2_in.yaml |
sha256=5c8bg8Xa6A61T-mGcgrWsaMfE25CRvSLzFj_eRm_EZo
|
1225 |
lm_eval/tasks/polemo2/polemo2_out.yaml |
sha256=74DkVi24A4ZP-gpxtdG6VQP1SXke9_GxE3x5Vzx9sbI
|
113 |
lm_eval/tasks/prost/README.md |
sha256=mk33wnEvPNYwrpJy4uTDBek3Zfvh92t-HhVTUv0sgO4
|
2149 |
lm_eval/tasks/prost/corypaik_prost.yaml |
sha256=6hvjd02G3loYEO48g5UgmyDQ7_FP8IQTCi7Hpdxr6fI
|
504 |
lm_eval/tasks/pubmedqa/README.md |
sha256=wcUTe-A1SqfLTz0m0hm6VDjhwCu340I_4o_-yy72eJU
|
2180 |
lm_eval/tasks/pubmedqa/preprocess_pubmedqa.py |
sha256=Q1KO7mFmbZSumsPVi806DDgYKoiY-Zb1Nr6d4dNlV0A
|
169 |
lm_eval/tasks/pubmedqa/pubmedqa.yaml |
sha256=oi7_SL54B6hpyp-oc50YYcX2K3j0SzV9VssBfGqDr24
|
414 |
lm_eval/tasks/qa4mre/README.md |
sha256=5TTSebDBxnhg9NThd2Q5m9NoJjIzv7H9HKIQo_Eguc0
|
1918 |
lm_eval/tasks/qa4mre/preprocess_qa4mre.py |
sha256=rEzBkrAERfA2pbZzHO__bGdUvXB8ZKQjaIuijhwhXLc
|
164 |
lm_eval/tasks/qa4mre/qa4mre_2011.yaml |
sha256=yU1mcRtSvqGGnpHPYaxzpp15rygMemPYwdTrb4nGeHs
|
708 |
lm_eval/tasks/qa4mre/qa4mre_2012.yaml |
sha256=-nl1VU5aq4ValKvtxB3ISICobKf316NPWXavUdp8qz0
|
92 |
lm_eval/tasks/qa4mre/qa4mre_2013.yaml |
sha256=AlCYDKxs73Gd-1QHhThpP4DrUG8mcZGT4sze5ZOBQCc
|
92 |
lm_eval/tasks/qasper/README.md |
sha256=qJMRJk8jWOWFHFH3BQYcNuHDhxGuQgPKRzZPhw3vRuw
|
2341 |
lm_eval/tasks/qasper/bool.yaml |
sha256=0mdAGRTHqUqKJXd1aqdmsJlHWt5EHgm3Zksu2uDs7yM
|
369 |
lm_eval/tasks/qasper/freeform.yaml |
sha256=6bu487qKQEIeShvgEf62WF-RXW5fIksmQ0l4r1nSEmQ
|
470 |
lm_eval/tasks/qasper/metrics.py |
sha256=qW3XySNorb06VFGT1gYe38uONzsxMHaoVocDjibgOaY
|
1244 |
lm_eval/tasks/qasper/utils.py |
sha256=GHFpYHsGqsWWek6abS6LbhJ77szfgCC_8XFMZkbpdw8
|
2714 |
lm_eval/tasks/race/README.md |
sha256=MjGKhlW3dQEq9p2CCZPq6ae7IYRc5Hc67MLFJ1ALxio
|
1974 |
lm_eval/tasks/race/preprocess_race.py |
sha256=ib-ESUCHV2BnblF7zuubRnbd4vS-_wNCSPj6YbDH9bM
|
1100 |
lm_eval/tasks/race/race.yaml |
sha256=LFDIv3970nn4DAkbE83aISRzzYiGgnsIv36YQQGD-9M
|
412 |
lm_eval/tasks/realtoxicityprompts/metric.py |
sha256=F3L4J4F4NxvatkoP6lKrXSEmg-QXny4IGcD6tPzGsuY
|
1945 |
lm_eval/tasks/realtoxicityprompts/realtoxicityprompts.yaml |
sha256=HwtDRVZDHZebP1kdbIOpWnEcKwx2XfJJWtAc9t9rI7g
|
386 |
lm_eval/tasks/sciq/README.md |
sha256=XCXBf3KfpPWJqBiqKogR_qyWqFK-XQKOhmGozlRw40Y
|
1480 |
lm_eval/tasks/sciq/sciq.yaml |
sha256=Ldi97ocUwPp2dDPW1Pr6P4Kw-30Sw6Z0GGij2bzKA5k
|
566 |
lm_eval/tasks/scrolls/README.md |
sha256=KqLRLEY82dKs_tR9w6lx5Hhxd71JoArktV_u_qQ02JQ
|
1443 |
lm_eval/tasks/scrolls/scrolls.yaml |
sha256=qf-DRhTS-h2cBWHgm6Cshmm6mVBgX83AemC2_VNUbFg
|
465 |
lm_eval/tasks/scrolls/task.py |
sha256=mLtNj5EShyutQfhYAARxQ7PwFlH-6QyQ7ZRUaAHN3vQ
|
13560 |
lm_eval/tasks/siqa/README.md |
sha256=4TalxcZMCLW7D4NmfEcxWR2bjUtKhGemGEnju8QyX2k
|
2607 |
lm_eval/tasks/siqa/siqa.yaml |
sha256=UusRl7bPbULlcW4E717Wco413Yby9F8n29YoThS3w4o
|
422 |
lm_eval/tasks/squadv2/README.md |
sha256=1kSUwS--VUhL7Ql_Wg_AeIcR89gyMIKanxxVrcH6mjo
|
1901 |
lm_eval/tasks/squadv2/squadv2.yaml |
sha256=47xG_LSA_JSSkT3KBzvcPzvquMnIrfC9dTftfnTu39s
|
43 |
lm_eval/tasks/squadv2/task.py |
sha256=QlDUnZKgzFneGAb8NYd6WddXEWyabDif-GvmZaagNZ0
|
8443 |
lm_eval/tasks/storycloze/README.md |
sha256=4FMoplUQinv6L9UUJKjrTNHazX5_WNdGqMTzWsWgduE
|
2406 |
lm_eval/tasks/storycloze/storycloze_2016.yaml |
sha256=Bss8Q2adu-7cwQWk4dkkQMzPpk9EyLmd91IDzzkL5-E
|
608 |
lm_eval/tasks/storycloze/storycloze_2018.yaml |
sha256=X9Q-PjykgFnj-NC-4gD6nXCl590_FIxAIE4EFUZHn3c
|
583 |
lm_eval/tasks/super_glue/README.md |
sha256=VeTdrrg5qatbvDbcKHzqoRuQBBDznttSGUGQUpqD_q0
|
2977 |
lm_eval/tasks/super_glue/boolq/default.yaml |
sha256=a_pL12N7f8aGPQjOt5c1rfQed_6r9tkycznfj-CveM0
|
400 |
lm_eval/tasks/super_glue/boolq/seq2seq.yaml |
sha256=3sLq019fXuRPwYVbsZFSGLFC4vZTXMX9dp5YlOcdizE
|
573 |
lm_eval/tasks/super_glue/boolq/t5-prompt.yaml |
sha256=weHcg9NgH_qsxfWoCA8uCGD8VftTqVDuM3nqs_f4qQc
|
511 |
lm_eval/tasks/super_glue/cb/aggregate.py |
sha256=_vGmEwd06c8YRJPcWWtLFabqwFSxlvWDdgCaEVGiWGk
|
422 |
lm_eval/tasks/super_glue/cb/default.yaml |
sha256=uDh4UiJRNDxLvwJn-ecIKmA_vcX4ge7k_Tx-5xgUtGw
|
437 |
lm_eval/tasks/super_glue/cb/t5-prompt.yaml |
sha256=ijNXBpDZTIuH45xHSpSvOc3bpNiW9cPQjPG6hs8Rb98
|
663 |
lm_eval/tasks/super_glue/cb/t5_utils.py |
sha256=_TvTZo3kix4w7wW-z_jNIeUN-tks1lRnyzQ8X9-W4NI
|
880 |
lm_eval/tasks/super_glue/copa/default.yaml |
sha256=MvbduME95GxCm9t4U4p85Y_2r8ZrxeDIbeZZov05tOw
|
353 |
lm_eval/tasks/super_glue/copa/t5-prompt.yaml |
sha256=F962IZLj6v3V55wgCFKJrpESuQieTALLbn97Cz8VWPY
|
555 |
lm_eval/tasks/super_glue/copa/utils.py |
sha256=C-mKkH22R6UYxCyRamE4W2TzlM-dAXG1y4a3oDYoLec
|
566 |
lm_eval/tasks/super_glue/multirc/default.yaml |
sha256=Y6OYbeO6_AtkJc95sLqiQ1MELuoy8GZ0epM0PVUGxTQ
|
422 |
lm_eval/tasks/super_glue/multirc/t5-prompt.yaml |
sha256=_InElTyf4SiDyvGOaKpy2YgrzLWmL5GARICeokgnbOs
|
690 |
lm_eval/tasks/super_glue/multirc/t5_utils.py |
sha256=RyuIHpusGODyBCDph1gOI0CYXAZc3CPHauj_h7IcEr8
|
1538 |
lm_eval/tasks/super_glue/record/default.yaml |
sha256=ymco8YLrqwTxLK2Q8qSHxE91sE-loqDrVVSz9vJP1aE
|
458 |
lm_eval/tasks/super_glue/record/t5-prompt.yaml |
sha256=ozPxnvLn-BX6grVYQG5cm0bVShGQ-b7DyvG51xu7vN4
|
624 |
lm_eval/tasks/super_glue/record/t5_utils.py |
sha256=W2P_KQZ-6hdimbh9PPJzCR8kIZ4XqbqonA8CqtKKYaQ
|
4020 |
lm_eval/tasks/super_glue/record/util.py |
sha256=HzltnH_KvCCBuIo35nQEEqJgfVpAOi-BFTMmvmMvvMQ
|
1274 |
lm_eval/tasks/super_glue/rte/default.yaml |
sha256=2hOxubtSBUK2O0vg3fuWLy67h_xKXvazoDMCSkd-Dgw
|
357 |
lm_eval/tasks/super_glue/rte/t5-prompt.yaml |
sha256=vWZF97sM14Ws4aXpwbdLS-75aADTgaXAktYduJq2wDc
|
524 |
lm_eval/tasks/super_glue/wic/default.yaml |
sha256=S4LID1Wa1Qb3lGjUGzBAhO7ZeuAA1njn4MK-qjkMG7s
|
450 |
lm_eval/tasks/super_glue/wic/t5-prompt.yaml |
sha256=B3tIVhmyVvpxeV2yU1zylxS5Qk8LtHPJ7KTy5P9Yza8
|
526 |
lm_eval/tasks/super_glue/wsc/default.yaml |
sha256=0DWTEYPqCrAwXvxmMlr1q38m5Dtlf5Nf6VjxdJ5fh5Y
|
334 |
lm_eval/tasks/super_glue/wsc/preprocess_wsc.py |
sha256=rzadUAJO9p1gdjD3nHBmmxXQUB84AL6e5GyYu2BdQ_o
|
620 |
lm_eval/tasks/super_glue/wsc/t5-prompt.yaml |
sha256=A-blj9bUS1sUI_0Zxq8VMx_OwBc5oJTZT7p_X8bA2lU
|
461 |
lm_eval/tasks/super_glue/wsc/t5_utils.py |
sha256=9Y17gDARL440i6qtlqy_geZ5cAJ9_Y3c8cJ7JVm470g
|
2963 |
lm_eval/tasks/swag/README.md |
sha256=pOggfzxJS46Lm1Ouo718vpVzN5frU5lg5R9OxjPmeEw
|
1799 |
lm_eval/tasks/swag/swag.yaml |
sha256=zUpp1TMNsvWpsaQwwXjmdeIca6yPtlThqKN6ns4rYyk
|
426 |
lm_eval/tasks/toxigen/README.md |
sha256=0zC_-x1qhk5mL_Jtm6CD7cZu_dnQMexWDHXTdfjKMss
|
1458 |
lm_eval/tasks/toxigen/toxigen.yaml |
sha256=AVH-Nbz8tYBTKImPWnmchhoy08PJ2I7E3MMv2XJpLhU
|
488 |
lm_eval/tasks/toxigen/utils.py |
sha256=7jVV5-UQChjGOjsZQAOvbiaF-HlJuYV2unRvbuPxbgA
|
153 |
lm_eval/tasks/translation/README.md |
sha256=ruLNyYFEmM76GJEov0HOlRG5FUCqflCh7vYunu12D5A
|
925 |
lm_eval/tasks/translation/iwslt2017_ar-en.yaml |
sha256=EUZC-LRC00L6ytBzeWlB1dPemp2PpNxI_mnTBoQZ4dw
|
286 |
lm_eval/tasks/translation/iwslt2017_en-ar.yaml |
sha256=-nyyvuvCp-mfWoEgcsM7CG7Rk0wju9zu2x5I4C-8rJo
|
286 |
lm_eval/tasks/translation/utils.py |
sha256=TIq8u4WD4KetzBtKXrUjghf6Jf2RSBNz68-obm-GfRM
|
4137 |
lm_eval/tasks/translation/wmt14_en-fr.yaml |
sha256=jQIlH1WktTOrRKmbNfDkbOxuRAwrjJ2zZfnfc84ylYQ
|
294 |
lm_eval/tasks/translation/wmt14_fr-en.yaml |
sha256=8NmJ6H7bQoBT2vqbZXmQEQUJf5-NEQkdIE6I7KhGEhs
|
294 |
lm_eval/tasks/translation/wmt16_de-en.yaml |
sha256=5kZvgi-Z4TxRhSehntg8p7Omtq8_SL5lPV6jb02qOKg
|
294 |
lm_eval/tasks/translation/wmt16_en-de.yaml |
sha256=WnHNT4lFysZkw-c9Ox0STgnBPurgjiMqH-LH1t4CEBE
|
294 |
lm_eval/tasks/translation/wmt16_en-ro.yaml |
sha256=0mcSrvjsNnO2pOXStd3OAr_vsSyGHAPCR80pB-i2ED8
|
296 |
lm_eval/tasks/translation/wmt16_ro-en.yaml |
sha256=8-nK4wweCzQENB-0StNgH6WZbGJL-k_wczDIGte2RIQ
|
296 |
lm_eval/tasks/translation/wmt_common_yaml |
sha256=4BgUbieb4MnTun4p3kDu8VyXie6ZCiK_AsGzyjhnLVA
|
298 |
lm_eval/tasks/triviaqa/README.md |
sha256=UwDPFH5UD913cyyUTjFIM48iSgDjjNltRQLbjRo5n5A
|
1852 |
lm_eval/tasks/triviaqa/default.yaml |
sha256=ThYo2Nn6tgLNlQsyOTOsJTzr7TJFNY7u1_acqptPnes
|
694 |
lm_eval/tasks/truthfulqa/README.md |
sha256=APxG9NLQHaq6QzbZxyKgkmOvZbjaTQLb-od3MiYTQ-Y
|
1717 |
lm_eval/tasks/truthfulqa/truthfulqa_gen.yaml |
sha256=psxrG3t3GHRxmUr3s22UINbxf-BspNmelkBx3WAPvgA
|
2248 |
lm_eval/tasks/truthfulqa/truthfulqa_mc1.yaml |
sha256=HW6e3LiSi9FCinX-g7Ct70_PUq79yzqtVMLEn9T5zso
|
1170 |
lm_eval/tasks/truthfulqa/truthfulqa_mc2.yaml |
sha256=CCxBfqAudGmjwLaJZxq0MkQZfU3o6n4IBQAI-aMs9t4
|
330 |
lm_eval/tasks/truthfulqa/utils.py |
sha256=7IpXGvKG-r3UA6PHCMC8uWaNXTsbLxRwctkxuyEToTo
|
6012 |
lm_eval/tasks/unscramble/README.md |
sha256=8fD3JDITiBTcee1qvuz-EzbXAjdGI4IR6hGY6dCdIaw
|
2615 |
lm_eval/tasks/unscramble/anagrams1.yaml |
sha256=l1cfwRW6nxbBkDFm3lJGcpi112REjsvxbBTL6Xd-zI4
|
463 |
lm_eval/tasks/unscramble/anagrams2.yaml |
sha256=djXvxXNfC3p-heygzjR4wlufyTPaGKXuQP9t2n6GjCs
|
463 |
lm_eval/tasks/unscramble/cycle_letters.yaml |
sha256=XA3XPKaeqviVedLTxj_yWYV9joEUXRymoSy9Fi0WW7k
|
469 |
lm_eval/tasks/unscramble/random_insertion.yaml |
sha256=aOxzwtkMUMFKDa-MGoFvgkpfHOYP_8o2rpwJpSV037A
|
475 |
lm_eval/tasks/unscramble/reversed_words.yaml |
sha256=niZuIfApjhPBO_j4KN955nGeDcoE4gJ88tYXSEQYjOA
|
421 |
lm_eval/tasks/webqs/README.md |
sha256=XaGMylFq_iwthSyM7VvHE5rVMzgQ9GJ6cVaQLMmagaY
|
1933 |
lm_eval/tasks/webqs/utils.py |
sha256=s01Tkm1AQQ_BjJtUVayw1fJ5BsxaGjtCTrkJnF_fy_g
|
773 |
lm_eval/tasks/webqs/webqs.yaml |
sha256=qfxQ_Lf-olbLay21rv_4qPvWhIbRLTNtuTUIg9EsO2Y
|
484 |
lm_eval/tasks/wikitext/README.md |
sha256=TIKOT6ySFrA3YAFL66ftz8FRL-hgJ0EfirXpSqH1294
|
1477 |
lm_eval/tasks/wikitext/preprocess_wikitext.py |
sha256=pEAgN0sXIVm_W-gKZNLEGUydXHcoT2lqxmY2EzjI2n0
|
1738 |
lm_eval/tasks/wikitext/wikitext.yaml |
sha256=Yzm4WJBjfaGwZKSE8T2ey-y1QiEePs3PbnYVabAxQ6c
|
574 |
lm_eval/tasks/winogrande/README.md |
sha256=vA2S-iOSnXTAXPQxEqRhwZMd3axmvKA3P-7tUcY2SFo
|
1816 |
lm_eval/tasks/winogrande/default.yaml |
sha256=7diBVsCZbcWNM7Vfgow1_w0sSod6GjR1JOYBXBUaxFM
|
498 |
lm_eval/tasks/winogrande/preprocess_winogrande.py |
sha256=5VMnYpJkqY8dOD_aJGRbZ3mvtT-gvOIVAEK5QWsa4AY
|
377 |
lm_eval/tasks/wmdp/README.md |
sha256=mgqAtEIrAnK2OsW4v1jyZaPsnMse4XU6X9vcDcv5iTI
|
2795 |
lm_eval/tasks/wmdp/_default_template_yaml |
sha256=Qvs27h_LiZx36xm7H5zgwFHCd2FY1Fa6CjTJYmSiaeQ
|
421 |
lm_eval/tasks/wmdp/wmdp_bio.yaml |
sha256=m-1-UcfSRncg9OeKLVjRHcf2vUZwW8l8cXAViPClKwU
|
177 |
lm_eval/tasks/wmdp/wmdp_chem.yaml |
sha256=39eQizGmPz7BO6m89T_9EWiYokPB4Fk1IRQEBNV-9-Y
|
181 |
lm_eval/tasks/wmdp/wmdp_cyber.yaml |
sha256=2iqzu1KkuTHw0tnd-GHYaOtaQ-UZwfMTAlr2nMVvKYA
|
187 |
lm_eval/tasks/wmt2016/README.md |
sha256=KlOtv8lY7r4KGFf_-quEOdwm90d0bp3Wfz9TimENrJs
|
2092 |
lm_eval/tasks/wmt2016/metrics.py |
sha256=V629nou9UMoPluWjgjf2D9IlbXi0YD2HWy7mspQZQmE
|
280 |
lm_eval/tasks/wmt2016/ro_en-t5_prompt.yaml |
sha256=87dSDcZQieh1V-j9QKE0FOl9FV40R8QttfBxIX0CLuA
|
481 |
lm_eval/tasks/wsc273/README.md |
sha256=ACWo1bwzuYf66R7z0xxa4hMc2I6jdb71D5V-GeXNL-c
|
2963 |
lm_eval/tasks/wsc273/default.yaml |
sha256=1t8UiaRZWvEGfFS6REqxXek1OEwc5fhzV11RAYa8dls
|
518 |
lm_eval/tasks/wsc273/utils.py |
sha256=LCldN-jXX1ilzpSIOdIMuZcdHA12J4eCkb69RYTGNQc
|
1005 |
lm_eval/tasks/xcopa/README.md |
sha256=bszl23gtJTrwRRgk3JS7pbStFHqU5n7CW2s6YnNdwQI
|
2211 |
lm_eval/tasks/xcopa/default_et.yaml |
sha256=SrP37-d0yWJyog3yuH8ebbjorTooXciVaInVYKHns0g
|
304 |
lm_eval/tasks/xcopa/default_ht.yaml |
sha256=YiVPPHda2D5HOmRzwiZsBXsSBdo90wBaRH5X7YQGnTY
|
101 |
lm_eval/tasks/xcopa/default_id.yaml |
sha256=XxcNzEJFlUUGpyx_vvEiDKqPlzqr2rlkDpunwcp-Wzc
|
101 |
lm_eval/tasks/xcopa/default_it.yaml |
sha256=P85UpV5Ilfr8wFA1Dupc6dQn-KVn9LDhxT9YOQb4A7Q
|
101 |
lm_eval/tasks/xcopa/default_qu.yaml |
sha256=6CR5W6wWzpvLSr6X16gELeM_pDjahhLfnhUnyEKvnWk
|
101 |
lm_eval/tasks/xcopa/default_sw.yaml |
sha256=I0HIJi_MHQPkbBj2OGF9yn_9nupq-bxsWaU0mfLntf0
|
101 |
lm_eval/tasks/xcopa/default_ta.yaml |
sha256=T-ZV3pCgYTToODyBNJA0L5CrD4OspR8-hkS35TEfIqE
|
101 |
lm_eval/tasks/xcopa/default_th.yaml |
sha256=_eMapb7miFw0cZuZaG1kSSR4Kjx2LFv2_8XTkkIb9BE
|
101 |
lm_eval/tasks/xcopa/default_tr.yaml |
sha256=6VzN3-CzEotaJrB_ZesEEHKM6XEQqY_kzHiXrDInNYs
|
101 |
lm_eval/tasks/xcopa/default_vi.yaml |
sha256=0TBQaLnbCUIB74GGs5gOgoprp4OSfK1vZ1fZgCIqrLw
|
101 |
lm_eval/tasks/xcopa/default_zh.yaml |
sha256=R4P1Ibs5oJps9Hs2AeBBrL27yJW8OCXkL3ORaBCnfto
|
101 |
lm_eval/tasks/xcopa/utils.py |
sha256=GR0xu7_Ga-e2bLxBAFPhNjEgGjcA33SfI8ZT-3g03UM
|
1791 |
lm_eval/tasks/xnli/README.md |
sha256=M6yJ8Ui08vdiDQRLW9EejDPrSLuop09XVmZu0RfJEgU
|
2224 |
lm_eval/tasks/xnli/utils.py |
sha256=sYhlevG44xK_xQ-nlIaLC_3TAddLR0bSS9EmELz61KM
|
5277 |
lm_eval/tasks/xnli/xnli_ar.yaml |
sha256=-vGMt34SYGsrxhJH2mzVJJ44UwCs44_EdPkT9F-b6zU
|
248 |
lm_eval/tasks/xnli/xnli_bg.yaml |
sha256=3ZCMy6xC4r1HN_324m3Tqc4LjL2ZJTVlQAzG6Anmq34
|
270 |
lm_eval/tasks/xnli/xnli_common_yaml |
sha256=JvhM_cqTEn1ALdYJDy00935ej4ip0ozGEa-Ag7Godas
|
482 |
lm_eval/tasks/xnli/xnli_de.yaml |
sha256=Jk1ZgtT9ji3lq3TVfu0jCQxUj8WJ1dZeaSyEkLzPiN4
|
237 |
lm_eval/tasks/xnli/xnli_el.yaml |
sha256=Ljnc0ksd4-SYjDNhCBtZMP5SDk8gjD9k9RgxzFk4kuo
|
262 |
lm_eval/tasks/xnli/xnli_en.yaml |
sha256=YeCSTN2rwAT0NLWzh1DW19PoAMee46W-hf0ScBeyhfE
|
230 |
lm_eval/tasks/xnli/xnli_es.yaml |
sha256=GkwQMf22cNfBhIVubRAzkRPL8TGPCi0gilZFWdaoF1w
|
242 |
lm_eval/tasks/xnli/xnli_fr.yaml |
sha256=RdfT4cthik8ZS7sSmkvsoxuK2nTdDouNOpzrZ-Lebdg
|
238 |
lm_eval/tasks/xnli/xnli_hi.yaml |
sha256=pPuF91nLvDCOVXQ1bANGV-UQFedcez_2XW-OapqEX6Y
|
269 |
lm_eval/tasks/xnli/xnli_ru.yaml |
sha256=1tAyhdGQKXpFQrIM_2-SAdPv7v34Ot1Y_NlX1WNk2PI
|
276 |
lm_eval/tasks/xnli/xnli_sw.yaml |
sha256=Z6CF-2C6DyPh0nzk7GnqjtWnOHAw5zblmfDVjAQmJAU
|
240 |
lm_eval/tasks/xnli/xnli_th.yaml |
sha256=N1QOrp7HkzYrx0TAiSMhEAJmWwETEAGsMBM3gTeoWnc
|
308 |
lm_eval/tasks/xnli/xnli_tr.yaml |
sha256=bUvapKIUdJCJKc7CCIl918aJiWwhEiEsoMXJtbrTgn4
|
242 |
lm_eval/tasks/xnli/xnli_ur.yaml |
sha256=47LmNHEByKsde-KLFlxDfWgHiF6MX06isosv6YF7Rj4
|
260 |
lm_eval/tasks/xnli/xnli_vi.yaml |
sha256=Aw64QMiB-AAhq5xMgbZQs6dEzFC4njOpbH7bMokjq2w
|
244 |
lm_eval/tasks/xnli/xnli_zh.yaml |
sha256=f7rvxUp0E8CgBu4d-YyCQOYx-d6eYRmiVfj0vNMdpsg
|
245 |
lm_eval/tasks/xstorycloze/README.md |
sha256=zFx4IhOCGFNVCkUqmcnBH10c7_xyEHX4p_V4OPEFRJg
|
2674 |
lm_eval/tasks/xstorycloze/default_ar.yaml |
sha256=afOQjiQuTcheJoiYRATRgtCQgkb3DKRq522TzVBESBc
|
616 |
lm_eval/tasks/xstorycloze/default_en.yaml |
sha256=jkXDziy5ZFSxiBBfvpF5X0PD7r2-EoJuPvpM_YO57mo
|
63 |
lm_eval/tasks/xstorycloze/default_es.yaml |
sha256=krymcDmxJbEqyaLMjJ2qCTp72_vpe30EyrqAytvGmFA
|
63 |
lm_eval/tasks/xstorycloze/default_eu.yaml |
sha256=Jp7s9WOyPBO-r8ZMHXgrHWYXsOSxwTFoLM09w7xktT4
|
63 |
lm_eval/tasks/xstorycloze/default_hi.yaml |
sha256=0baA81PaJh6O_rHk5Zt75RlB0Rm8IeIEmcwWl65AeCc
|
63 |
lm_eval/tasks/xstorycloze/default_id.yaml |
sha256=3eufzTCUzloyMmZmNmtT9jkilhLaaUlhZyWYtSoO6K4
|
63 |
lm_eval/tasks/xstorycloze/default_my.yaml |
sha256=Lru52K3docj3SyM8yb_vKEdejBL5587nj2WIyPEoKXk
|
63 |
lm_eval/tasks/xstorycloze/default_ru.yaml |
sha256=NQLa7Ztu0eLDeJSeSiiR-6KYJE4im3-0IFP7JG-E-AU
|
63 |
lm_eval/tasks/xstorycloze/default_sw.yaml |
sha256=BkOasjoNtcIMwhhgB51ZhY9R8E0O2K8RMiiQewpRoBQ
|
63 |
lm_eval/tasks/xstorycloze/default_te.yaml |
sha256=uS7g8yrYniDdX3QuXwCSZsXMBQNAoDFDuGLXKNJ9P-Y
|
63 |
lm_eval/tasks/xstorycloze/default_zh.yaml |
sha256=TTaSyzTXWpqEgcCaadNWnxrHKXB7cdMuSEpZ9OeqHZE
|
63 |
lm_eval/tasks/xwinograd/README.md |
sha256=qPmixk1nZorlQSshnqtAoP1i5Zy4vrgJry65OLGklXk
|
2601 |
lm_eval/tasks/xwinograd/utils.py |
sha256=7DLwv-y0XYAiAnlSKsBG7yrD94kERHmLVqwpNIsnNV0
|
2844 |
lm_eval/tasks/xwinograd/xwinograd_common_yaml |
sha256=Eve4-QbUaUIo2_ztQ-RJNIt2bdfa8Wk3mQUQUhlFM5k
|
622 |
lm_eval/tasks/xwinograd/xwinograd_en.yaml |
sha256=xbEp4QSQgNlKymjEFxXVonpbG7IKDjtFuTa1DzNTpUc
|
91 |
lm_eval/tasks/xwinograd/xwinograd_fr.yaml |
sha256=UZ7Txl6Q3d9bWvZXvjGxVQxGMnZ2_5bLL7Ykrhu_-nA
|
91 |
lm_eval/tasks/xwinograd/xwinograd_jp.yaml |
sha256=aRVwy9c6YOGpRFgm4oAUnljHW2y5UTF6IvwzEeOjVnc
|
91 |
lm_eval/tasks/xwinograd/xwinograd_pt.yaml |
sha256=A8oaox90xLwx0N1G8MfRpZGB8Tof6mux8EtgJpSrOaE
|
91 |
lm_eval/tasks/xwinograd/xwinograd_ru.yaml |
sha256=ra7PfDvFLZS1sBiMI7hRBjSWCmElclMWFwChrIg9-HY
|
91 |
lm_eval/tasks/xwinograd/xwinograd_zh.yaml |
sha256=OAf84RMb0BbFc3DGtBij-84FGwKDwHH9d_eGRXN_K0Y
|
91 |
lm_eval-0.4.2.dist-info/LICENSE.md |
sha256=qAbkJUdiDf-8LsAzMyLIs1I7SvEeBZvhTvgapbGuAh8
|
1067 |
lm_eval-0.4.2.dist-info/METADATA |
sha256=QnCs1KNNkqVy2ihhGORhahuLmTkTNPs9c7O0eNy9CZQ
|
30958 |
lm_eval-0.4.2.dist-info/WHEEL |
sha256=GJ7t_kWBFywbagK5eo9IoUwLW6oyOeTKmQ-9iHFVNxQ
|
92 |
lm_eval-0.4.2.dist-info/entry_points.txt |
sha256=mMr4hFXQwSHYb924AKGzP6dbbBAWcXiyBO-AfXrV72E
|
98 |
lm_eval-0.4.2.dist-info/top_level.txt |
sha256=risQwf3pU3EoXaYL_bKYFzW6EtBOvJxJotKdDz605Dk
|
8 |
lm_eval-0.4.2.dist-info/RECORD |
— |
— |