Created
June 26, 2025 22:30
-
-
Save egafni/969e1d83d1ebe74de04ff214d1ed564c to your computer and use it in GitHub Desktop.
This file has been truncated, but you can view the full file.
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| | Group | Config Location | | |
|---|------------------------------------------------|---------------------------------------------------------------------------------------------------------------------------------------------|---|---|
| |AraDiCE |lm_eval/tasks/aradice/aradice.yaml | | |
| |AraDiCE_ArabicMMLU_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU.yaml | | |
| |AraDiCE_ArabicMMLU_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU.yaml | | |
| |aclue |lm_eval/tasks/aclue/_aclue.yaml | | |
| |adr |lm_eval/tasks/afrobench/adr/afridiacritics.yaml | | |
| |aexams |lm_eval/tasks/aexams/_aexams.yaml | | |
| |african_flores |lm_eval/tasks/afrobench/flores/flores.yaml | | |
| |african_ntrex |lm_eval/tasks/afrobench/ntrex/ntrex.yaml | | |
| |afrimgsm-irokobench |lm_eval/tasks/afrimgsm/direct/afrimgsm.yaml | | |
| |afrimgsm_cot-irokobench |lm_eval/tasks/afrimgsm/direct_cot/afrimgsm_cot.yaml | | |
| |afrimgsm_tt-irokobench |lm_eval/tasks/afrimgsm/translate/afrimgsm_tt.yaml | | |
| |afrimgsm_tt_cot-irokobench |lm_eval/tasks/afrimgsm/translate_cot/afrimgsm_tt_cot.yaml | | |
| |afrimmlu-irokobench |lm_eval/tasks/afrimmlu/direct/afrimmlu.yaml | | |
| |afrimmlu_tt-irokobench |lm_eval/tasks/afrimmlu/translate/afrimmlu_tt.yaml | | |
| |afriqa |lm_eval/tasks/afrobench/afriqa/afriqa.yaml | | |
| |afrisenti |lm_eval/tasks/afrobench/afrisenti/afrisenti.yaml | | |
| |afrixnli-irokobench |lm_eval/tasks/afrixnli/direct/afrixnli.yaml | | |
| |afrixnli_tt-irokobench |lm_eval/tasks/afrixnli/translate/afrixnli_tt.yaml | | |
| |afrobench |lm_eval/tasks/afrobench/afrobench.yaml | | |
| |afrobench_lite |lm_eval/tasks/afrobench/afrobench-lite.yaml | | |
| |agieval |lm_eval/tasks/agieval/agieval.yaml | | |
| |agieval_cn |lm_eval/tasks/agieval/agieval_cn.yaml | | |
| |agieval_en |lm_eval/tasks/agieval/agieval_en.yaml | | |
| |agieval_nous |lm_eval/tasks/agieval/agieval_nous.yaml | | |
| |arab_culture |lm_eval/tasks/arab_culture/_arab_culture.yaml | | |
| |arab_culture_completion |lm_eval/tasks/arab_culture_completion/_arab_culture_completion.yaml | | |
| |arab_culture_completion_gulf |lm_eval/tasks/arab_culture_completion/_arab_culture_completion_gulf.yaml | | |
| |arab_culture_completion_levant |lm_eval/tasks/arab_culture_completion/_arab_culture_completion_levant.yaml | | |
| |arab_culture_completion_nile_valley |lm_eval/tasks/arab_culture_completion/_arab_culture_completion_nile_valley.yaml | | |
| |arab_culture_completion_north_africa |lm_eval/tasks/arab_culture_completion/_arab_culture_completion_north_africa.yaml | | |
| |arab_culture_gulf |lm_eval/tasks/arab_culture/_arab_culture_gulf.yaml | | |
| |arab_culture_levant |lm_eval/tasks/arab_culture/_arab_culture_levant.yaml | | |
| |arab_culture_nile_valley |lm_eval/tasks/arab_culture/_arab_culture_nile_valley.yaml | | |
| |arab_culture_north_africa |lm_eval/tasks/arab_culture/_arab_culture_north_africa.yaml | | |
| |arabic_leaderboard_acva |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva.yaml | | |
| |arabic_leaderboard_acva_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_light.yaml | | |
| |arabic_leaderboard_alghafa |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_alghafa/arabic_leaderboard_alghafa.yaml | | |
| |arabic_leaderboard_alghafa_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_alghafa_light/arabic_leaderboard_alghafa_light.yaml | | |
| |arabic_leaderboard_arabic_exams |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_exams/arabic_leaderboard_arabic_exams.yaml | | |
| |arabic_leaderboard_arabic_exams_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_exams_light/arabic_leaderboard_arabic_exams_light.yaml | | |
| |arabic_leaderboard_arabic_mmlu |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu.yaml | | |
| |arabic_leaderboard_arabic_mmlu_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_light.yaml | | |
| |arabic_leaderboard_arabic_mt_arc_challenge |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_arc_challenge/arabic_leaderboard_arabic_mt_arc_challenge.yaml | | |
| |arabic_leaderboard_arabic_mt_arc_challenge_light|lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_arc_challenge_light/arabic_leaderboard_arabic_mt_arc_challenge_light.yaml| | |
| |arabic_leaderboard_arabic_mt_arc_easy |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_arc_easy/arabic_leaderboard_arabic_mt_arc_easy.yaml | | |
| |arabic_leaderboard_arabic_mt_arc_easy_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_arc_easy_light/arabic_leaderboard_arabic_mt_arc_easy_light.yaml | | |
| |arabic_leaderboard_arabic_mt_boolq |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_boolq/arabic_leaderboard_arabic_mt_boolq.yaml | | |
| |arabic_leaderboard_arabic_mt_boolq_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_boolq_light/arabic_leaderboard_arabic_mt_boolq_light.yaml | | |
| |arabic_leaderboard_arabic_mt_copa |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_copa/arabic_leaderboard_arabic_mt_copa.yaml | | |
| |arabic_leaderboard_arabic_mt_copa_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_copa_light/arbic_leaderboard_arabic_mt_copa_light.yaml | | |
| |arabic_leaderboard_arabic_mt_hellaswag |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_hellaswag/arabic_leaderboard_arabic_mt_hellaswag.yaml | | |
| |arabic_leaderboard_arabic_mt_hellaswag_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_hellaswag_light/arabic_leaderboard_arabic_mt_hellaswag_light.yaml | | |
| |arabic_leaderboard_arabic_mt_mmlu |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_mmlu/arabic_leaderboard_arabic_mt_mmlu.yaml | | |
| |arabic_leaderboard_arabic_mt_mmlu_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_mmlu_light/arabic_leaderboard_arabic_mt_mmlu_light.yaml | | |
| |arabic_leaderboard_arabic_mt_openbook_qa |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_openbook_qa/arabic_leaderboard_arabic_mt_openbook_qa.yaml | | |
| |arabic_leaderboard_arabic_mt_openbook_qa_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_openbook_qa_light/arabic_leaderboard_arabic_mt_openbook_qa_light.yaml | | |
| |arabic_leaderboard_arabic_mt_piqa |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_piqa/arabic_leaderboard_arabic_mt_piqa.yaml | | |
| |arabic_leaderboard_arabic_mt_piqa_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_piqa_light/arabic_leaderboard_arabic_mt_piqa_light.yaml | | |
| |arabic_leaderboard_arabic_mt_race |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_race/arabic_leaderboard_arabic_mt_race.yaml | | |
| |arabic_leaderboard_arabic_mt_race_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_race_light/arabic_leaderboard_arabic_mt_race_light.yaml | | |
| |arabic_leaderboard_arabic_mt_sciq |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_sciq/arabic_leaderboard_arabic_mt_sciq.yaml | | |
| |arabic_leaderboard_arabic_mt_sciq_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_sciq_light/arabic_leaderboard_arabic_mt_sciq_light.yaml | | |
| |arabic_leaderboard_arabic_mt_toxigen |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_toxigen/arabic_leaderboard_arabic_mt_toxigen.yaml | | |
| |arabic_leaderboard_arabic_mt_toxigen_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_toxigen_light/arabic_leaderboard_arabic_mt_toxigen_light.yaml | | |
| |arabic_leaderboard_complete |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_complete.yaml | | |
| |arabic_leaderboard_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_light.yaml | | |
| |arabicmmlu |lm_eval/tasks/arabicmmlu/_arabicmmlu.yaml | | |
| |arabicmmlu_humanities |lm_eval/tasks/arabicmmlu/_arabicmmlu_humanities.yaml | | |
| |arabicmmlu_language |lm_eval/tasks/arabicmmlu/_arabicmmlu_language.yaml | | |
| |arabicmmlu_other |lm_eval/tasks/arabicmmlu/_arabicmmlu_other.yaml | | |
| |arabicmmlu_social_science |lm_eval/tasks/arabicmmlu/_arabicmmlu_social_science.yaml | | |
| |arabicmmlu_stem |lm_eval/tasks/arabicmmlu/_arabicmmlu_stem.yaml | | |
| |basque_bench |lm_eval/tasks/basque_bench/basque_bench.yaml | | |
| |bbh |lm_eval/tasks/bbh/cot_fewshot/_bbh.yaml | | |
| |bbh_cot_fewshot |lm_eval/tasks/bbh/cot_fewshot/_bbh_cot_fewshot.yaml | | |
| |bbh_cot_zeroshot |lm_eval/tasks/bbh/cot_zeroshot/_bbh_cot_zeroshot.yaml | | |
| |bbh_fewshot |lm_eval/tasks/bbh/fewshot/_bbh_fewshot.yaml | | |
| |bbh_zeroshot |lm_eval/tasks/bbh/zeroshot/_bbh_zeroshot.yaml | | |
| |belebele |lm_eval/tasks/afrobench/belebele/belebele.yaml | | |
| |blimp |lm_eval/tasks/blimp/_blimp.yaml | | |
| |catalan_bench |lm_eval/tasks/catalan_bench/catalan_bench.yaml | | |
| |ceval-valid |lm_eval/tasks/ceval/_ceval-valid.yaml | | |
| |cmmlu |lm_eval/tasks/cmmlu/_cmmlu.yaml | | |
| |csatqa |lm_eval/tasks/csatqa/_csatqa.yaml | | |
| |darija_sentiment |lm_eval/tasks/darija_bench/darija_sentiment/darija_sentiment.yaml | | |
| |darija_summarization |lm_eval/tasks/darija_bench/darija_summarization/summarization_darija.yaml | | |
| |darija_translation |lm_eval/tasks/darija_bench/darija_translation/translation_darija.yaml | | |
| |darija_translation_doda |lm_eval/tasks/darija_bench/darija_translation/doda_translation_darija.yaml | | |
| |darija_translation_flores |lm_eval/tasks/darija_bench/darija_translation/flores_translation_darija.yaml | | |
| |darija_translation_madar |lm_eval/tasks/darija_bench/darija_translation/madar_translation_darija.yaml | | |
| |darija_translation_seed |lm_eval/tasks/darija_bench/darija_translation/seed_translation_darija.yaml | | |
| |darija_transliteration |lm_eval/tasks/darija_bench/darija_transliteration/transliteration_darija.yaml | | |
| |darijammlu |lm_eval/tasks/darijammlu/_darijammlu.yaml | | |
| |darijammlu_ar_mmlu |lm_eval/tasks/darijammlu/_darijammlu_ar_mmlu.yaml | | |
| |darijammlu_mmlu |lm_eval/tasks/darijammlu/_darijammlu_mmlu.yaml | | |
| |evalita-mp |lm_eval/tasks/evalita_llm/_evalita-mp.yaml | | |
| |evalita-mp_at |lm_eval/tasks/evalita_llm/_evalita-mp_at_tasks.yaml | | |
| |evalita-mp_faq |lm_eval/tasks/evalita_llm/_evalita-mp_faq_tasks.yaml | | |
| |evalita-mp_gen |lm_eval/tasks/evalita_llm/_evalita-mp_gen.yaml | | |
| |evalita-mp_hs |lm_eval/tasks/evalita_llm/_evalita-mp_hs_task.yaml | | |
| |evalita-mp_ls |lm_eval/tasks/evalita_llm/_evalita-mp_ls_task.yaml | | |
| |evalita-mp_mc |lm_eval/tasks/evalita_llm/_evalita-mp_mc.yaml | | |
| |evalita-mp_ner_adg_group |lm_eval/tasks/evalita_llm/_evalita-mp_ner-adg_group.yaml | | |
| |evalita-mp_ner_fic_group |lm_eval/tasks/evalita_llm/_evalita-mp_ner-fic_group.yaml | | |
| |evalita-mp_ner_group |lm_eval/tasks/evalita_llm/_evalita-mp_ner_group.yaml | | |
| |evalita-mp_ner_wn_group |lm_eval/tasks/evalita_llm/_evalita-mp_ner-wn_group.yaml | | |
| |evalita-mp_re |lm_eval/tasks/evalita_llm/_evalita-mp_re_task.yaml | | |
| |evalita-mp_sa |lm_eval/tasks/evalita_llm/_evalita-mp_sa_tasks.yaml | | |
| |evalita-mp_sum_fp |lm_eval/tasks/evalita_llm/_evalita-mp_sum_fp-small_task.yaml | | |
| |evalita-mp_te |lm_eval/tasks/evalita_llm/_evalita-mp_te_tasks.yaml | | |
| |evalita-mp_wic |lm_eval/tasks/evalita_llm/_evalita-mp_wic_tasks.yaml | | |
| |flan_held_in |lm_eval/tasks/benchmarks/flan/flan_held_in.yaml | | |
| |flan_held_out |lm_eval/tasks/benchmarks/flan/flan_held_out.yaml | | |
| |flores_ca |lm_eval/tasks/catalan_bench/flores_ca/flores_ca.yaml | | |
| |flores_es |lm_eval/tasks/spanish_bench/flores_es/flores_es.yaml | | |
| |flores_eu |lm_eval/tasks/basque_bench/flores_eu/flores_eu.yaml | | |
| |flores_gl |lm_eval/tasks/galician_bench/flores_gl/flores_gl.yaml | | |
| |flores_pt |lm_eval/tasks/portuguese_bench/flores_pt/flores_pt.yaml | | |
| |galician_bench |lm_eval/tasks/galician_bench/galician_bench.yaml | | |
| |global_mmlu_ar |lm_eval/tasks/global_mmlu/default/ar/_global_mmlu_ar.yaml | | |
| |global_mmlu_bn |lm_eval/tasks/global_mmlu/default/bn/_global_mmlu_bn.yaml | | |
| |global_mmlu_de |lm_eval/tasks/global_mmlu/default/de/_global_mmlu_de.yaml | | |
| |global_mmlu_en |lm_eval/tasks/global_mmlu/default/en/_global_mmlu_en.yaml | | |
| |global_mmlu_es |lm_eval/tasks/global_mmlu/default/es/_global_mmlu_es.yaml | | |
| |global_mmlu_fr |lm_eval/tasks/global_mmlu/default/fr/_global_mmlu_fr.yaml | | |
| |global_mmlu_full_am |lm_eval/tasks/global_mmlu/full/am/_global_mmlu_full_am.yaml | | |
| |global_mmlu_full_am_humanities |lm_eval/tasks/global_mmlu/full/am/_global_mmlu_full_am_humanities.yaml | | |
| |global_mmlu_full_am_other |lm_eval/tasks/global_mmlu/full/am/_global_mmlu_full_am_other.yaml | | |
| |global_mmlu_full_am_social_sciences |lm_eval/tasks/global_mmlu/full/am/_global_mmlu_full_am_social_sciences.yaml | | |
| |global_mmlu_full_am_stem |lm_eval/tasks/global_mmlu/full/am/_global_mmlu_full_am_stem.yaml | | |
| |global_mmlu_full_ar |lm_eval/tasks/global_mmlu/full/ar/_global_mmlu_full_ar.yaml | | |
| |global_mmlu_full_ar_humanities |lm_eval/tasks/global_mmlu/full/ar/_global_mmlu_full_ar_humanities.yaml | | |
| |global_mmlu_full_ar_other |lm_eval/tasks/global_mmlu/full/ar/_global_mmlu_full_ar_other.yaml | | |
| |global_mmlu_full_ar_social_sciences |lm_eval/tasks/global_mmlu/full/ar/_global_mmlu_full_ar_social_sciences.yaml | | |
| |global_mmlu_full_ar_stem |lm_eval/tasks/global_mmlu/full/ar/_global_mmlu_full_ar_stem.yaml | | |
| |global_mmlu_full_bn |lm_eval/tasks/global_mmlu/full/bn/_global_mmlu_full_bn.yaml | | |
| |global_mmlu_full_bn_humanities |lm_eval/tasks/global_mmlu/full/bn/_global_mmlu_full_bn_humanities.yaml | | |
| |global_mmlu_full_bn_other |lm_eval/tasks/global_mmlu/full/bn/_global_mmlu_full_bn_other.yaml | | |
| |global_mmlu_full_bn_social_sciences |lm_eval/tasks/global_mmlu/full/bn/_global_mmlu_full_bn_social_sciences.yaml | | |
| |global_mmlu_full_bn_stem |lm_eval/tasks/global_mmlu/full/bn/_global_mmlu_full_bn_stem.yaml | | |
| |global_mmlu_full_cs |lm_eval/tasks/global_mmlu/full/cs/_global_mmlu_full_cs.yaml | | |
| |global_mmlu_full_cs_humanities |lm_eval/tasks/global_mmlu/full/cs/_global_mmlu_full_cs_humanities.yaml | | |
| |global_mmlu_full_cs_other |lm_eval/tasks/global_mmlu/full/cs/_global_mmlu_full_cs_other.yaml | | |
| |global_mmlu_full_cs_social_sciences |lm_eval/tasks/global_mmlu/full/cs/_global_mmlu_full_cs_social_sciences.yaml | | |
| |global_mmlu_full_cs_stem |lm_eval/tasks/global_mmlu/full/cs/_global_mmlu_full_cs_stem.yaml | | |
| |global_mmlu_full_de |lm_eval/tasks/global_mmlu/full/de/_global_mmlu_full_de.yaml | | |
| |global_mmlu_full_de_humanities |lm_eval/tasks/global_mmlu/full/de/_global_mmlu_full_de_humanities.yaml | | |
| |global_mmlu_full_de_other |lm_eval/tasks/global_mmlu/full/de/_global_mmlu_full_de_other.yaml | | |
| |global_mmlu_full_de_social_sciences |lm_eval/tasks/global_mmlu/full/de/_global_mmlu_full_de_social_sciences.yaml | | |
| |global_mmlu_full_de_stem |lm_eval/tasks/global_mmlu/full/de/_global_mmlu_full_de_stem.yaml | | |
| |global_mmlu_full_el |lm_eval/tasks/global_mmlu/full/el/_global_mmlu_full_el.yaml | | |
| |global_mmlu_full_el_humanities |lm_eval/tasks/global_mmlu/full/el/_global_mmlu_full_el_humanities.yaml | | |
| |global_mmlu_full_el_other |lm_eval/tasks/global_mmlu/full/el/_global_mmlu_full_el_other.yaml | | |
| |global_mmlu_full_el_social_sciences |lm_eval/tasks/global_mmlu/full/el/_global_mmlu_full_el_social_sciences.yaml | | |
| |global_mmlu_full_el_stem |lm_eval/tasks/global_mmlu/full/el/_global_mmlu_full_el_stem.yaml | | |
| |global_mmlu_full_en |lm_eval/tasks/global_mmlu/full/en/_global_mmlu_full_en.yaml | | |
| |global_mmlu_full_en_humanities |lm_eval/tasks/global_mmlu/full/en/_global_mmlu_full_en_humanities.yaml | | |
| |global_mmlu_full_en_other |lm_eval/tasks/global_mmlu/full/en/_global_mmlu_full_en_other.yaml | | |
| |global_mmlu_full_en_social_sciences |lm_eval/tasks/global_mmlu/full/en/_global_mmlu_full_en_social_sciences.yaml | | |
| |global_mmlu_full_en_stem |lm_eval/tasks/global_mmlu/full/en/_global_mmlu_full_en_stem.yaml | | |
| |global_mmlu_full_es |lm_eval/tasks/global_mmlu/full/es/_global_mmlu_full_es.yaml | | |
| |global_mmlu_full_es_humanities |lm_eval/tasks/global_mmlu/full/es/_global_mmlu_full_es_humanities.yaml | | |
| |global_mmlu_full_es_other |lm_eval/tasks/global_mmlu/full/es/_global_mmlu_full_es_other.yaml | | |
| |global_mmlu_full_es_social_sciences |lm_eval/tasks/global_mmlu/full/es/_global_mmlu_full_es_social_sciences.yaml | | |
| |global_mmlu_full_es_stem |lm_eval/tasks/global_mmlu/full/es/_global_mmlu_full_es_stem.yaml | | |
| |global_mmlu_full_fa |lm_eval/tasks/global_mmlu/full/fa/_global_mmlu_full_fa.yaml | | |
| |global_mmlu_full_fa_humanities |lm_eval/tasks/global_mmlu/full/fa/_global_mmlu_full_fa_humanities.yaml | | |
| |global_mmlu_full_fa_other |lm_eval/tasks/global_mmlu/full/fa/_global_mmlu_full_fa_other.yaml | | |
| |global_mmlu_full_fa_social_sciences |lm_eval/tasks/global_mmlu/full/fa/_global_mmlu_full_fa_social_sciences.yaml | | |
| |global_mmlu_full_fa_stem |lm_eval/tasks/global_mmlu/full/fa/_global_mmlu_full_fa_stem.yaml | | |
| |global_mmlu_full_fil |lm_eval/tasks/global_mmlu/full/fil/_global_mmlu_full_fil.yaml | | |
| |global_mmlu_full_fil_humanities |lm_eval/tasks/global_mmlu/full/fil/_global_mmlu_full_fil_humanities.yaml | | |
| |global_mmlu_full_fil_other |lm_eval/tasks/global_mmlu/full/fil/_global_mmlu_full_fil_other.yaml | | |
| |global_mmlu_full_fil_social_sciences |lm_eval/tasks/global_mmlu/full/fil/_global_mmlu_full_fil_social_sciences.yaml | | |
| |global_mmlu_full_fil_stem |lm_eval/tasks/global_mmlu/full/fil/_global_mmlu_full_fil_stem.yaml | | |
| |global_mmlu_full_fr |lm_eval/tasks/global_mmlu/full/fr/_global_mmlu_full_fr.yaml | | |
| |global_mmlu_full_fr_humanities |lm_eval/tasks/global_mmlu/full/fr/_global_mmlu_full_fr_humanities.yaml | | |
| |global_mmlu_full_fr_other |lm_eval/tasks/global_mmlu/full/fr/_global_mmlu_full_fr_other.yaml | | |
| |global_mmlu_full_fr_social_sciences |lm_eval/tasks/global_mmlu/full/fr/_global_mmlu_full_fr_social_sciences.yaml | | |
| |global_mmlu_full_fr_stem |lm_eval/tasks/global_mmlu/full/fr/_global_mmlu_full_fr_stem.yaml | | |
| |global_mmlu_full_ha |lm_eval/tasks/global_mmlu/full/ha/_global_mmlu_full_ha.yaml | | |
| |global_mmlu_full_ha_humanities |lm_eval/tasks/global_mmlu/full/ha/_global_mmlu_full_ha_humanities.yaml | | |
| |global_mmlu_full_ha_other |lm_eval/tasks/global_mmlu/full/ha/_global_mmlu_full_ha_other.yaml | | |
| |global_mmlu_full_ha_social_sciences |lm_eval/tasks/global_mmlu/full/ha/_global_mmlu_full_ha_social_sciences.yaml | | |
| |global_mmlu_full_ha_stem |lm_eval/tasks/global_mmlu/full/ha/_global_mmlu_full_ha_stem.yaml | | |
| |global_mmlu_full_he |lm_eval/tasks/global_mmlu/full/he/_global_mmlu_full_he.yaml | | |
| |global_mmlu_full_he_humanities |lm_eval/tasks/global_mmlu/full/he/_global_mmlu_full_he_humanities.yaml | | |
| |global_mmlu_full_he_other |lm_eval/tasks/global_mmlu/full/he/_global_mmlu_full_he_other.yaml | | |
| |global_mmlu_full_he_social_sciences |lm_eval/tasks/global_mmlu/full/he/_global_mmlu_full_he_social_sciences.yaml | | |
| |global_mmlu_full_he_stem |lm_eval/tasks/global_mmlu/full/he/_global_mmlu_full_he_stem.yaml | | |
| |global_mmlu_full_hi |lm_eval/tasks/global_mmlu/full/hi/_global_mmlu_full_hi.yaml | | |
| |global_mmlu_full_hi_humanities |lm_eval/tasks/global_mmlu/full/hi/_global_mmlu_full_hi_humanities.yaml | | |
| |global_mmlu_full_hi_other |lm_eval/tasks/global_mmlu/full/hi/_global_mmlu_full_hi_other.yaml | | |
| |global_mmlu_full_hi_social_sciences |lm_eval/tasks/global_mmlu/full/hi/_global_mmlu_full_hi_social_sciences.yaml | | |
| |global_mmlu_full_hi_stem |lm_eval/tasks/global_mmlu/full/hi/_global_mmlu_full_hi_stem.yaml | | |
| |global_mmlu_full_id |lm_eval/tasks/global_mmlu/full/id/_global_mmlu_full_id.yaml | | |
| |global_mmlu_full_id_humanities |lm_eval/tasks/global_mmlu/full/id/_global_mmlu_full_id_humanities.yaml | | |
| |global_mmlu_full_id_other |lm_eval/tasks/global_mmlu/full/id/_global_mmlu_full_id_other.yaml | | |
| |global_mmlu_full_id_social_sciences |lm_eval/tasks/global_mmlu/full/id/_global_mmlu_full_id_social_sciences.yaml | | |
| |global_mmlu_full_id_stem |lm_eval/tasks/global_mmlu/full/id/_global_mmlu_full_id_stem.yaml | | |
| |global_mmlu_full_ig |lm_eval/tasks/global_mmlu/full/ig/_global_mmlu_full_ig.yaml | | |
| |global_mmlu_full_ig_humanities |lm_eval/tasks/global_mmlu/full/ig/_global_mmlu_full_ig_humanities.yaml | | |
| |global_mmlu_full_ig_other |lm_eval/tasks/global_mmlu/full/ig/_global_mmlu_full_ig_other.yaml | | |
| |global_mmlu_full_ig_social_sciences |lm_eval/tasks/global_mmlu/full/ig/_global_mmlu_full_ig_social_sciences.yaml | | |
| |global_mmlu_full_ig_stem |lm_eval/tasks/global_mmlu/full/ig/_global_mmlu_full_ig_stem.yaml | | |
| |global_mmlu_full_it |lm_eval/tasks/global_mmlu/full/it/_global_mmlu_full_it.yaml | | |
| |global_mmlu_full_it_humanities |lm_eval/tasks/global_mmlu/full/it/_global_mmlu_full_it_humanities.yaml | | |
| |global_mmlu_full_it_other |lm_eval/tasks/global_mmlu/full/it/_global_mmlu_full_it_other.yaml | | |
| |global_mmlu_full_it_social_sciences |lm_eval/tasks/global_mmlu/full/it/_global_mmlu_full_it_social_sciences.yaml | | |
| |global_mmlu_full_it_stem |lm_eval/tasks/global_mmlu/full/it/_global_mmlu_full_it_stem.yaml | | |
| |global_mmlu_full_ja |lm_eval/tasks/global_mmlu/full/ja/_global_mmlu_full_ja.yaml | | |
| |global_mmlu_full_ja_humanities |lm_eval/tasks/global_mmlu/full/ja/_global_mmlu_full_ja_humanities.yaml | | |
| |global_mmlu_full_ja_other |lm_eval/tasks/global_mmlu/full/ja/_global_mmlu_full_ja_other.yaml | | |
| |global_mmlu_full_ja_social_sciences |lm_eval/tasks/global_mmlu/full/ja/_global_mmlu_full_ja_social_sciences.yaml | | |
| |global_mmlu_full_ja_stem |lm_eval/tasks/global_mmlu/full/ja/_global_mmlu_full_ja_stem.yaml | | |
| |global_mmlu_full_ko |lm_eval/tasks/global_mmlu/full/ko/_global_mmlu_full_ko.yaml | | |
| |global_mmlu_full_ko_humanities |lm_eval/tasks/global_mmlu/full/ko/_global_mmlu_full_ko_humanities.yaml | | |
| |global_mmlu_full_ko_other |lm_eval/tasks/global_mmlu/full/ko/_global_mmlu_full_ko_other.yaml | | |
| |global_mmlu_full_ko_social_sciences |lm_eval/tasks/global_mmlu/full/ko/_global_mmlu_full_ko_social_sciences.yaml | | |
| |global_mmlu_full_ko_stem |lm_eval/tasks/global_mmlu/full/ko/_global_mmlu_full_ko_stem.yaml | | |
| |global_mmlu_full_ky |lm_eval/tasks/global_mmlu/full/ky/_global_mmlu_full_ky.yaml | | |
| |global_mmlu_full_ky_humanities |lm_eval/tasks/global_mmlu/full/ky/_global_mmlu_full_ky_humanities.yaml | | |
| |global_mmlu_full_ky_other |lm_eval/tasks/global_mmlu/full/ky/_global_mmlu_full_ky_other.yaml | | |
| |global_mmlu_full_ky_social_sciences |lm_eval/tasks/global_mmlu/full/ky/_global_mmlu_full_ky_social_sciences.yaml | | |
| |global_mmlu_full_ky_stem |lm_eval/tasks/global_mmlu/full/ky/_global_mmlu_full_ky_stem.yaml | | |
| |global_mmlu_full_lt |lm_eval/tasks/global_mmlu/full/lt/_global_mmlu_full_lt.yaml | | |
| |global_mmlu_full_lt_humanities |lm_eval/tasks/global_mmlu/full/lt/_global_mmlu_full_lt_humanities.yaml | | |
| |global_mmlu_full_lt_other |lm_eval/tasks/global_mmlu/full/lt/_global_mmlu_full_lt_other.yaml | | |
| |global_mmlu_full_lt_social_sciences |lm_eval/tasks/global_mmlu/full/lt/_global_mmlu_full_lt_social_sciences.yaml | | |
| |global_mmlu_full_lt_stem |lm_eval/tasks/global_mmlu/full/lt/_global_mmlu_full_lt_stem.yaml | | |
| |global_mmlu_full_mg |lm_eval/tasks/global_mmlu/full/mg/_global_mmlu_full_mg.yaml | | |
| |global_mmlu_full_mg_humanities |lm_eval/tasks/global_mmlu/full/mg/_global_mmlu_full_mg_humanities.yaml | | |
| |global_mmlu_full_mg_other |lm_eval/tasks/global_mmlu/full/mg/_global_mmlu_full_mg_other.yaml | | |
| |global_mmlu_full_mg_social_sciences |lm_eval/tasks/global_mmlu/full/mg/_global_mmlu_full_mg_social_sciences.yaml | | |
| |global_mmlu_full_mg_stem |lm_eval/tasks/global_mmlu/full/mg/_global_mmlu_full_mg_stem.yaml | | |
| |global_mmlu_full_ms |lm_eval/tasks/global_mmlu/full/ms/_global_mmlu_full_ms.yaml | | |
| |global_mmlu_full_ms_humanities |lm_eval/tasks/global_mmlu/full/ms/_global_mmlu_full_ms_humanities.yaml | | |
| |global_mmlu_full_ms_other |lm_eval/tasks/global_mmlu/full/ms/_global_mmlu_full_ms_other.yaml | | |
| |global_mmlu_full_ms_social_sciences |lm_eval/tasks/global_mmlu/full/ms/_global_mmlu_full_ms_social_sciences.yaml | | |
| |global_mmlu_full_ms_stem |lm_eval/tasks/global_mmlu/full/ms/_global_mmlu_full_ms_stem.yaml | | |
| |global_mmlu_full_ne |lm_eval/tasks/global_mmlu/full/ne/_global_mmlu_full_ne.yaml | | |
| |global_mmlu_full_ne_humanities |lm_eval/tasks/global_mmlu/full/ne/_global_mmlu_full_ne_humanities.yaml | | |
| |global_mmlu_full_ne_other |lm_eval/tasks/global_mmlu/full/ne/_global_mmlu_full_ne_other.yaml | | |
| |global_mmlu_full_ne_social_sciences |lm_eval/tasks/global_mmlu/full/ne/_global_mmlu_full_ne_social_sciences.yaml | | |
| |global_mmlu_full_ne_stem |lm_eval/tasks/global_mmlu/full/ne/_global_mmlu_full_ne_stem.yaml | | |
| |global_mmlu_full_nl |lm_eval/tasks/global_mmlu/full/nl/_global_mmlu_full_nl.yaml | | |
| |global_mmlu_full_nl_humanities |lm_eval/tasks/global_mmlu/full/nl/_global_mmlu_full_nl_humanities.yaml | | |
| |global_mmlu_full_nl_other |lm_eval/tasks/global_mmlu/full/nl/_global_mmlu_full_nl_other.yaml | | |
| |global_mmlu_full_nl_social_sciences |lm_eval/tasks/global_mmlu/full/nl/_global_mmlu_full_nl_social_sciences.yaml | | |
| |global_mmlu_full_nl_stem |lm_eval/tasks/global_mmlu/full/nl/_global_mmlu_full_nl_stem.yaml | | |
| |global_mmlu_full_ny |lm_eval/tasks/global_mmlu/full/ny/_global_mmlu_full_ny.yaml | | |
| |global_mmlu_full_ny_humanities |lm_eval/tasks/global_mmlu/full/ny/_global_mmlu_full_ny_humanities.yaml | | |
| |global_mmlu_full_ny_other |lm_eval/tasks/global_mmlu/full/ny/_global_mmlu_full_ny_other.yaml | | |
| |global_mmlu_full_ny_social_sciences |lm_eval/tasks/global_mmlu/full/ny/_global_mmlu_full_ny_social_sciences.yaml | | |
| |global_mmlu_full_ny_stem |lm_eval/tasks/global_mmlu/full/ny/_global_mmlu_full_ny_stem.yaml | | |
| |global_mmlu_full_pl |lm_eval/tasks/global_mmlu/full/pl/_global_mmlu_full_pl.yaml | | |
| |global_mmlu_full_pl_humanities |lm_eval/tasks/global_mmlu/full/pl/_global_mmlu_full_pl_humanities.yaml | | |
| |global_mmlu_full_pl_other |lm_eval/tasks/global_mmlu/full/pl/_global_mmlu_full_pl_other.yaml | | |
| |global_mmlu_full_pl_social_sciences |lm_eval/tasks/global_mmlu/full/pl/_global_mmlu_full_pl_social_sciences.yaml | | |
| |global_mmlu_full_pl_stem |lm_eval/tasks/global_mmlu/full/pl/_global_mmlu_full_pl_stem.yaml | | |
| |global_mmlu_full_pt |lm_eval/tasks/global_mmlu/full/pt/_global_mmlu_full_pt.yaml | | |
| |global_mmlu_full_pt_humanities |lm_eval/tasks/global_mmlu/full/pt/_global_mmlu_full_pt_humanities.yaml | | |
| |global_mmlu_full_pt_other |lm_eval/tasks/global_mmlu/full/pt/_global_mmlu_full_pt_other.yaml | | |
| |global_mmlu_full_pt_social_sciences |lm_eval/tasks/global_mmlu/full/pt/_global_mmlu_full_pt_social_sciences.yaml | | |
| |global_mmlu_full_pt_stem |lm_eval/tasks/global_mmlu/full/pt/_global_mmlu_full_pt_stem.yaml | | |
| |global_mmlu_full_ro |lm_eval/tasks/global_mmlu/full/ro/_global_mmlu_full_ro.yaml | | |
| |global_mmlu_full_ro_humanities |lm_eval/tasks/global_mmlu/full/ro/_global_mmlu_full_ro_humanities.yaml | | |
| |global_mmlu_full_ro_other |lm_eval/tasks/global_mmlu/full/ro/_global_mmlu_full_ro_other.yaml | | |
| |global_mmlu_full_ro_social_sciences |lm_eval/tasks/global_mmlu/full/ro/_global_mmlu_full_ro_social_sciences.yaml | | |
| |global_mmlu_full_ro_stem |lm_eval/tasks/global_mmlu/full/ro/_global_mmlu_full_ro_stem.yaml | | |
| |global_mmlu_full_ru |lm_eval/tasks/global_mmlu/full/ru/_global_mmlu_full_ru.yaml | | |
| |global_mmlu_full_ru_humanities |lm_eval/tasks/global_mmlu/full/ru/_global_mmlu_full_ru_humanities.yaml | | |
| |global_mmlu_full_ru_other |lm_eval/tasks/global_mmlu/full/ru/_global_mmlu_full_ru_other.yaml | | |
| |global_mmlu_full_ru_social_sciences |lm_eval/tasks/global_mmlu/full/ru/_global_mmlu_full_ru_social_sciences.yaml | | |
| |global_mmlu_full_ru_stem |lm_eval/tasks/global_mmlu/full/ru/_global_mmlu_full_ru_stem.yaml | | |
| |global_mmlu_full_si |lm_eval/tasks/global_mmlu/full/si/_global_mmlu_full_si.yaml | | |
| |global_mmlu_full_si_humanities |lm_eval/tasks/global_mmlu/full/si/_global_mmlu_full_si_humanities.yaml | | |
| |global_mmlu_full_si_other |lm_eval/tasks/global_mmlu/full/si/_global_mmlu_full_si_other.yaml | | |
| |global_mmlu_full_si_social_sciences |lm_eval/tasks/global_mmlu/full/si/_global_mmlu_full_si_social_sciences.yaml | | |
| |global_mmlu_full_si_stem |lm_eval/tasks/global_mmlu/full/si/_global_mmlu_full_si_stem.yaml | | |
| |global_mmlu_full_sn |lm_eval/tasks/global_mmlu/full/sn/_global_mmlu_full_sn.yaml | | |
| |global_mmlu_full_sn_humanities |lm_eval/tasks/global_mmlu/full/sn/_global_mmlu_full_sn_humanities.yaml | | |
| |global_mmlu_full_sn_other |lm_eval/tasks/global_mmlu/full/sn/_global_mmlu_full_sn_other.yaml | | |
| |global_mmlu_full_sn_social_sciences |lm_eval/tasks/global_mmlu/full/sn/_global_mmlu_full_sn_social_sciences.yaml | | |
| |global_mmlu_full_sn_stem |lm_eval/tasks/global_mmlu/full/sn/_global_mmlu_full_sn_stem.yaml | | |
| |global_mmlu_full_so |lm_eval/tasks/global_mmlu/full/so/_global_mmlu_full_so.yaml | | |
| |global_mmlu_full_so_humanities |lm_eval/tasks/global_mmlu/full/so/_global_mmlu_full_so_humanities.yaml | | |
| |global_mmlu_full_so_other |lm_eval/tasks/global_mmlu/full/so/_global_mmlu_full_so_other.yaml | | |
| |global_mmlu_full_so_social_sciences |lm_eval/tasks/global_mmlu/full/so/_global_mmlu_full_so_social_sciences.yaml | | |
| |global_mmlu_full_so_stem |lm_eval/tasks/global_mmlu/full/so/_global_mmlu_full_so_stem.yaml | | |
| |global_mmlu_full_sr |lm_eval/tasks/global_mmlu/full/sr/_global_mmlu_full_sr.yaml | | |
| |global_mmlu_full_sr_humanities |lm_eval/tasks/global_mmlu/full/sr/_global_mmlu_full_sr_humanities.yaml | | |
| |global_mmlu_full_sr_other |lm_eval/tasks/global_mmlu/full/sr/_global_mmlu_full_sr_other.yaml | | |
| |global_mmlu_full_sr_social_sciences |lm_eval/tasks/global_mmlu/full/sr/_global_mmlu_full_sr_social_sciences.yaml | | |
| |global_mmlu_full_sr_stem |lm_eval/tasks/global_mmlu/full/sr/_global_mmlu_full_sr_stem.yaml | | |
| |global_mmlu_full_sv |lm_eval/tasks/global_mmlu/full/sv/_global_mmlu_full_sv.yaml | | |
| |global_mmlu_full_sv_humanities |lm_eval/tasks/global_mmlu/full/sv/_global_mmlu_full_sv_humanities.yaml | | |
| |global_mmlu_full_sv_other |lm_eval/tasks/global_mmlu/full/sv/_global_mmlu_full_sv_other.yaml | | |
| |global_mmlu_full_sv_social_sciences |lm_eval/tasks/global_mmlu/full/sv/_global_mmlu_full_sv_social_sciences.yaml | | |
| |global_mmlu_full_sv_stem |lm_eval/tasks/global_mmlu/full/sv/_global_mmlu_full_sv_stem.yaml | | |
| |global_mmlu_full_sw |lm_eval/tasks/global_mmlu/full/sw/_global_mmlu_full_sw.yaml | | |
| |global_mmlu_full_sw_humanities |lm_eval/tasks/global_mmlu/full/sw/_global_mmlu_full_sw_humanities.yaml | | |
| |global_mmlu_full_sw_other |lm_eval/tasks/global_mmlu/full/sw/_global_mmlu_full_sw_other.yaml | | |
| |global_mmlu_full_sw_social_sciences |lm_eval/tasks/global_mmlu/full/sw/_global_mmlu_full_sw_social_sciences.yaml | | |
| |global_mmlu_full_sw_stem |lm_eval/tasks/global_mmlu/full/sw/_global_mmlu_full_sw_stem.yaml | | |
| |global_mmlu_full_te |lm_eval/tasks/global_mmlu/full/te/_global_mmlu_full_te.yaml | | |
| |global_mmlu_full_te_humanities |lm_eval/tasks/global_mmlu/full/te/_global_mmlu_full_te_humanities.yaml | | |
| |global_mmlu_full_te_other |lm_eval/tasks/global_mmlu/full/te/_global_mmlu_full_te_other.yaml | | |
| |global_mmlu_full_te_social_sciences |lm_eval/tasks/global_mmlu/full/te/_global_mmlu_full_te_social_sciences.yaml | | |
| |global_mmlu_full_te_stem |lm_eval/tasks/global_mmlu/full/te/_global_mmlu_full_te_stem.yaml | | |
| |global_mmlu_full_tr |lm_eval/tasks/global_mmlu/full/tr/_global_mmlu_full_tr.yaml | | |
| |global_mmlu_full_tr_humanities |lm_eval/tasks/global_mmlu/full/tr/_global_mmlu_full_tr_humanities.yaml | | |
| |global_mmlu_full_tr_other |lm_eval/tasks/global_mmlu/full/tr/_global_mmlu_full_tr_other.yaml | | |
| |global_mmlu_full_tr_social_sciences |lm_eval/tasks/global_mmlu/full/tr/_global_mmlu_full_tr_social_sciences.yaml | | |
| |global_mmlu_full_tr_stem |lm_eval/tasks/global_mmlu/full/tr/_global_mmlu_full_tr_stem.yaml | | |
| |global_mmlu_full_uk |lm_eval/tasks/global_mmlu/full/uk/_global_mmlu_full_uk.yaml | | |
| |global_mmlu_full_uk_humanities |lm_eval/tasks/global_mmlu/full/uk/_global_mmlu_full_uk_humanities.yaml | | |
| |global_mmlu_full_uk_other |lm_eval/tasks/global_mmlu/full/uk/_global_mmlu_full_uk_other.yaml | | |
| |global_mmlu_full_uk_social_sciences |lm_eval/tasks/global_mmlu/full/uk/_global_mmlu_full_uk_social_sciences.yaml | | |
| |global_mmlu_full_uk_stem |lm_eval/tasks/global_mmlu/full/uk/_global_mmlu_full_uk_stem.yaml | | |
| |global_mmlu_full_vi |lm_eval/tasks/global_mmlu/full/vi/_global_mmlu_full_vi.yaml | | |
| |global_mmlu_full_vi_humanities |lm_eval/tasks/global_mmlu/full/vi/_global_mmlu_full_vi_humanities.yaml | | |
| |global_mmlu_full_vi_other |lm_eval/tasks/global_mmlu/full/vi/_global_mmlu_full_vi_other.yaml | | |
| |global_mmlu_full_vi_social_sciences |lm_eval/tasks/global_mmlu/full/vi/_global_mmlu_full_vi_social_sciences.yaml | | |
| |global_mmlu_full_vi_stem |lm_eval/tasks/global_mmlu/full/vi/_global_mmlu_full_vi_stem.yaml | | |
| |global_mmlu_full_yo |lm_eval/tasks/global_mmlu/full/yo/_global_mmlu_full_yo.yaml | | |
| |global_mmlu_full_yo_humanities |lm_eval/tasks/global_mmlu/full/yo/_global_mmlu_full_yo_humanities.yaml | | |
| |global_mmlu_full_yo_other |lm_eval/tasks/global_mmlu/full/yo/_global_mmlu_full_yo_other.yaml | | |
| |global_mmlu_full_yo_social_sciences |lm_eval/tasks/global_mmlu/full/yo/_global_mmlu_full_yo_social_sciences.yaml | | |
| |global_mmlu_full_yo_stem |lm_eval/tasks/global_mmlu/full/yo/_global_mmlu_full_yo_stem.yaml | | |
| |global_mmlu_full_zh |lm_eval/tasks/global_mmlu/full/zh/_global_mmlu_full_zh.yaml | | |
| |global_mmlu_full_zh_humanities |lm_eval/tasks/global_mmlu/full/zh/_global_mmlu_full_zh_humanities.yaml | | |
| |global_mmlu_full_zh_other |lm_eval/tasks/global_mmlu/full/zh/_global_mmlu_full_zh_other.yaml | | |
| |global_mmlu_full_zh_social_sciences |lm_eval/tasks/global_mmlu/full/zh/_global_mmlu_full_zh_social_sciences.yaml | | |
| |global_mmlu_full_zh_stem |lm_eval/tasks/global_mmlu/full/zh/_global_mmlu_full_zh_stem.yaml | | |
| |global_mmlu_hi |lm_eval/tasks/global_mmlu/default/hi/_global_mmlu_hi.yaml | | |
| |global_mmlu_id |lm_eval/tasks/global_mmlu/default/id/_global_mmlu_id.yaml | | |
| |global_mmlu_it |lm_eval/tasks/global_mmlu/default/it/_global_mmlu_it.yaml | | |
| |global_mmlu_ja |lm_eval/tasks/global_mmlu/default/ja/_global_mmlu_ja.yaml | | |
| |global_mmlu_ko |lm_eval/tasks/global_mmlu/default/ko/_global_mmlu_ko.yaml | | |
| |global_mmlu_pt |lm_eval/tasks/global_mmlu/default/pt/_global_mmlu_pt.yaml | | |
| |global_mmlu_sw |lm_eval/tasks/global_mmlu/default/sw/_global_mmlu_sw.yaml | | |
| |global_mmlu_yo |lm_eval/tasks/global_mmlu/default/yo/_global_mmlu_yo.yaml | | |
| |global_mmlu_zh |lm_eval/tasks/global_mmlu/default/zh/_global_mmlu_zh.yaml | | |
| |haerae |lm_eval/tasks/haerae/_haerae.yaml | | |
| |hendrycks_math |lm_eval/tasks/hendrycks_math/hendrycks_math.yaml | | |
| |hrm8k |lm_eval/tasks/hrm8k/default/hrm8k.yaml | | |
| |hrm8k_en |lm_eval/tasks/hrm8k/en/hrm8k_en.yaml | | |
| |include_base_44_albanian |lm_eval/tasks/include/default/Albanian/_include_base_44_albanian.yaml | | |
| |include_base_44_arabic |lm_eval/tasks/include/default/Arabic/_include_base_44_arabic.yaml | | |
| |include_base_44_armenian |lm_eval/tasks/include/default/Armenian/_include_base_44_armenian.yaml | | |
| |include_base_44_azerbaijani |lm_eval/tasks/include/default/Azerbaijani/_include_base_44_azerbaijani.yaml | | |
| |include_base_44_basque |lm_eval/tasks/include/default/Basque/_include_base_44_basque.yaml | | |
| |include_base_44_belarusian |lm_eval/tasks/include/default/Belarusian/_include_base_44_belarusian.yaml | | |
| |include_base_44_bengali |lm_eval/tasks/include/default/Bengali/_include_base_44_bengali.yaml | | |
| |include_base_44_bulgarian |lm_eval/tasks/include/default/Bulgarian/_include_base_44_bulgarian.yaml | | |
| |include_base_44_chinese |lm_eval/tasks/include/default/Chinese/_include_base_44_chinese.yaml | | |
| |include_base_44_croatian |lm_eval/tasks/include/default/Croatian/_include_base_44_croatian.yaml | | |
| |include_base_44_dutch |lm_eval/tasks/include/default/Dutch/_include_base_44_dutch.yaml | | |
| |include_base_44_estonian |lm_eval/tasks/include/default/Estonian/_include_base_44_estonian.yaml | | |
| |include_base_44_finnish |lm_eval/tasks/include/default/Finnish/_include_base_44_finnish.yaml | | |
| |include_base_44_french |lm_eval/tasks/include/default/French/_include_base_44_french.yaml | | |
| |include_base_44_georgian |lm_eval/tasks/include/default/Georgian/_include_base_44_georgian.yaml | | |
| |include_base_44_german |lm_eval/tasks/include/default/German/_include_base_44_german.yaml | | |
| |include_base_44_greek |lm_eval/tasks/include/default/Greek/_include_base_44_greek.yaml | | |
| |include_base_44_hebrew |lm_eval/tasks/include/default/Hebrew/_include_base_44_hebrew.yaml | | |
| |include_base_44_hindi |lm_eval/tasks/include/default/Hindi/_include_base_44_hindi.yaml | | |
| |include_base_44_hungarian |lm_eval/tasks/include/default/Hungarian/_include_base_44_hungarian.yaml | | |
| |include_base_44_indonesian |lm_eval/tasks/include/default/Indonesian/_include_base_44_indonesian.yaml | | |
| |include_base_44_italian |lm_eval/tasks/include/default/Italian/_include_base_44_italian.yaml | | |
| |include_base_44_japanese |lm_eval/tasks/include/default/Japanese/_include_base_44_japanese.yaml | | |
| |include_base_44_kazakh |lm_eval/tasks/include/default/Kazakh/_include_base_44_kazakh.yaml | | |
| |include_base_44_korean |lm_eval/tasks/include/default/Korean/_include_base_44_korean.yaml | | |
| |include_base_44_lithuanian |lm_eval/tasks/include/default/Lithuanian/_include_base_44_lithuanian.yaml | | |
| |include_base_44_malay |lm_eval/tasks/include/default/Malay/_include_base_44_malay.yaml | | |
| |include_base_44_malayalam |lm_eval/tasks/include/default/Malayalam/_include_base_44_malayalam.yaml | | |
| |include_base_44_nepali |lm_eval/tasks/include/default/Nepali/_include_base_44_nepali.yaml | | |
| |include_base_44_north macedonian |lm_eval/tasks/include/default/North Macedonian/_include_base_44_north macedonian.yaml | | |
| |include_base_44_persian |lm_eval/tasks/include/default/Persian/_include_base_44_persian.yaml | | |
| |include_base_44_polish |lm_eval/tasks/include/default/Polish/_include_base_44_polish.yaml | | |
| |include_base_44_portuguese |lm_eval/tasks/include/default/Portuguese/_include_base_44_portuguese.yaml | | |
| |include_base_44_russian |lm_eval/tasks/include/default/Russian/_include_base_44_russian.yaml | | |
| |include_base_44_serbian |lm_eval/tasks/include/default/Serbian/_include_base_44_serbian.yaml | | |
| |include_base_44_spanish |lm_eval/tasks/include/default/Spanish/_include_base_44_spanish.yaml | | |
| |include_base_44_tagalog |lm_eval/tasks/include/default/Tagalog/_include_base_44_tagalog.yaml | | |
| |include_base_44_tamil |lm_eval/tasks/include/default/Tamil/_include_base_44_tamil.yaml | | |
| |include_base_44_telugu |lm_eval/tasks/include/default/Telugu/_include_base_44_telugu.yaml | | |
| |include_base_44_turkish |lm_eval/tasks/include/default/Turkish/_include_base_44_turkish.yaml | | |
| |include_base_44_ukrainian |lm_eval/tasks/include/default/Ukrainian/_include_base_44_ukrainian.yaml | | |
| |include_base_44_urdu |lm_eval/tasks/include/default/Urdu/_include_base_44_urdu.yaml | | |
| |include_base_44_uzbek |lm_eval/tasks/include/default/Uzbek/_include_base_44_uzbek.yaml | | |
| |include_base_44_vietnamese |lm_eval/tasks/include/default/Vietnamese/_include_base_44_vietnamese.yaml | | |
| |injongointent |lm_eval/tasks/afrobench/injongointent/injongointent.yaml | | |
| |japanese_leaderboard |lm_eval/tasks/japanese_leaderboard/_ja_leaderboard.yaml | | |
| |kmmlu |lm_eval/tasks/kmmlu/default/_kmmlu_default.yaml | | |
| |kmmlu_applied_science |lm_eval/tasks/kmmlu/default/_kmmlu_applied_science.yaml | | |
| |kmmlu_cot_hard |lm_eval/tasks/kmmlu/cot_hard/_kmmlu_cot_hard.yaml | | |
| |kmmlu_cot_hard_applied_science |lm_eval/tasks/kmmlu/cot_hard/_kmmlu_cot_hard_applied_science.yaml | | |
| |kmmlu_cot_hard_humss |lm_eval/tasks/kmmlu/cot_hard/_kmmlu_cot_hard_humss.yaml | | |
| |kmmlu_cot_hard_other |lm_eval/tasks/kmmlu/cot_hard/_kmmlu_cot_hard_other.yaml | | |
| |kmmlu_cot_hard_stem |lm_eval/tasks/kmmlu/cot_hard/_kmmlu_cot_hard_stem.yaml | | |
| |kmmlu_direct |lm_eval/tasks/kmmlu/direct/_kmmlu_direct.yaml | | |
| |kmmlu_direct_applied_science |lm_eval/tasks/kmmlu/direct/_kmmlu_direct_applied_science.yaml | | |
| |kmmlu_direct_hard |lm_eval/tasks/kmmlu/direct_hard/_kmmlu_direct_hard.yaml | | |
| |kmmlu_direct_hard_applied_science |lm_eval/tasks/kmmlu/direct_hard/_kmmlu_direct_hard_applied_science.yaml | | |
| |kmmlu_direct_hard_humss |lm_eval/tasks/kmmlu/direct_hard/_kmmlu_direct_hard_humss.yaml | | |
| |kmmlu_direct_hard_other |lm_eval/tasks/kmmlu/direct_hard/_kmmlu_direct_hard_other.yaml | | |
| |kmmlu_direct_hard_stem |lm_eval/tasks/kmmlu/direct_hard/_kmmlu_direct_hard_stem.yaml | | |
| |kmmlu_direct_humss |lm_eval/tasks/kmmlu/direct/_kmmlu_direct_humss.yaml | | |
| |kmmlu_direct_other |lm_eval/tasks/kmmlu/direct/_kmmlu_direct_other.yaml | | |
| |kmmlu_direct_stem |lm_eval/tasks/kmmlu/direct/_kmmlu_direct_stem.yaml | | |
| |kmmlu_hard |lm_eval/tasks/kmmlu/hard/_kmmlu_hard.yaml | | |
| |kmmlu_hard_applied_science |lm_eval/tasks/kmmlu/hard/_kmmlu_hard_applied_science.yaml | | |
| |kmmlu_hard_humss |lm_eval/tasks/kmmlu/hard/_kmmlu_hard_humss.yaml | | |
| |kmmlu_hard_other |lm_eval/tasks/kmmlu/hard/_kmmlu_hard_other.yaml | | |
| |kmmlu_hard_stem |lm_eval/tasks/kmmlu/hard/_kmmlu_hard_stem.yaml | | |
| |kmmlu_humss |lm_eval/tasks/kmmlu/default/_kmmlu_humss.yaml | | |
| |kmmlu_other |lm_eval/tasks/kmmlu/default/_kmmlu_other.yaml | | |
| |kmmlu_stem |lm_eval/tasks/kmmlu/default/_kmmlu_stem.yaml | | |
| |kobest |lm_eval/tasks/kobest/_kobest.yaml | | |
| |kormedmcqa |lm_eval/tasks/kormedmcqa/_kormedmcqa.yaml | | |
| |leaderboard |lm_eval/tasks/leaderboard/leaderboard.yaml | | |
| |leaderboard_bbh |lm_eval/tasks/leaderboard/bbh_mc/_leaderboard_bbh.yaml | | |
| |leaderboard_gpqa |lm_eval/tasks/leaderboard/gpqa/_leaderboard_gpqa.yaml | | |
| |leaderboard_instruction_following |lm_eval/tasks/leaderboard/ifeval/_leaderboard_instruction_following.yaml | | |
| |leaderboard_math_hard |lm_eval/tasks/leaderboard/math/_leaderboard_math.yaml | | |
| |leaderboard_musr |lm_eval/tasks/leaderboard/musr/_musr.yaml | | |
| |lingoly |lm_eval/tasks/lingoly/lingoly_group.yaml | | |
| |mafand |lm_eval/tasks/afrobench/mafand/mafand.yaml | | |
| |masakhaner |lm_eval/tasks/afrobench/masakhaner/masakhaner.yaml | | |
| |masakhanews |lm_eval/tasks/afrobench/masakhanews/masakhanews.yaml | | |
| |masakhapos |lm_eval/tasks/afrobench/masakhapos/masakhapos.yaml | | |
| |med_concepts_qa |lm_eval/tasks/med_concepts_qa/_med_concepts_qa.yaml | | |
| |med_concepts_qa_atc |lm_eval/tasks/med_concepts_qa/_med_concepts_qa_atc.yaml | | |
| |med_concepts_qa_icd10cm |lm_eval/tasks/med_concepts_qa/_med_concepts_qa_icd10cm.yaml | | |
| |med_concepts_qa_icd10proc |lm_eval/tasks/med_concepts_qa/_med_concepts_qa_icd10proc.yaml | | |
| |med_concepts_qa_icd9cm |lm_eval/tasks/med_concepts_qa/_med_concepts_qa_icd9cm.yaml | | |
| |med_concepts_qa_icd9proc |lm_eval/tasks/med_concepts_qa/_med_concepts_qa_icd9proc.yaml | | |
| |mela |lm_eval/tasks/mela/_mela.yaml | | |
| |metabench |lm_eval/tasks/metabench/metabench.yaml | | |
| |metabench_permute |lm_eval/tasks/metabench/metabench_permute.yaml | | |
| |metabench_secondary |lm_eval/tasks/metabench/metabench_secondary.yaml | | |
| |metabench_secondary_permute |lm_eval/tasks/metabench/metabench_secondary_permute.yaml | | |
| |minerva_math |lm_eval/tasks/benchmarks/minerva_math.yaml | | |
| |mmlu |lm_eval/tasks/mmlu/default/_mmlu.yaml | | |
| |mmlu_continuation |lm_eval/tasks/mmlu/continuation/_mmlu.yaml | | |
| |mmlu_cot_llama |lm_eval/tasks/llama3/instruct/mmlu_cot/_mmlu_cot_llama.yaml | | |
| |mmlu_cot_llama_humanities |lm_eval/tasks/llama3/instruct/mmlu_cot/_mmlu_humanities.yaml | | |
| |mmlu_cot_llama_other |lm_eval/tasks/llama3/instruct/mmlu_cot/_mmlu_other.yaml | | |
| |mmlu_cot_llama_social_sciences |lm_eval/tasks/llama3/instruct/mmlu_cot/_mmlu_social_sciences.yaml | | |
| |mmlu_cot_llama_stem |lm_eval/tasks/llama3/instruct/mmlu_cot/_mmlu_stem.yaml | | |
| |mmlu_de_llama |lm_eval/tasks/llama3/instruct/mmlu_de/_mmlu_de_llama.yaml | | |
| |mmlu_de_llama_humanities |lm_eval/tasks/llama3/instruct/mmlu_de/_mmlu_de_humanities.yaml | | |
| |mmlu_de_llama_other |lm_eval/tasks/llama3/instruct/mmlu_de/_mmlu_de_other.yaml | | |
| |mmlu_de_llama_social_sciences |lm_eval/tasks/llama3/instruct/mmlu_de/_mmlu_de_social_sciences.yaml | | |
| |mmlu_de_llama_stem |lm_eval/tasks/llama3/instruct/mmlu_de/_mmlu_de_stem.yaml | | |
| |mmlu_es_llama |lm_eval/tasks/llama3/instruct/mmlu_es/_mmlu_es_llama.yaml | | |
| |mmlu_es_llama_humanities |lm_eval/tasks/llama3/instruct/mmlu_es/_mmlu_es_humanities.yaml | | |
| |mmlu_es_llama_other |lm_eval/tasks/llama3/instruct/mmlu_es/_mmlu_es_other.yaml | | |
| |mmlu_es_llama_social_sciences |lm_eval/tasks/llama3/instruct/mmlu_es/_mmlu_es_social_sciences.yaml | | |
| |mmlu_es_llama_stem |lm_eval/tasks/llama3/instruct/mmlu_es/_mmlu_es_stem.yaml | | |
| |mmlu_flan_cot_fewshot |lm_eval/tasks/mmlu/flan_cot_fewshot/_mmlu.yaml | | |
| |mmlu_flan_cot_zeroshot |lm_eval/tasks/mmlu/flan_cot_zeroshot/_mmlu.yaml | | |
| |mmlu_flan_n_shot_generative |lm_eval/tasks/mmlu/flan_n_shot/generative/_mmlu.yaml | | |
| |mmlu_flan_n_shot_loglikelihood |lm_eval/tasks/mmlu/flan_n_shot/loglikelihood/_mmlu.yaml | | |
| |mmlu_fr_llama |lm_eval/tasks/llama3/instruct/mmlu_fr/_mmlu_fr_llama.yaml | | |
| |mmlu_fr_llama_humanities |lm_eval/tasks/llama3/instruct/mmlu_fr/_mmlu_fr_humanities.yaml | | |
| |mmlu_fr_llama_other |lm_eval/tasks/llama3/instruct/mmlu_fr/_mmlu_fr_other.yaml | | |
| |mmlu_fr_llama_social_sciences |lm_eval/tasks/llama3/instruct/mmlu_fr/_mmlu_fr_social_sciences.yaml | | |
| |mmlu_fr_llama_stem |lm_eval/tasks/llama3/instruct/mmlu_fr/_mmlu_fr_stem.yaml | | |
| |mmlu_generative |lm_eval/tasks/mmlu/generative/_mmlu.yaml | | |
| |mmlu_hi_llama |lm_eval/tasks/llama3/instruct/mmlu_hi/_mmlu_hi_llama.yaml | | |
| |mmlu_hi_llama_humanities |lm_eval/tasks/llama3/instruct/mmlu_hi/_mmlu_hi_humanities.yaml | | |
| |mmlu_hi_llama_other |lm_eval/tasks/llama3/instruct/mmlu_hi/_mmlu_hi_other.yaml | | |
| |mmlu_hi_llama_social_sciences |lm_eval/tasks/llama3/instruct/mmlu_hi/_mmlu_hi_social_sciences.yaml | | |
| |mmlu_hi_llama_stem |lm_eval/tasks/llama3/instruct/mmlu_hi/_mmlu_hi_stem.yaml | | |
| |mmlu_humanities |lm_eval/tasks/mmlu/default/_mmlu_humanities.yaml | | |
| |mmlu_it_llama |lm_eval/tasks/llama3/instruct/mmlu_it/_mmlu_it_llama.yaml | | |
| |mmlu_it_llama_humanities |lm_eval/tasks/llama3/instruct/mmlu_it/_mmlu_it_humanities.yaml | | |
| |mmlu_it_llama_other |lm_eval/tasks/llama3/instruct/mmlu_it/_mmlu_it_other.yaml | | |
| |mmlu_it_llama_social_sciences |lm_eval/tasks/llama3/instruct/mmlu_it/_mmlu_it_social_sciences.yaml | | |
| |mmlu_it_llama_stem |lm_eval/tasks/llama3/instruct/mmlu_it/_mmlu_it_stem.yaml | | |
| |mmlu_llama |lm_eval/tasks/llama3/instruct/mmlu/llama.yaml | | |
| |mmlu_llama_humanities |lm_eval/tasks/llama3/instruct/mmlu/_mmlu_humanities.yaml | | |
| |mmlu_llama_other |lm_eval/tasks/llama3/instruct/mmlu/_mmlu_other.yaml | | |
| |mmlu_llama_social_sciences |lm_eval/tasks/llama3/instruct/mmlu/_mmlu_social_sciences.yaml | | |
| |mmlu_llama_stem |lm_eval/tasks/llama3/instruct/mmlu/_mmlu_stem.yaml | | |
| |mmlu_other |lm_eval/tasks/mmlu/default/_mmlu_other.yaml | | |
| |mmlu_pro |lm_eval/tasks/mmlu_pro/_mmlu_pro.yaml | | |
| |mmlu_pro_llama |lm_eval/tasks/llama3/instruct/mmlu_pro/_mmlu_pro.yaml | | |
| |mmlu_pro_plus |lm_eval/tasks/mmlu-pro-plus/_mmlu_pro_plus.yaml | | |
| |mmlu_prox_ar |lm_eval/tasks/mmlu_prox/ar/_mmlu_prox_ar.yaml | | |
| |mmlu_prox_bn |lm_eval/tasks/mmlu_prox/bn/_mmlu_prox_bn.yaml | | |
| |mmlu_prox_de |lm_eval/tasks/mmlu_prox/de/_mmlu_prox_de.yaml | | |
| |mmlu_prox_en |lm_eval/tasks/mmlu_prox/en/_mmlu_prox_en.yaml | | |
| |mmlu_prox_es |lm_eval/tasks/mmlu_prox/es/_mmlu_prox_es.yaml | | |
| |mmlu_prox_fr |lm_eval/tasks/mmlu_prox/fr/_mmlu_prox_fr.yaml | | |
| |mmlu_prox_hi |lm_eval/tasks/mmlu_prox/hi/_mmlu_prox_hi.yaml | | |
| |mmlu_prox_ja |lm_eval/tasks/mmlu_prox/ja/_mmlu_prox_ja.yaml | | |
| |mmlu_prox_ko |lm_eval/tasks/mmlu_prox/ko/_mmlu_prox_ko.yaml | | |
| |mmlu_prox_pt |lm_eval/tasks/mmlu_prox/pt/_mmlu_prox_pt.yaml | | |
| |mmlu_prox_sw |lm_eval/tasks/mmlu_prox/sw/_mmlu_prox_sw.yaml | | |
| |mmlu_prox_th |lm_eval/tasks/mmlu_prox/th/_mmlu_prox_th.yaml | | |
| |mmlu_prox_zh |lm_eval/tasks/mmlu_prox/zh/_mmlu_prox_zh.yaml | | |
| |mmlu_pt_llama |lm_eval/tasks/llama3/instruct/mmlu_pt/_mmlu_pt_llama.yaml | | |
| |mmlu_pt_llama_humanities |lm_eval/tasks/llama3/instruct/mmlu_pt/_mmlu_pt_humanities.yaml | | |
| |mmlu_pt_llama_other |lm_eval/tasks/llama3/instruct/mmlu_pt/_mmlu_pt_other.yaml | | |
| |mmlu_pt_llama_social_sciences |lm_eval/tasks/llama3/instruct/mmlu_pt/_mmlu_pt_social_sciences.yaml | | |
| |mmlu_pt_llama_stem |lm_eval/tasks/llama3/instruct/mmlu_pt/_mmlu_pt_stem.yaml | | |
| |mmlu_social_sciences |lm_eval/tasks/mmlu/default/_mmlu_social_sciences.yaml | | |
| |mmlu_stem |lm_eval/tasks/mmlu/default/_mmlu_stem.yaml | | |
| |mmlu_th_llama |lm_eval/tasks/llama3/instruct/mmlu_th/_mmlu_th_llama.yaml | | |
| |mmlu_th_llama_humanities |lm_eval/tasks/llama3/instruct/mmlu_th/_mmlu_th_humanities.yaml | | |
| |mmlu_th_llama_other |lm_eval/tasks/llama3/instruct/mmlu_th/_mmlu_th_other.yaml | | |
| |mmlu_th_llama_social_sciences |lm_eval/tasks/llama3/instruct/mmlu_th/_mmlu_th_social_sciences.yaml | | |
| |mmlu_th_llama_stem |lm_eval/tasks/llama3/instruct/mmlu_th/_mmlu_th_stem.yaml | | |
| |mmlusr |lm_eval/tasks/mmlusr/question_and_answer/_question_and_answer.yaml | | |
| |mmlusr_answer_only |lm_eval/tasks/mmlusr/answer_only/_answer_only.yaml | | |
| |mmlusr_question_only |lm_eval/tasks/mmlusr/question_only/_question_only.yaml | | |
| |mmmu_val |lm_eval/tasks/mmmu/_mmmu.yaml | | |
| |mmmu_val_art_and_design |lm_eval/tasks/mmmu/_art_and_design.yaml | | |
| |mmmu_val_business |lm_eval/tasks/mmmu/_business.yaml | | |
| |mmmu_val_health_and_medicine |lm_eval/tasks/mmmu/_health_and_medicine.yaml | | |
| |mmmu_val_humanities_and_social_science |lm_eval/tasks/mmmu/_humanities_and_social_sciences.yaml | | |
| |mmmu_val_science |lm_eval/tasks/mmmu/_science.yaml | | |
| |mmmu_val_tech_and_engineering |lm_eval/tasks/mmmu/_tech_and_engineering.yaml | | |
| |multimedqa |lm_eval/tasks/benchmarks/multimedqa/multimedqa.yaml | | |
| |naijarc |lm_eval/tasks/afrobench/naijarc/naijarc.yaml | | |
| |nollysenti |lm_eval/tasks/afrobench/nollysenti/nollysenti.yaml | | |
| |openai_mmlu |lm_eval/tasks/afrobench/openai_mmlu/openai_mmlu.yaml | | |
| |openllm |lm_eval/tasks/benchmarks/openllm.yaml | | |
| |pawsx |lm_eval/tasks/paws-x/_pawsx.yaml | | |
| |portuguese_bench |lm_eval/tasks/portuguese_bench/portuguese_bench.yaml | | |
| |pythia |lm_eval/tasks/benchmarks/pythia.yaml | | |
| |ruler |lm_eval/tasks/ruler/ruler.yaml | | |
| |salt |lm_eval/tasks/afrobench/salt/salt.yaml | | |
| |score_non_greedy_robustness_agieval |lm_eval/tasks/score/agi_eval/score_non_greedy_robustness_agieval.yaml | | |
| |score_non_greedy_robustness_math |lm_eval/tasks/score/math/score_non_greedy_robustness_math.yaml | | |
| |score_option_order_robustness_agieval |lm_eval/tasks/score/agi_eval/score_option_order_robustness_agieval.yaml | | |
| |score_prompt_robustness_agieval |lm_eval/tasks/score/agi_eval/score_prompt_robustness_agieval.yaml | | |
| |score_prompt_robustness_math |lm_eval/tasks/score/math/score_prompt_robustness_math.yaml | | |
| |score_robustness |lm_eval/tasks/score/score_robustness.yaml | | |
| |score_robustness_agieval |lm_eval/tasks/score/agi_eval/score_robustness_agieval.yaml | | |
| |score_robustness_math |lm_eval/tasks/score/math/score_robustness_math.yaml | | |
| |sib |lm_eval/tasks/afrobench/sib/sib.yaml | | |
| |spanish_bench |lm_eval/tasks/spanish_bench/spanish_bench.yaml | | |
| |t0_eval |lm_eval/tasks/benchmarks/t0_eval.yaml | | |
| |tinyBenchmarks |lm_eval/tasks/tinyBenchmarks/tinyBenchmarks.yaml | | |
| |tmlu |lm_eval/tasks/tmlu/default/_tmlu.yaml | | |
| |tmmluplus |lm_eval/tasks/tmmluplus/default/_tmmluplus.yaml | | |
| |tmmluplus_STEM |lm_eval/tasks/tmmluplus/default/_tmmluplus_STEM.yaml | | |
| |tmmluplus_humanities |lm_eval/tasks/tmmluplus/default/_tmmluplus_humanities.yaml | | |
| |tmmluplus_other |lm_eval/tasks/tmmluplus/default/_tmmluplus_other.yaml | | |
| |tmmluplus_social_sciences |lm_eval/tasks/tmmluplus/default/_tmmluplus_social_sciences.yaml | | |
| |uhura_arc_easy |lm_eval/tasks/afrobench/uhura-arc-easy/uhura.yaml | | |
| |wmdp |lm_eval/tasks/wmdp/_wmdp.yaml | | |
| |xcopa |lm_eval/tasks/xcopa/_xcopa.yaml | | |
| |xlum |lm_eval/tasks/afrobench/xlsum/xlsum.yaml | | |
| |xnli |lm_eval/tasks/xnli/_xnli.yaml | | |
| |xstorycloze |lm_eval/tasks/xstorycloze/_xstorycloze.yaml | | |
| |xwinograd |lm_eval/tasks/xwinograd/_xwinograd.yaml | | |
| | Tag | | |
| |------------------------------------------------| | |
| |AraDiCE_ArabicMMLU_humanities_egy | | |
| |AraDiCE_ArabicMMLU_humanities_lev | | |
| |AraDiCE_ArabicMMLU_language_egy | | |
| |AraDiCE_ArabicMMLU_language_lev | | |
| |AraDiCE_ArabicMMLU_other_egy | | |
| |AraDiCE_ArabicMMLU_other_lev | | |
| |AraDiCE_ArabicMMLU_social-science_egy | | |
| |AraDiCE_ArabicMMLU_social-science_lev | | |
| |AraDiCE_ArabicMMLU_stem_egy | | |
| |AraDiCE_ArabicMMLU_stem_lev | | |
| |RC_tasks | | |
| |acp_bench | | |
| |acp_bench_hard | | |
| |acp_bench_hard_with_pddl | | |
| |acp_bool_cot_2shot | | |
| |acp_gen_2shot | | |
| |acp_gen_2shot_with_pddl | | |
| |acp_mcq_cot_2shot | | |
| |adr_prompt_1 | | |
| |adr_prompt_2 | | |
| |adr_prompt_3 | | |
| |adr_prompt_4 | | |
| |adr_prompt_5 | | |
| |adr_tasks | | |
| |advanced_ai_risk | | |
| |african_flores_tasks | | |
| |afrimgsm_cot_tasks | | |
| |afrimgsm_cot_tasks_prompt_1 | | |
| |afrimgsm_cot_tasks_prompt_2 | | |
| |afrimgsm_cot_tasks_prompt_3 | | |
| |afrimgsm_cot_tasks_prompt_4 | | |
| |afrimgsm_cot_tasks_prompt_5 | | |
| |afrimgsm_tasks | | |
| |afrimgsm_tasks_prompt_1 | | |
| |afrimgsm_tasks_prompt_3 | | |
| |afrimgsm_tasks_prompt_4 | | |
| |afrimgsm_tasks_prompt_5 | | |
| |afrimgsm_tt_cot_tasks | | |
| |afrimgsm_tt_tasks | | |
| |afrimmlu_tasks | | |
| |afrimmlu_tasks_prompt_1 | | |
| |afrimmlu_tasks_prompt_2 | | |
| |afrimmlu_tasks_prompt_3 | | |
| |afrimmlu_tasks_prompt_4 | | |
| |afrimmlu_tasks_prompt_5 | | |
| |afrimmlu_tt_tasks | | |
| |afriqa_prompt_1 | | |
| |afriqa_prompt_2 | | |
| |afriqa_prompt_3 | | |
| |afriqa_prompt_4 | | |
| |afriqa_prompt_5 | | |
| |afrisent_prompt_2 | | |
| |afrisenti_prompt_1 | | |
| |afrisenti_prompt_3 | | |
| |afrisenti_prompt_4 | | |
| |afrisenti_prompt_5 | | |
| |afrixnli | | |
| |afrixnli_en_direct | | |
| |afrixnli_manual_direct | | |
| |afrixnli_native_direct | | |
| |afrixnli_tasks | | |
| |afrixnli_tasks_prompt_1 | | |
| |afrixnli_tasks_prompt_2 | | |
| |afrixnli_tasks_prompt_3 | | |
| |afrixnli_tasks_prompt_4 | | |
| |afrixnli_tasks_prompt_5 | | |
| |afrixnli_translate | | |
| |afrixnli_tt_tasks | | |
| |afrobench_MT_tasks | | |
| |afrobench_TC_tasks | | |
| |afrobench_mmlu_tasks | | |
| |afrobench_sentiment_tasks | | |
| |afrobench_xqa_tasks | | |
| |ai2_arc | | |
| |anli | | |
| |arab_culture_completion_gulf_tasks | | |
| |arab_culture_completion_levant_tasks | | |
| |arab_culture_completion_nile_valley_tasks | | |
| |arab_culture_completion_north_africa_tasks | | |
| |arab_culture_gulf_tasks | | |
| |arab_culture_levant_tasks | | |
| |arab_culture_nile_valley_tasks | | |
| |arab_culture_north_africa_tasks | | |
| |arabicmmlu_humanities_tasks | | |
| |arabicmmlu_language_tasks | | |
| |arabicmmlu_other_tasks | | |
| |arabicmmlu_social_science_tasks | | |
| |arabicmmlu_stem_tasks | | |
| |arc_challenge_mt | | |
| |arc_multilingual | | |
| |arithmetic | | |
| |ask_gec | | |
| |basque-glue | | |
| |belebele_prompt_1 | | |
| |belebele_prompt_2 | | |
| |belebele_prompt_3 | | |
| |belebele_prompt_4 | | |
| |belebele_prompt_5 | | |
| |belebele_tasks | | |
| |bertaqa | | |
| |bigbench_generate_until | | |
| |bigbench_multiple_choice_a | | |
| |bigbench_multiple_choice_b | | |
| |cabreu | | |
| |chain_of_thought | | |
| |copal_id | | |
| |crows_pairs | | |
| |darija_sentiment_tasks | | |
| |darija_translation_tasks_doda | | |
| |darija_translation_tasks_flores | | |
| |darija_translation_tasks_madar | | |
| |darija_translation_tasks_seed | | |
| |darija_transliteration_tasks | | |
| |darijammlu_ar_mmlu_tasks | | |
| |darijammlu_mmlu_tasks | | |
| |eus_exams_es | | |
| |eus_exams_eu | | |
| |evalita-mp_at_tasks | | |
| |evalita-mp_faq_tasks | | |
| |evalita-mp_hs_tasks | | |
| |evalita-mp_ls_tasks | | |
| |evalita-mp_ner-v2_tasks_adg | | |
| |evalita-mp_ner-v2_tasks_fic | | |
| |evalita-mp_ner-v2_tasks_wn | | |
| |evalita-mp_ner_tasks_adg | | |
| |evalita-mp_ner_tasks_fic | | |
| |evalita-mp_ner_tasks_wn | | |
| |evalita-mp_re_tasks | | |
| |evalita-mp_sa_tasks | | |
| |evalita-mp_sum_fp-small_tasks | | |
| |evalita-mp_sum_fp_tasks | | |
| |evalita-mp_te_tasks | | |
| |evalita-mp_wic_tasks | | |
| |flores | | |
| |flores_afr-eng | | |
| |flores_afr-eng_prompt_1 | | |
| |flores_afr-eng_prompt_2 | | |
| |flores_afr-eng_prompt_3 | | |
| |flores_eng-afr | | |
| |flores_eng-afr_prompt_1 | | |
| |flores_eng-afr_prompt_2 | | |
| |flores_eng-afr_prompt_3 | | |
| |freebase | | |
| |french_bench | | |
| |french_bench_extra | | |
| |french_bench_gen | | |
| |french_bench_mc | | |
| |french_bench_perplexity | | |
| |global_mmlu_full_am_humanities_tasks | | |
| |global_mmlu_full_am_other_tasks | | |
| |global_mmlu_full_am_social_sciences_tasks | | |
| |global_mmlu_full_am_stem_tasks | | |
| |global_mmlu_full_ar_humanities_tasks | | |
| |global_mmlu_full_ar_other_tasks | | |
| |global_mmlu_full_ar_social_sciences_tasks | | |
| |global_mmlu_full_ar_stem_tasks | | |
| |global_mmlu_full_bn_humanities_tasks | | |
| |global_mmlu_full_bn_other_tasks | | |
| |global_mmlu_full_bn_social_sciences_tasks | | |
| |global_mmlu_full_bn_stem_tasks | | |
| |global_mmlu_full_cs_humanities_tasks | | |
| |global_mmlu_full_cs_other_tasks | | |
| |global_mmlu_full_cs_social_sciences_tasks | | |
| |global_mmlu_full_cs_stem_tasks | | |
| |global_mmlu_full_de_humanities_tasks | | |
| |global_mmlu_full_de_other_tasks | | |
| |global_mmlu_full_de_social_sciences_tasks | | |
| |global_mmlu_full_de_stem_tasks | | |
| |global_mmlu_full_el_humanities_tasks | | |
| |global_mmlu_full_el_other_tasks | | |
| |global_mmlu_full_el_social_sciences_tasks | | |
| |global_mmlu_full_el_stem_tasks | | |
| |global_mmlu_full_en_humanities_tasks | | |
| |global_mmlu_full_en_other_tasks | | |
| |global_mmlu_full_en_social_sciences_tasks | | |
| |global_mmlu_full_en_stem_tasks | | |
| |global_mmlu_full_es_humanities_tasks | | |
| |global_mmlu_full_es_other_tasks | | |
| |global_mmlu_full_es_social_sciences_tasks | | |
| |global_mmlu_full_es_stem_tasks | | |
| |global_mmlu_full_fa_humanities_tasks | | |
| |global_mmlu_full_fa_other_tasks | | |
| |global_mmlu_full_fa_social_sciences_tasks | | |
| |global_mmlu_full_fa_stem_tasks | | |
| |global_mmlu_full_fil_humanities_tasks | | |
| |global_mmlu_full_fil_other_tasks | | |
| |global_mmlu_full_fil_social_sciences_tasks | | |
| |global_mmlu_full_fil_stem_tasks | | |
| |global_mmlu_full_fr_humanities_tasks | | |
| |global_mmlu_full_fr_other_tasks | | |
| |global_mmlu_full_fr_social_sciences_tasks | | |
| |global_mmlu_full_fr_stem_tasks | | |
| |global_mmlu_full_ha_humanities_tasks | | |
| |global_mmlu_full_ha_other_tasks | | |
| |global_mmlu_full_ha_social_sciences_tasks | | |
| |global_mmlu_full_ha_stem_tasks | | |
| |global_mmlu_full_he_humanities_tasks | | |
| |global_mmlu_full_he_other_tasks | | |
| |global_mmlu_full_he_social_sciences_tasks | | |
| |global_mmlu_full_he_stem_tasks | | |
| |global_mmlu_full_hi_humanities_tasks | | |
| |global_mmlu_full_hi_other_tasks | | |
| |global_mmlu_full_hi_social_sciences_tasks | | |
| |global_mmlu_full_hi_stem_tasks | | |
| |global_mmlu_full_id_humanities_tasks | | |
| |global_mmlu_full_id_other_tasks | | |
| |global_mmlu_full_id_social_sciences_tasks | | |
| |global_mmlu_full_id_stem_tasks | | |
| |global_mmlu_full_ig_humanities_tasks | | |
| |global_mmlu_full_ig_other_tasks | | |
| |global_mmlu_full_ig_social_sciences_tasks | | |
| |global_mmlu_full_ig_stem_tasks | | |
| |global_mmlu_full_it_humanities_tasks | | |
| |global_mmlu_full_it_other_tasks | | |
| |global_mmlu_full_it_social_sciences_tasks | | |
| |global_mmlu_full_it_stem_tasks | | |
| |global_mmlu_full_ja_humanities_tasks | | |
| |global_mmlu_full_ja_other_tasks | | |
| |global_mmlu_full_ja_social_sciences_tasks | | |
| |global_mmlu_full_ja_stem_tasks | | |
| |global_mmlu_full_ko_humanities_tasks | | |
| |global_mmlu_full_ko_other_tasks | | |
| |global_mmlu_full_ko_social_sciences_tasks | | |
| |global_mmlu_full_ko_stem_tasks | | |
| |global_mmlu_full_ky_humanities_tasks | | |
| |global_mmlu_full_ky_other_tasks | | |
| |global_mmlu_full_ky_social_sciences_tasks | | |
| |global_mmlu_full_ky_stem_tasks | | |
| |global_mmlu_full_lt_humanities_tasks | | |
| |global_mmlu_full_lt_other_tasks | | |
| |global_mmlu_full_lt_social_sciences_tasks | | |
| |global_mmlu_full_lt_stem_tasks | | |
| |global_mmlu_full_mg_humanities_tasks | | |
| |global_mmlu_full_mg_other_tasks | | |
| |global_mmlu_full_mg_social_sciences_tasks | | |
| |global_mmlu_full_mg_stem_tasks | | |
| |global_mmlu_full_ms_humanities_tasks | | |
| |global_mmlu_full_ms_other_tasks | | |
| |global_mmlu_full_ms_social_sciences_tasks | | |
| |global_mmlu_full_ms_stem_tasks | | |
| |global_mmlu_full_ne_humanities_tasks | | |
| |global_mmlu_full_ne_other_tasks | | |
| |global_mmlu_full_ne_social_sciences_tasks | | |
| |global_mmlu_full_ne_stem_tasks | | |
| |global_mmlu_full_nl_humanities_tasks | | |
| |global_mmlu_full_nl_other_tasks | | |
| |global_mmlu_full_nl_social_sciences_tasks | | |
| |global_mmlu_full_nl_stem_tasks | | |
| |global_mmlu_full_ny_humanities_tasks | | |
| |global_mmlu_full_ny_other_tasks | | |
| |global_mmlu_full_ny_social_sciences_tasks | | |
| |global_mmlu_full_ny_stem_tasks | | |
| |global_mmlu_full_pl_humanities_tasks | | |
| |global_mmlu_full_pl_other_tasks | | |
| |global_mmlu_full_pl_social_sciences_tasks | | |
| |global_mmlu_full_pl_stem_tasks | | |
| |global_mmlu_full_pt_humanities_tasks | | |
| |global_mmlu_full_pt_other_tasks | | |
| |global_mmlu_full_pt_social_sciences_tasks | | |
| |global_mmlu_full_pt_stem_tasks | | |
| |global_mmlu_full_ro_humanities_tasks | | |
| |global_mmlu_full_ro_other_tasks | | |
| |global_mmlu_full_ro_social_sciences_tasks | | |
| |global_mmlu_full_ro_stem_tasks | | |
| |global_mmlu_full_ru_humanities_tasks | | |
| |global_mmlu_full_ru_other_tasks | | |
| |global_mmlu_full_ru_social_sciences_tasks | | |
| |global_mmlu_full_ru_stem_tasks | | |
| |global_mmlu_full_si_humanities_tasks | | |
| |global_mmlu_full_si_other_tasks | | |
| |global_mmlu_full_si_social_sciences_tasks | | |
| |global_mmlu_full_si_stem_tasks | | |
| |global_mmlu_full_sn_humanities_tasks | | |
| |global_mmlu_full_sn_other_tasks | | |
| |global_mmlu_full_sn_social_sciences_tasks | | |
| |global_mmlu_full_sn_stem_tasks | | |
| |global_mmlu_full_so_humanities_tasks | | |
| |global_mmlu_full_so_other_tasks | | |
| |global_mmlu_full_so_social_sciences_tasks | | |
| |global_mmlu_full_so_stem_tasks | | |
| |global_mmlu_full_sr_humanities_tasks | | |
| |global_mmlu_full_sr_other_tasks | | |
| |global_mmlu_full_sr_social_sciences_tasks | | |
| |global_mmlu_full_sr_stem_tasks | | |
| |global_mmlu_full_sv_humanities_tasks | | |
| |global_mmlu_full_sv_other_tasks | | |
| |global_mmlu_full_sv_social_sciences_tasks | | |
| |global_mmlu_full_sv_stem_tasks | | |
| |global_mmlu_full_sw_humanities_tasks | | |
| |global_mmlu_full_sw_other_tasks | | |
| |global_mmlu_full_sw_social_sciences_tasks | | |
| |global_mmlu_full_sw_stem_tasks | | |
| |global_mmlu_full_te_humanities_tasks | | |
| |global_mmlu_full_te_other_tasks | | |
| |global_mmlu_full_te_social_sciences_tasks | | |
| |global_mmlu_full_te_stem_tasks | | |
| |global_mmlu_full_tr_humanities_tasks | | |
| |global_mmlu_full_tr_other_tasks | | |
| |global_mmlu_full_tr_social_sciences_tasks | | |
| |global_mmlu_full_tr_stem_tasks | | |
| |global_mmlu_full_uk_humanities_tasks | | |
| |global_mmlu_full_uk_other_tasks | | |
| |global_mmlu_full_uk_social_sciences_tasks | | |
| |global_mmlu_full_uk_stem_tasks | | |
| |global_mmlu_full_vi_humanities_tasks | | |
| |global_mmlu_full_vi_other_tasks | | |
| |global_mmlu_full_vi_social_sciences_tasks | | |
| |global_mmlu_full_vi_stem_tasks | | |
| |global_mmlu_full_yo_humanities_tasks | | |
| |global_mmlu_full_yo_other_tasks | | |
| |global_mmlu_full_yo_social_sciences_tasks | | |
| |global_mmlu_full_yo_stem_tasks | | |
| |global_mmlu_full_zh_humanities_tasks | | |
| |global_mmlu_full_zh_other_tasks | | |
| |global_mmlu_full_zh_social_sciences_tasks | | |
| |global_mmlu_full_zh_stem_tasks | | |
| |glue | | |
| |gpqa | | |
| |gpt3_translation_benchmarks | | |
| |headqa | | |
| |hellaswag_multilingual | | |
| |hendrycks_ethics | | |
| |injongointent_prompt_1 | | |
| |injongointent_prompt_2 | | |
| |injongointent_prompt_3 | | |
| |injongointent_prompt_4 | | |
| |injongointent_prompt_5 | | |
| |injongointent_tasks | | |
| |inverse_scaling_mc | | |
| |iwslt2017 | | |
| |jsonschema_bench | | |
| |kbl | | |
| |kbl_bar_exam_em | | |
| |kbl_bar_exam_em_civil | | |
| |kbl_bar_exam_em_criminal | | |
| |kbl_bar_exam_em_public | | |
| |kbl_bar_exam_em_responsibility | | |
| |kbl_knowledge_em | | |
| |kbl_reasoning_em | | |
| |kmmlu_applied_science_tasks | | |
| |kmmlu_cot_hard_applied_science_tasks | | |
| |kmmlu_cot_hard_humss_tasks | | |
| |kmmlu_cot_hard_other_tasks | | |
| |kmmlu_cot_hard_stem_tasks | | |
| |kmmlu_direct_applied_science_tasks | | |
| |kmmlu_direct_hard_applied_science_tasks | | |
| |kmmlu_direct_hard_humss_tasks | | |
| |kmmlu_direct_hard_other_tasks | | |
| |kmmlu_direct_hard_stem_tasks | | |
| |kmmlu_direct_humss_tasks | | |
| |kmmlu_direct_other_tasks | | |
| |kmmlu_direct_stem_tasks | | |
| |kmmlu_hard_applied_science_tasks | | |
| |kmmlu_hard_humss_tasks | | |
| |kmmlu_hard_other_tasks | | |
| |kmmlu_hard_stem_tasks | | |
| |kmmlu_humss_tasks | | |
| |kmmlu_other_tasks | | |
| |kmmlu_stem_tasks | | |
| |lambada | | |
| |lambada_cloze | | |
| |lambada_multilingual | | |
| |llama | | |
| |longbench | | |
| |longbench_e | | |
| |longcxt | | |
| |m_mmlu | | |
| |mafand_afr-eng | | |
| |mafand_afr-eng_prompt_1 | | |
| |mafand_afr-eng_prompt_3 | | |
| |mafand_eng-afr | | |
| |mafand_eng-afr_prompt_1 | | |
| |mafand_eng-afr_prompt_2 | | |
| |mafand_eng-afr_prompt_3 | | |
| |mafand_tasks | | |
| |masakhaner_prompt_1 | | |
| |masakhaner_prompt_2 | | |
| |masakhaner_prompt_3 | | |
| |masakhaner_prompt_4 | | |
| |masakhaner_prompt_5 | | |
| |masakhaner_tasks | | |
| |masakhanews_prompt_1 | | |
| |masakhanews_prompt_2 | | |
| |masakhanews_prompt_3 | | |
| |masakhanews_prompt_4 | | |
| |masakhanews_prompt_5 | | |
| |masakhanews_tasks | | |
| |masakhapos_prompt_1 | | |
| |masakhapos_prompt_2 | | |
| |masakhapos_prompt_3 | | |
| |masakhapos_prompt_4 | | |
| |masakhapos_prompt_5 | | |
| |masakhapos_tasks | | |
| |mastermind | | |
| |mastermind_easy | | |
| |mastermind_hard | | |
| |math_word_problems | | |
| |med_concepts_qa_atc_tasks | | |
| |med_concepts_qa_icd10cm_tasks | | |
| |med_concepts_qa_icd10proc_tasks | | |
| |med_concepts_qa_icd9cm_tasks | | |
| |med_concepts_qa_icd9proc_tasks | | |
| |metabench_arc_subset | | |
| |metabench_gsm8k_subset | | |
| |metabench_hellaswag_subset | | |
| |metabench_mmlu_subset | | |
| |metabench_truthfulqa_subset | | |
| |metabench_winogrande_subset | | |
| |mgsm_cot_native | | |
| |mgsm_direct | | |
| |mmlu_continuation_humanities | | |
| |mmlu_continuation_other | | |
| |mmlu_continuation_social_sciences | | |
| |mmlu_continuation_stem | | |
| |mmlu_cot_llama_humanities_tasks | | |
| |mmlu_cot_llama_other_tasks | | |
| |mmlu_cot_llama_social_sciences_tasks | | |
| |mmlu_cot_llama_stem_tasks | | |
| |mmlu_de_llama_humanities_tasks | | |
| |mmlu_de_llama_other_tasks | | |
| |mmlu_de_llama_social_sciences_tasks | | |
| |mmlu_de_llama_stem_tasks | | |
| |mmlu_es_llama_humanities_tasks | | |
| |mmlu_es_llama_other_tasks | | |
| |mmlu_es_llama_social_sciences_tasks | | |
| |mmlu_es_llama_stem_tasks | | |
| |mmlu_flan_cot_fewshot_humanities | | |
| |mmlu_flan_cot_fewshot_other | | |
| |mmlu_flan_cot_fewshot_social_sciences | | |
| |mmlu_flan_cot_fewshot_stem | | |
| |mmlu_flan_cot_zeroshot_humanities | | |
| |mmlu_flan_cot_zeroshot_other | | |
| |mmlu_flan_cot_zeroshot_social_sciences | | |
| |mmlu_flan_cot_zeroshot_stem | | |
| |mmlu_flan_n_shot_generative_humanities | | |
| |mmlu_flan_n_shot_generative_other | | |
| |mmlu_flan_n_shot_generative_social_sciences | | |
| |mmlu_flan_n_shot_generative_stem | | |
| |mmlu_flan_n_shot_loglikelihood_humanities | | |
| |mmlu_flan_n_shot_loglikelihood_other | | |
| |mmlu_flan_n_shot_loglikelihood_social_sciences | | |
| |mmlu_flan_n_shot_loglikelihood_stem | | |
| |mmlu_fr_llama_humanities_tasks | | |
| |mmlu_fr_llama_other_tasks | | |
| |mmlu_fr_llama_social_sciences_tasks | | |
| |mmlu_fr_llama_stem_tasks | | |
| |mmlu_hi_llama_humanities_tasks | | |
| |mmlu_hi_llama_other_tasks | | |
| |mmlu_hi_llama_social_sciences_tasks | | |
| |mmlu_hi_llama_stem_tasks | | |
| |mmlu_humanities_generative | | |
| |mmlu_humanities_tasks | | |
| |mmlu_it_llama_humanities_tasks | | |
| |mmlu_it_llama_other_tasks | | |
| |mmlu_it_llama_social_sciences_tasks | | |
| |mmlu_it_llama_stem_tasks | | |
| |mmlu_llama_humanities_tasks | | |
| |mmlu_llama_other_tasks | | |
| |mmlu_llama_social_sciences_tasks | | |
| |mmlu_llama_stem_tasks | | |
| |mmlu_other_generative | | |
| |mmlu_other_tasks | | |
| |mmlu_pt_llama_humanities_tasks | | |
| |mmlu_pt_llama_other_tasks | | |
| |mmlu_pt_llama_social_sciences_tasks | | |
| |mmlu_pt_llama_stem_tasks | | |
| |mmlu_social_sciences_generative | | |
| |mmlu_social_sciences_tasks | | |
| |mmlu_stem_generative | | |
| |mmlu_stem_tasks | | |
| |mmlu_th_llama_humanities_tasks | | |
| |mmlu_th_llama_other_tasks | | |
| |mmlu_th_llama_social_sciences_tasks | | |
| |mmlu_th_llama_stem_tasks | | |
| |mmlusr_answer_only_humanities_tasks | | |
| |mmlusr_answer_only_other_tasks | | |
| |mmlusr_answer_only_social_sciences_tasks | | |
| |mmlusr_answer_only_stem_tasks | | |
| |mmlusr_question_and_answer_humanities_tasks | | |
| |mmlusr_question_and_answer_other_tasks | | |
| |mmlusr_question_and_answer_social_sciences_tasks| | |
| |mmlusr_question_and_answer_stem_tasks | | |
| |mmlusr_question_only_humanities_tasks | | |
| |mmlusr_question_only_other_tasks | | |
| |mmlusr_question_only_social_sciences_tasks | | |
| |mmlusr_question_only_stem_tasks | | |
| |multiple_choice | | |
| |naijarc_prompt_1 | | |
| |naijarc_prompt_2 | | |
| |naijarc_prompt_3 | | |
| |naijarc_prompt_4 | | |
| |naijarc_prompt_5 | | |
| |naijarc_tasks | | |
| |nollysenti_prompt_1 | | |
| |nollysenti_prompt_2 | | |
| |nollysenti_prompt_3 | | |
| |nollysenti_prompt_4 | | |
| |nollysenti_prompt_5 | | |
| |norbelebele | | |
| |norcommonsenseqa_nno | | |
| |norcommonsenseqa_nob | | |
| |norec_document | | |
| |norec_sentence | | |
| |noridiom_nno | | |
| |noridiom_nob | | |
| |noropenbookqa_nno | | |
| |noropenbookqa_nob | | |
| |norquad | | |
| |norsumm_nno | | |
| |norsumm_nob | | |
| |nortruthfulqa_gen_nno | | |
| |nortruthfulqa_gen_nob | | |
| |nortruthfulqa_mc_nno | | |
| |nortruthfulqa_mc_nob | | |
| |nrk_quiz_qa_nno | | |
| |nrk_quiz_qa_nob | | |
| |ntrex_afr-eng | | |
| |ntrex_afr-eng_prompt_1 | | |
| |ntrex_afr-eng_prompt_2 | | |
| |ntrex_afr-eng_prompt_3 | | |
| |ntrex_eng-afr | | |
| |ntrex_eng-afr_prompt_1 | | |
| |ntrex_eng-afr_prompt_2 | | |
| |ntrex_eng-afr_prompt_3 | | |
| |ntrex_tasks | | |
| |openai_mmlu_prompt_1 | | |
| |openai_mmlu_prompt_2 | | |
| |openai_mmlu_prompt_3 | | |
| |openai_mmlu_prompt_4 | | |
| |openai_mmlu_prompt_5 | | |
| |openai_mmlu_tasks | | |
| |paloma | | |
| |persona | | |
| |phrases_es | | |
| |phrases_va | | |
| |polemo2 | | |
| |qa4mre | | |
| |qasper | | |
| |salt_prompt_1 | | |
| |salt_prompt_2 | | |
| |salt_prompt_3 | | |
| |salt_tasks | | |
| |score_robustness_mmlu_pro | | |
| |self_consistency | | |
| |sib_prompt_1 | | |
| |sib_prompt_2 | | |
| |sib_prompt_3 | | |
| |sib_prompt_4 | | |
| |sib_prompt_5 | | |
| |sib_tasks | | |
| |social_bias | | |
| |storycloze | | |
| |super-glue-lm-eval-v1 | | |
| |super-glue-lm-eval-v1-seq2seq | | |
| |super-glue-t5-prompt | | |
| |sycophancy | | |
| |tatoeba_eng_nno | | |
| |tatoeba_eng_nob | | |
| |tatoeba_nno_eng | | |
| |tatoeba_nob_eng | | |
| |tmlu_humanities_tasks | | |
| |tmlu_other_tasks | | |
| |tmlu_social_sciences_tasks | | |
| |tmlu_stem_tasks | | |
| |tmlu_taiwan_specific_tasks | | |
| |tmmluplus_STEM_tasks | | |
| |tmmluplus_humanities_tasks | | |
| |tmmluplus_other_tasks | | |
| |tmmluplus_social_sciences_tasks | | |
| |translation | | |
| |truthfulqa | | |
| |truthfulqa_gl | | |
| |truthfulqa_multilingual | | |
| |turkishmmlu | | |
| |turkishmmlu_cot | | |
| |uhura_arc_easy_prompt_1 | | |
| |uhura_arc_easy_prompt_2 | | |
| |uhura_arc_easy_prompt_3 | | |
| |uhura_arc_easy_prompt_4 | | |
| |uhura_arc_easy_prompt_5 | | |
| |uhura_arc_easy_tasks | | |
| |unscramble | | |
| |winogender | | |
| |wmt14 | | |
| |wmt16 | | |
| |xlsum_prompt_1 | | |
| |xlsum_prompt_2 | | |
| |xlsum_prompt_3 | | |
| |xlsum_tasks | | |
| |xnli_eu_mt_native | | |
| |xquad | | |
| | Task | Config Location | Output Type | | |
| |--------------------------------------------------------------------------------------|----------------------------------------------------------------------------------------------------------------------------------------------------------------|---------------------| | |
| |20_newsgroups |lm_eval/tasks/unitxt/20_newsgroups.yaml | | | |
| |AraDiCE_ArabicMMLU_high_humanities_history_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_high_humanities_history.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_high_humanities_history_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_high_humanities_history.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_high_humanities_islamic-studies_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_high_humanities_islamic-studies.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_high_humanities_islamic-studies_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_high_humanities_islamic-studies.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_high_humanities_philosophy_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_high_humanities_philosophy.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_high_humanities_philosophy_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_high_humanities_philosophy.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_high_language_arabic-language_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_high_language_arabic-language.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_high_language_arabic-language_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_high_language_arabic-language.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_high_social-science_civics_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_high_social-science_civics.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_high_social-science_civics_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_high_social-science_civics.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_high_social-science_economics_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_high_social-science_economics.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_high_social-science_economics_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_high_social-science_economics.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_high_social-science_geography_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_high_social-science_geography.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_high_social-science_geography_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_high_social-science_geography.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_high_stem_biology_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_high_stem_biology.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_high_stem_biology_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_high_stem_biology.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_high_stem_computer-science_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_high_stem_computer-science.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_high_stem_computer-science_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_high_stem_computer-science.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_high_stem_physics_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_high_stem_physics.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_high_stem_physics_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_high_stem_physics.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_middle_humanities_history_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_middle_humanities_history.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_middle_humanities_history_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_middle_humanities_history.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_middle_humanities_islamic-studies_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_middle_humanities_islamic-studies.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_middle_humanities_islamic-studies_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_middle_humanities_islamic-studies.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_middle_language_arabic-language_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_middle_language_arabic-language.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_middle_language_arabic-language_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_middle_language_arabic-language.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_middle_other_general-knowledge_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_middle_other_general-knowledge.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_middle_other_general-knowledge_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_middle_other_general-knowledge.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_middle_social-science_civics_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_middle_social-science_civics.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_middle_social-science_civics_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_middle_social-science_civics.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_middle_social-science_economics_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_middle_social-science_economics.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_middle_social-science_economics_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_middle_social-science_economics.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_middle_social-science_geography_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_middle_social-science_geography.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_middle_social-science_geography_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_middle_social-science_geography.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_middle_social-science_social-science_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_middle_social-science_social-science.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_middle_social-science_social-science_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_middle_social-science_social-science.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_middle_stem_computer-science_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_middle_stem_computer-science.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_middle_stem_computer-science_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_middle_stem_computer-science.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_middle_stem_natural-science_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_middle_stem_natural-science.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_middle_stem_natural-science_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_middle_stem_natural-science.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_na_humanities_islamic-studies_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_na_humanities_islamic-studies.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_na_humanities_islamic-studies_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_na_humanities_islamic-studies.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_na_language_arabic-language-general_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_na_language_arabic-language-general.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_na_language_arabic-language-general_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_na_language_arabic-language-general.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_na_language_arabic-language-grammar_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_na_language_arabic-language-grammar.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_na_language_arabic-language-grammar_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_na_language_arabic-language-grammar.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_na_other_driving-test_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_na_other_driving-test.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_na_other_driving-test_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_na_other_driving-test.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_na_other_general-knowledge_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_na_other_general-knowledge.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_na_other_general-knowledge_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_na_other_general-knowledge.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_primary_humanities_history_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_primary_humanities_history.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_primary_humanities_history_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_primary_humanities_history.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_primary_humanities_islamic-studies_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_primary_humanities_islamic-studies.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_primary_humanities_islamic-studies_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_primary_humanities_islamic-studies.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_primary_language_arabic-language_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_primary_language_arabic-language.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_primary_language_arabic-language_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_primary_language_arabic-language.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_primary_other_general-knowledge_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_primary_other_general-knowledge.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_primary_other_general-knowledge_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_primary_other_general-knowledge.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_primary_social-science_geography_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_primary_social-science_geography.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_primary_social-science_geography_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_primary_social-science_geography.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_primary_social-science_social-science_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_primary_social-science_social-science.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_primary_social-science_social-science_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_primary_social-science_social-science.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_primary_stem_computer-science_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_primary_stem_computer-science.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_primary_stem_computer-science_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_primary_stem_computer-science.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_primary_stem_math_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_primary_stem_math.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_primary_stem_math_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_primary_stem_math.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_primary_stem_natural-science_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_primary_stem_natural-science.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_primary_stem_natural-science_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_primary_stem_natural-science.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_prof_humanities_law_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_prof_humanities_law.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_prof_humanities_law_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_prof_humanities_law.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_univ_other_management_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_univ_other_management.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_univ_other_management_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_univ_other_management.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_univ_social-science_accounting_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_univ_social-science_accounting.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_univ_social-science_accounting_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_univ_social-science_accounting.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_univ_social-science_economics_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_univ_social-science_economics.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_univ_social-science_economics_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_univ_social-science_economics.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_univ_social-science_political-science_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_univ_social-science_political-science.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_univ_social-science_political-science_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_univ_social-science_political-science.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_univ_stem_computer-science_egy |lm_eval/tasks/aradice/ArabicMMLU/EGY/AraDiCE_ArabicMMLU_univ_stem_computer-science.yaml |multiple_choice | | |
| |AraDiCE_ArabicMMLU_univ_stem_computer-science_lev |lm_eval/tasks/aradice/ArabicMMLU/LEV/AraDiCE_ArabicMMLU_univ_stem_computer-science.yaml |multiple_choice | | |
| |AraDiCE_boolq_egy |lm_eval/tasks/aradice/boolq/EGY/boolq_egy.yaml |multiple_choice | | |
| |AraDiCE_boolq_eng |lm_eval/tasks/aradice/boolq/ENG/boolq_eng.yaml |multiple_choice | | |
| |AraDiCE_boolq_lev |lm_eval/tasks/aradice/boolq/LEV/boolq_lev.yaml |multiple_choice | | |
| |AraDiCE_boolq_msa |lm_eval/tasks/aradice/boolq/MSA/boolq_msa.yaml |multiple_choice | | |
| |AraDiCE_egypt_cultural |lm_eval/tasks/aradice/cultural-benchmark/egypt.yaml |multiple_choice | | |
| |AraDiCE_jordan_cultural |lm_eval/tasks/aradice/cultural-benchmark/jordan.yaml |multiple_choice | | |
| |AraDiCE_lebanon_cultural |lm_eval/tasks/aradice/cultural-benchmark/lebanon.yaml |multiple_choice | | |
| |AraDiCE_openbookqa_egy |lm_eval/tasks/aradice/openbookqa/openbookqa_egy.yaml |multiple_choice | | |
| |AraDiCE_openbookqa_eng |lm_eval/tasks/aradice/openbookqa/openbookqa_eng.yaml |multiple_choice | | |
| |AraDiCE_openbookqa_lev |lm_eval/tasks/aradice/openbookqa/openbookqa_lev.yaml |multiple_choice | | |
| |AraDiCE_openbookqa_msa |lm_eval/tasks/aradice/openbookqa/openbookqa_msa.yaml |multiple_choice | | |
| |AraDiCE_palestine_cultural |lm_eval/tasks/aradice/cultural-benchmark/palestine.yaml |multiple_choice | | |
| |AraDiCE_piqa_egy |lm_eval/tasks/aradice/piqa/piqa_egy.yaml |multiple_choice | | |
| |AraDiCE_piqa_eng |lm_eval/tasks/aradice/piqa/piqa_eng.yaml |multiple_choice | | |
| |AraDiCE_piqa_lev |lm_eval/tasks/aradice/piqa/piqa_lev.yaml |multiple_choice | | |
| |AraDiCE_piqa_msa |lm_eval/tasks/aradice/piqa/piqa_msa.yaml |multiple_choice | | |
| |AraDiCE_qatar_cultural |lm_eval/tasks/aradice/cultural-benchmark/qatar.yaml |multiple_choice | | |
| |AraDiCE_syria_cultural |lm_eval/tasks/aradice/cultural-benchmark/syria.yaml |multiple_choice | | |
| |AraDiCE_truthfulqa_mc1_egy |lm_eval/tasks/aradice/truthfulqa_mcq/truthfulqa_mc1_egy.yaml |multiple_choice | | |
| |AraDiCE_truthfulqa_mc1_eng |lm_eval/tasks/aradice/truthfulqa_mcq/truthfulqa_mc1_eng.yaml |multiple_choice | | |
| |AraDiCE_truthfulqa_mc1_lev |lm_eval/tasks/aradice/truthfulqa_mcq/truthfulqa_mc1_lev.yaml |multiple_choice | | |
| |AraDiCE_truthfulqa_mc1_msa |lm_eval/tasks/aradice/truthfulqa_mcq/truthfulqa_mc1_msa.yaml |multiple_choice | | |
| |AraDiCE_winogrande_egy |lm_eval/tasks/aradice/winogrande/winogrande_egy.yaml |multiple_choice | | |
| |AraDiCE_winogrande_eng |lm_eval/tasks/aradice/winogrande/winogrande_eng.yaml |multiple_choice | | |
| |AraDiCE_winogrande_lev |lm_eval/tasks/aradice/winogrande/winogrande_lev.yaml |multiple_choice | | |
| |AraDiCE_winogrande_msa |lm_eval/tasks/aradice/winogrande/winogrande_msa.yaml |multiple_choice | | |
| |aclue_ancient_chinese_culture |lm_eval/tasks/aclue/aclue_ancient_chinese_culture.yaml |multiple_choice | | |
| |aclue_ancient_literature |lm_eval/tasks/aclue/aclue_ancient_literature.yaml |multiple_choice | | |
| |aclue_ancient_medical |lm_eval/tasks/aclue/aclue_ancient_medical.yaml |multiple_choice | | |
| |aclue_ancient_phonetics |lm_eval/tasks/aclue/aclue_ancient_phonetics.yaml |multiple_choice | | |
| |aclue_basic_ancient_chinese |lm_eval/tasks/aclue/aclue_basic_ancient_chinese.yaml |multiple_choice | | |
| |aclue_couplet_prediction |lm_eval/tasks/aclue/aclue_couplet_prediction.yaml |multiple_choice | | |
| |aclue_homographic_character_resolution |lm_eval/tasks/aclue/aclue_homographic_character_resolution.yaml |multiple_choice | | |
| |aclue_named_entity_recognition |lm_eval/tasks/aclue/aclue_named_entity_recognition.yaml |multiple_choice | | |
| |aclue_poetry_appreciate |lm_eval/tasks/aclue/aclue_poetry_appreciate.yaml |multiple_choice | | |
| |aclue_poetry_context_prediction |lm_eval/tasks/aclue/aclue_poetry_context_prediction.yaml |multiple_choice | | |
| |aclue_poetry_quality_assessment |lm_eval/tasks/aclue/aclue_poetry_quality_assessment.yaml |multiple_choice | | |
| |aclue_poetry_sentiment_analysis |lm_eval/tasks/aclue/aclue_poetry_sentiment_analysis.yaml |multiple_choice | | |
| |aclue_polysemy_resolution |lm_eval/tasks/aclue/aclue_polysemy_resolution.yaml |multiple_choice | | |
| |aclue_reading_comprehension |lm_eval/tasks/aclue/aclue_reading_comprehension.yaml |multiple_choice | | |
| |aclue_sentence_segmentation |lm_eval/tasks/aclue/aclue_sentence_segmentation.yaml |multiple_choice | | |
| |acp_app_bool |lm_eval/tasks/acpbench/boolq_cot_2shot/app.yaml |generate_until | | |
| |acp_app_gen |lm_eval/tasks/acpbench/gen_2shot/app.yaml |generate_until | | |
| |acp_app_gen_with_pddl |lm_eval/tasks/acpbench/gen_2shot_with_pddl/app.yaml |generate_until | | |
| |acp_app_mcq |lm_eval/tasks/acpbench/mcq_cot_2shot/app.yaml |generate_until | | |
| |acp_areach_bool |lm_eval/tasks/acpbench/boolq_cot_2shot/act_reach.yaml |generate_until | | |
| |acp_areach_gen |lm_eval/tasks/acpbench/gen_2shot/act_reach.yaml |generate_until | | |
| |acp_areach_gen_with_pddl |lm_eval/tasks/acpbench/gen_2shot_with_pddl/act_reach.yaml |generate_until | | |
| |acp_areach_mcq |lm_eval/tasks/acpbench/mcq_cot_2shot/act_reach.yaml |generate_until | | |
| |acp_just_bool |lm_eval/tasks/acpbench/boolq_cot_2shot/just.yaml |generate_until | | |
| |acp_just_gen |lm_eval/tasks/acpbench/gen_2shot/just.yaml |generate_until | | |
| |acp_just_gen_with_pddl |lm_eval/tasks/acpbench/gen_2shot_with_pddl/just.yaml |generate_until | | |
| |acp_just_mcq |lm_eval/tasks/acpbench/mcq_cot_2shot/just.yaml |generate_until | | |
| |acp_land_bool |lm_eval/tasks/acpbench/boolq_cot_2shot/land.yaml |generate_until | | |
| |acp_land_gen |lm_eval/tasks/acpbench/gen_2shot/land.yaml |generate_until | | |
| |acp_land_gen_with_pddl |lm_eval/tasks/acpbench/gen_2shot_with_pddl/land.yaml |generate_until | | |
| |acp_land_mcq |lm_eval/tasks/acpbench/mcq_cot_2shot/land.yaml |generate_until | | |
| |acp_nexta_gen |lm_eval/tasks/acpbench/gen_2shot/next_act.yaml |generate_until | | |
| |acp_nexta_gen_with_pddl |lm_eval/tasks/acpbench/gen_2shot_with_pddl/next_act.yaml |generate_until | | |
| |acp_prog_bool |lm_eval/tasks/acpbench/boolq_cot_2shot/prog.yaml |generate_until | | |
| |acp_prog_gen |lm_eval/tasks/acpbench/gen_2shot/prog.yaml |generate_until | | |
| |acp_prog_gen_with_pddl |lm_eval/tasks/acpbench/gen_2shot_with_pddl/prog.yaml |generate_until | | |
| |acp_prog_mcq |lm_eval/tasks/acpbench/mcq_cot_2shot/prog.yaml |generate_until | | |
| |acp_reach_bool |lm_eval/tasks/acpbench/boolq_cot_2shot/reach.yaml |generate_until | | |
| |acp_reach_gen |lm_eval/tasks/acpbench/gen_2shot/reach.yaml |generate_until | | |
| |acp_reach_gen_with_pddl |lm_eval/tasks/acpbench/gen_2shot_with_pddl/reach.yaml |generate_until | | |
| |acp_reach_mcq |lm_eval/tasks/acpbench/mcq_cot_2shot/reach.yaml |generate_until | | |
| |acp_val_bool |lm_eval/tasks/acpbench/boolq_cot_2shot/val.yaml |generate_until | | |
| |acp_val_gen |lm_eval/tasks/acpbench/gen_2shot/val.yaml |generate_until | | |
| |acp_val_gen_with_pddl |lm_eval/tasks/acpbench/gen_2shot_with_pddl/val.yaml |generate_until | | |
| |acp_val_mcq |lm_eval/tasks/acpbench/mcq_cot_2shot/val.yaml |generate_until | | |
| |advanced_ai_risk_fewshot-coordinate-itself |lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-coordinate-itself.yaml |multiple_choice | | |
| |advanced_ai_risk_fewshot-coordinate-other-ais |lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-coordinate-other-ais.yaml |multiple_choice | | |
| |advanced_ai_risk_fewshot-coordinate-other-versions |lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-coordinate-other-versions.yaml |multiple_choice | | |
| |advanced_ai_risk_fewshot-corrigible-less-HHH |lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-corrigible-less-HHH.yaml |multiple_choice | | |
| |advanced_ai_risk_fewshot-corrigible-more-HHH |lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-corrigible-more-HHH.yaml |multiple_choice | | |
| |advanced_ai_risk_fewshot-corrigible-neutral-HHH |lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-corrigible-neutral-HHH.yaml |multiple_choice | | |
| |advanced_ai_risk_fewshot-myopic-reward |lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-myopic-reward.yaml |multiple_choice | | |
| |advanced_ai_risk_fewshot-one-box-tendency |lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-one-box-tendency.yaml |multiple_choice | | |
| |advanced_ai_risk_fewshot-power-seeking-inclination |lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-power-seeking-inclination.yaml |multiple_choice | | |
| |advanced_ai_risk_fewshot-self-awareness-general-ai |lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-self-awareness-general-ai.yaml |multiple_choice | | |
| |advanced_ai_risk_fewshot-self-awareness-good-text-model |lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-self-awareness-good-text-model.yaml |multiple_choice | | |
| |advanced_ai_risk_fewshot-self-awareness-text-model |lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-self-awareness-text-model.yaml |multiple_choice | | |
| |advanced_ai_risk_fewshot-self-awareness-training-architecture |lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-self-awareness-training-architecture.yaml |multiple_choice | | |
| |advanced_ai_risk_fewshot-self-awareness-training-web-gpt |lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-self-awareness-training-web-gpt.yaml |multiple_choice | | |
| |advanced_ai_risk_fewshot-survival-instinct |lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-survival-instinct.yaml |multiple_choice | | |
| |advanced_ai_risk_fewshot-wealth-seeking-inclination |lm_eval/tasks/model_written_evals/advanced_ai_risk/fewshot-wealth-seeking-inclination.yaml |multiple_choice | | |
| |advanced_ai_risk_human-coordinate-itself |lm_eval/tasks/model_written_evals/advanced_ai_risk/human-coordinate-itself.yaml |multiple_choice | | |
| |advanced_ai_risk_human-coordinate-other-ais |lm_eval/tasks/model_written_evals/advanced_ai_risk/human-coordinate-other-ais.yaml |multiple_choice | | |
| |advanced_ai_risk_human-coordinate-other-versions |lm_eval/tasks/model_written_evals/advanced_ai_risk/human-coordinate-other-versions.yaml |multiple_choice | | |
| |advanced_ai_risk_human-corrigible-less-HHH |lm_eval/tasks/model_written_evals/advanced_ai_risk/human-corrigible-less-HHH.yaml |multiple_choice | | |
| |advanced_ai_risk_human-corrigible-more-HHH |lm_eval/tasks/model_written_evals/advanced_ai_risk/human-corrigible-more-HHH.yaml |multiple_choice | | |
| |advanced_ai_risk_human-corrigible-neutral-HHH |lm_eval/tasks/model_written_evals/advanced_ai_risk/human-corrigible-neutral-HHH.yaml |multiple_choice | | |
| |advanced_ai_risk_human-myopic-reward |lm_eval/tasks/model_written_evals/advanced_ai_risk/human-myopic-reward.yaml |multiple_choice | | |
| |advanced_ai_risk_human-one-box-tendency |lm_eval/tasks/model_written_evals/advanced_ai_risk/human-one-box-tendency.yaml |multiple_choice | | |
| |advanced_ai_risk_human-power-seeking-inclination |lm_eval/tasks/model_written_evals/advanced_ai_risk/human-power-seeking-inclination.yaml |multiple_choice | | |
| |advanced_ai_risk_human-self-awareness-general-ai |lm_eval/tasks/model_written_evals/advanced_ai_risk/human-self-awareness-general-ai.yaml |multiple_choice | | |
| |advanced_ai_risk_human-self-awareness-good-text-model |lm_eval/tasks/model_written_evals/advanced_ai_risk/human-self-awareness-good-text-model.yaml |multiple_choice | | |
| |advanced_ai_risk_human-self-awareness-text-model |lm_eval/tasks/model_written_evals/advanced_ai_risk/human-self-awareness-text-model.yaml |multiple_choice | | |
| |advanced_ai_risk_human-self-awareness-training-architecture |lm_eval/tasks/model_written_evals/advanced_ai_risk/human-self-awareness-training-architecture.yaml |multiple_choice | | |
| |advanced_ai_risk_human-self-awareness-web-gpt |lm_eval/tasks/model_written_evals/advanced_ai_risk/human-self-awareness-web-gpt.yaml |multiple_choice | | |
| |advanced_ai_risk_human-survival-instinct |lm_eval/tasks/model_written_evals/advanced_ai_risk/human-survival-instinct.yaml |multiple_choice | | |
| |advanced_ai_risk_human-wealth-seeking-inclination |lm_eval/tasks/model_written_evals/advanced_ai_risk/human-wealth-seeking-inclination.yaml |multiple_choice | | |
| |advanced_ai_risk_lm-coordinate-itself |lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-coordinate-itself.yaml |multiple_choice | | |
| |advanced_ai_risk_lm-coordinate-other-ais |lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-coordinate-other-ais.yaml |multiple_choice | | |
| |advanced_ai_risk_lm-coordinate-other-versions |lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-coordinate-other-versions.yaml |multiple_choice | | |
| |advanced_ai_risk_lm-corrigible-less-HHH |lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-corrigible-less-HHH.yaml |multiple_choice | | |
| |advanced_ai_risk_lm-corrigible-more-HHH |lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-corrigible-more-HHH.yaml |multiple_choice | | |
| |advanced_ai_risk_lm-corrigible-neutral-HHH |lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-corrigible-neutral-HHH.yaml |multiple_choice | | |
| |advanced_ai_risk_lm-myopic-reward |lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-myopic-reward.yaml |multiple_choice | | |
| |advanced_ai_risk_lm-one-box-tendency |lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-one-box-tendency.yaml |multiple_choice | | |
| |advanced_ai_risk_lm-power-seeking-inclination |lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-power-seeking-inclination.yaml |multiple_choice | | |
| |advanced_ai_risk_lm-self-awareness-general-ai |lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-self-awareness-general-ai.yaml |multiple_choice | | |
| |advanced_ai_risk_lm-self-awareness-good-text-model |lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-self-awareness-good-text-model.yaml |multiple_choice | | |
| |advanced_ai_risk_lm-self-awareness-text-model |lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-self-awareness-text-model.yaml |multiple_choice | | |
| |advanced_ai_risk_lm-self-awareness-training-architecture |lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-self-awareness-training-architecture.yaml |multiple_choice | | |
| |advanced_ai_risk_lm-self-awareness-training-nn-architecture |lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-self-awareness-training-nn-architecture.yaml |multiple_choice | | |
| |advanced_ai_risk_lm-self-awareness-training-web-gpt |lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-self-awareness-training-web-gpt.yaml |multiple_choice | | |
| |advanced_ai_risk_lm-survival-instinct |lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-survival-instinct.yaml |multiple_choice | | |
| |advanced_ai_risk_lm-wealth-seeking-inclination |lm_eval/tasks/model_written_evals/advanced_ai_risk/lm-wealth-seeking-inclination.yaml |multiple_choice | | |
| |aexams_Biology |lm_eval/tasks/aexams/aexams_Biology.yaml |multiple_choice | | |
| |aexams_IslamicStudies |lm_eval/tasks/aexams/aexams_IslamicStudies.yaml |multiple_choice | | |
| |aexams_Physics |lm_eval/tasks/aexams/aexams_Physics.yaml |multiple_choice | | |
| |aexams_Science |lm_eval/tasks/aexams/aexams_Science.yaml |multiple_choice | | |
| |aexams_Social |lm_eval/tasks/aexams/aexams_Social.yaml |multiple_choice | | |
| |afridiacritics_bbj_prompt_1 |lm_eval/tasks/afrobench/adr/prompt_1/afridiacritics_bbj.yaml |generate_until | | |
| |afridiacritics_bbj_prompt_2 |lm_eval/tasks/afrobench/adr/prompt_2/afridiacritics_bbj.yaml |generate_until | | |
| |afridiacritics_bbj_prompt_3 |lm_eval/tasks/afrobench/adr/prompt_3/afridiacritics_bbj.yaml |generate_until | | |
| |afridiacritics_bbj_prompt_4 |lm_eval/tasks/afrobench/adr/prompt_4/afridiacritics_bbj.yaml |generate_until | | |
| |afridiacritics_bbj_prompt_5 |lm_eval/tasks/afrobench/adr/prompt_5/afridiacritics_bbj.yaml |generate_until | | |
| |afridiacritics_fon_prompt_1 |lm_eval/tasks/afrobench/adr/prompt_1/afridiacritics_fon.yaml |generate_until | | |
| |afridiacritics_fon_prompt_2 |lm_eval/tasks/afrobench/adr/prompt_2/afridiacritics_fon.yaml |generate_until | | |
| |afridiacritics_fon_prompt_3 |lm_eval/tasks/afrobench/adr/prompt_3/afridiacritics_fon.yaml |generate_until | | |
| |afridiacritics_fon_prompt_4 |lm_eval/tasks/afrobench/adr/prompt_4/afridiacritics_fon.yaml |generate_until | | |
| |afridiacritics_fon_prompt_5 |lm_eval/tasks/afrobench/adr/prompt_5/afridiacritics_fon.yaml |generate_until | | |
| |afridiacritics_ibo_prompt_1 |lm_eval/tasks/afrobench/adr/prompt_1/afridiacritics_ibo.yaml |generate_until | | |
| |afridiacritics_ibo_prompt_2 |lm_eval/tasks/afrobench/adr/prompt_2/afridiacritics_ibo.yaml |generate_until | | |
| |afridiacritics_ibo_prompt_3 |lm_eval/tasks/afrobench/adr/prompt_3/afridiacritics_ibo.yaml |generate_until | | |
| |afridiacritics_ibo_prompt_4 |lm_eval/tasks/afrobench/adr/prompt_4/afridiacritics_ibo.yaml |generate_until | | |
| |afridiacritics_ibo_prompt_5 |lm_eval/tasks/afrobench/adr/prompt_5/afridiacritics_ibo.yaml |generate_until | | |
| |afridiacritics_wol_prompt_1 |lm_eval/tasks/afrobench/adr/prompt_1/afridiacritics_wol.yaml |generate_until | | |
| |afridiacritics_wol_prompt_2 |lm_eval/tasks/afrobench/adr/prompt_2/afridiacritics_wol.yaml |generate_until | | |
| |afridiacritics_wol_prompt_3 |lm_eval/tasks/afrobench/adr/prompt_3/afridiacritics_wol.yaml |generate_until | | |
| |afridiacritics_wol_prompt_4 |lm_eval/tasks/afrobench/adr/prompt_4/afridiacritics_wol.yaml |generate_until | | |
| |afridiacritics_wol_prompt_5 |lm_eval/tasks/afrobench/adr/prompt_5/afridiacritics_wol.yaml |generate_until | | |
| |afridiacritics_yor_prompt_1 |lm_eval/tasks/afrobench/adr/prompt_1/afridiacritics_yor.yaml |generate_until | | |
| |afridiacritics_yor_prompt_2 |lm_eval/tasks/afrobench/adr/prompt_2/afridiacritics_yor.yaml |generate_until | | |
| |afridiacritics_yor_prompt_3 |lm_eval/tasks/afrobench/adr/prompt_3/afridiacritics_yor.yaml |generate_until | | |
| |afridiacritics_yor_prompt_4 |lm_eval/tasks/afrobench/adr/prompt_4/afridiacritics_yor.yaml |generate_until | | |
| |afridiacritics_yor_prompt_5 |lm_eval/tasks/afrobench/adr/prompt_5/afridiacritics_yor.yaml |generate_until | | |
| |afrimgsm_amh_prompt_1 |lm_eval/tasks/afrimgsm/direct/prompt_1/afrimgsm_amh.yaml |generate_until | | |
| |afrimgsm_amh_prompt_2 |lm_eval/tasks/afrimgsm/direct/prompt_2/afrimgsm_amh.yaml |generate_until | | |
| |afrimgsm_amh_prompt_3 |lm_eval/tasks/afrimgsm/direct/prompt_3/afrimgsm_amh.yaml |generate_until | | |
| |afrimgsm_amh_prompt_4 |lm_eval/tasks/afrimgsm/direct/prompt_4/afrimgsm_amh.yaml |generate_until | | |
| |afrimgsm_amh_prompt_5 |lm_eval/tasks/afrimgsm/direct/prompt_5/afrimgsm_amh.yaml |generate_until | | |
| |afrimgsm_cot_amh_prompt_1 |lm_eval/tasks/afrimgsm/direct_cot/prompt_1/afrimgsm_cot_amh.yaml |generate_until | | |
| |afrimgsm_cot_amh_prompt_2 |lm_eval/tasks/afrimgsm/direct_cot/prompt_2/afrimgsm_cot_amh.yaml |generate_until | | |
| |afrimgsm_cot_amh_prompt_3 |lm_eval/tasks/afrimgsm/direct_cot/prompt_3/afrimgsm_cot_amh.yaml |generate_until | | |
| |afrimgsm_cot_amh_prompt_4 |lm_eval/tasks/afrimgsm/direct_cot/prompt_4/afrimgsm_cot_amh.yaml |generate_until | | |
| |afrimgsm_cot_amh_prompt_5 |lm_eval/tasks/afrimgsm/direct_cot/prompt_5/afrimgsm_cot_amh.yaml |generate_until | | |
| |afrimgsm_cot_eng_prompt_1 |lm_eval/tasks/afrimgsm/direct_cot/prompt_1/afrimgsm_cot_eng.yaml |generate_until | | |
| |afrimgsm_cot_eng_prompt_2 |lm_eval/tasks/afrimgsm/direct_cot/prompt_2/afrimgsm_cot_eng.yaml |generate_until | | |
| |afrimgsm_cot_eng_prompt_3 |lm_eval/tasks/afrimgsm/direct_cot/prompt_3/afrimgsm_cot_eng.yaml |generate_until | | |
| |afrimgsm_cot_eng_prompt_4 |lm_eval/tasks/afrimgsm/direct_cot/prompt_4/afrimgsm_cot_eng.yaml |generate_until | | |
| |afrimgsm_cot_eng_prompt_5 |lm_eval/tasks/afrimgsm/direct_cot/prompt_5/afrimgsm_cot_eng.yaml |generate_until | | |
| |afrimgsm_cot_ewe_prompt_1 |lm_eval/tasks/afrimgsm/direct_cot/prompt_1/afrimgsm_cot_ewe.yaml |generate_until | | |
| |afrimgsm_cot_ewe_prompt_2 |lm_eval/tasks/afrimgsm/direct_cot/prompt_2/afrimgsm_cot_ewe.yaml |generate_until | | |
| |afrimgsm_cot_ewe_prompt_3 |lm_eval/tasks/afrimgsm/direct_cot/prompt_3/afrimgsm_cot_ewe.yaml |generate_until | | |
| |afrimgsm_cot_ewe_prompt_4 |lm_eval/tasks/afrimgsm/direct_cot/prompt_4/afrimgsm_cot_ewe.yaml |generate_until | | |
| |afrimgsm_cot_ewe_prompt_5 |lm_eval/tasks/afrimgsm/direct_cot/prompt_5/afrimgsm_cot_ewe.yaml |generate_until | | |
| |afrimgsm_cot_fra_prompt_1 |lm_eval/tasks/afrimgsm/direct_cot/prompt_1/afrimgsm_cot_fra.yaml |generate_until | | |
| |afrimgsm_cot_fra_prompt_2 |lm_eval/tasks/afrimgsm/direct_cot/prompt_2/afrimgsm_cot_fra.yaml |generate_until | | |
| |afrimgsm_cot_fra_prompt_3 |lm_eval/tasks/afrimgsm/direct_cot/prompt_3/afrimgsm_cot_fra.yaml |generate_until | | |
| |afrimgsm_cot_fra_prompt_4 |lm_eval/tasks/afrimgsm/direct_cot/prompt_4/afrimgsm_cot_fra.yaml |generate_until | | |
| |afrimgsm_cot_fra_prompt_5 |lm_eval/tasks/afrimgsm/direct_cot/prompt_5/afrimgsm_cot_fra.yaml |generate_until | | |
| |afrimgsm_cot_hau_prompt_1 |lm_eval/tasks/afrimgsm/direct_cot/prompt_1/afrimgsm_cot_hau.yaml |generate_until | | |
| |afrimgsm_cot_hau_prompt_2 |lm_eval/tasks/afrimgsm/direct_cot/prompt_2/afrimgsm_cot_hau.yaml |generate_until | | |
| |afrimgsm_cot_hau_prompt_3 |lm_eval/tasks/afrimgsm/direct_cot/prompt_3/afrimgsm_cot_hau.yaml |generate_until | | |
| |afrimgsm_cot_hau_prompt_4 |lm_eval/tasks/afrimgsm/direct_cot/prompt_4/afrimgsm_cot_hau.yaml |generate_until | | |
| |afrimgsm_cot_hau_prompt_5 |lm_eval/tasks/afrimgsm/direct_cot/prompt_5/afrimgsm_cot_hau.yaml |generate_until | | |
| |afrimgsm_cot_ibo_prompt_1 |lm_eval/tasks/afrimgsm/direct_cot/prompt_1/afrimgsm_cot_ibo.yaml |generate_until | | |
| |afrimgsm_cot_ibo_prompt_2 |lm_eval/tasks/afrimgsm/direct_cot/prompt_2/afrimgsm_cot_ibo.yaml |generate_until | | |
| |afrimgsm_cot_ibo_prompt_3 |lm_eval/tasks/afrimgsm/direct_cot/prompt_3/afrimgsm_cot_ibo.yaml |generate_until | | |
| |afrimgsm_cot_ibo_prompt_4 |lm_eval/tasks/afrimgsm/direct_cot/prompt_4/afrimgsm_cot_ibo.yaml |generate_until | | |
| |afrimgsm_cot_ibo_prompt_5 |lm_eval/tasks/afrimgsm/direct_cot/prompt_5/afrimgsm_cot_ibo.yaml |generate_until | | |
| |afrimgsm_cot_kin_prompt_1 |lm_eval/tasks/afrimgsm/direct_cot/prompt_1/afrimgsm_cot_kin.yaml |generate_until | | |
| |afrimgsm_cot_kin_prompt_2 |lm_eval/tasks/afrimgsm/direct_cot/prompt_2/afrimgsm_cot_kin.yaml |generate_until | | |
| |afrimgsm_cot_kin_prompt_3 |lm_eval/tasks/afrimgsm/direct_cot/prompt_3/afrimgsm_cot_kin.yaml |generate_until | | |
| |afrimgsm_cot_kin_prompt_4 |lm_eval/tasks/afrimgsm/direct_cot/prompt_4/afrimgsm_cot_kin.yaml |generate_until | | |
| |afrimgsm_cot_kin_prompt_5 |lm_eval/tasks/afrimgsm/direct_cot/prompt_5/afrimgsm_cot_kin.yaml |generate_until | | |
| |afrimgsm_cot_lin_prompt_1 |lm_eval/tasks/afrimgsm/direct_cot/prompt_1/afrimgsm_cot_lin.yaml |generate_until | | |
| |afrimgsm_cot_lin_prompt_2 |lm_eval/tasks/afrimgsm/direct_cot/prompt_2/afrimgsm_cot_lin.yaml |generate_until | | |
| |afrimgsm_cot_lin_prompt_3 |lm_eval/tasks/afrimgsm/direct_cot/prompt_3/afrimgsm_cot_lin.yaml |generate_until | | |
| |afrimgsm_cot_lin_prompt_4 |lm_eval/tasks/afrimgsm/direct_cot/prompt_4/afrimgsm_cot_lin.yaml |generate_until | | |
| |afrimgsm_cot_lin_prompt_5 |lm_eval/tasks/afrimgsm/direct_cot/prompt_5/afrimgsm_cot_lin.yaml |generate_until | | |
| |afrimgsm_cot_lug_prompt_1 |lm_eval/tasks/afrimgsm/direct_cot/prompt_1/afrimgsm_cot_lug.yaml |generate_until | | |
| |afrimgsm_cot_lug_prompt_2 |lm_eval/tasks/afrimgsm/direct_cot/prompt_2/afrimgsm_cot_lug.yaml |generate_until | | |
| |afrimgsm_cot_lug_prompt_3 |lm_eval/tasks/afrimgsm/direct_cot/prompt_3/afrimgsm_cot_lug.yaml |generate_until | | |
| |afrimgsm_cot_lug_prompt_4 |lm_eval/tasks/afrimgsm/direct_cot/prompt_4/afrimgsm_cot_lug.yaml |generate_until | | |
| |afrimgsm_cot_lug_prompt_5 |lm_eval/tasks/afrimgsm/direct_cot/prompt_5/afrimgsm_cot_lug.yaml |generate_until | | |
| |afrimgsm_cot_orm_prompt_1 |lm_eval/tasks/afrimgsm/direct_cot/prompt_1/afrimgsm_cot_orm.yaml |generate_until | | |
| |afrimgsm_cot_orm_prompt_2 |lm_eval/tasks/afrimgsm/direct_cot/prompt_2/afrimgsm_cot_orm.yaml |generate_until | | |
| |afrimgsm_cot_orm_prompt_3 |lm_eval/tasks/afrimgsm/direct_cot/prompt_3/afrimgsm_cot_orm.yaml |generate_until | | |
| |afrimgsm_cot_orm_prompt_4 |lm_eval/tasks/afrimgsm/direct_cot/prompt_4/afrimgsm_cot_orm.yaml |generate_until | | |
| |afrimgsm_cot_orm_prompt_5 |lm_eval/tasks/afrimgsm/direct_cot/prompt_5/afrimgsm_cot_orm.yaml |generate_until | | |
| |afrimgsm_cot_sna_prompt_1 |lm_eval/tasks/afrimgsm/direct_cot/prompt_1/afrimgsm_cot_sna.yaml |generate_until | | |
| |afrimgsm_cot_sna_prompt_2 |lm_eval/tasks/afrimgsm/direct_cot/prompt_2/afrimgsm_cot_sna.yaml |generate_until | | |
| |afrimgsm_cot_sna_prompt_3 |lm_eval/tasks/afrimgsm/direct_cot/prompt_3/afrimgsm_cot_sna.yaml |generate_until | | |
| |afrimgsm_cot_sna_prompt_4 |lm_eval/tasks/afrimgsm/direct_cot/prompt_4/afrimgsm_cot_sna.yaml |generate_until | | |
| |afrimgsm_cot_sna_prompt_5 |lm_eval/tasks/afrimgsm/direct_cot/prompt_5/afrimgsm_cot_sna.yaml |generate_until | | |
| |afrimgsm_cot_sot_prompt_1 |lm_eval/tasks/afrimgsm/direct_cot/prompt_1/afrimgsm_cot_sot.yaml |generate_until | | |
| |afrimgsm_cot_sot_prompt_2 |lm_eval/tasks/afrimgsm/direct_cot/prompt_2/afrimgsm_cot_sot.yaml |generate_until | | |
| |afrimgsm_cot_sot_prompt_3 |lm_eval/tasks/afrimgsm/direct_cot/prompt_3/afrimgsm_cot_sot.yaml |generate_until | | |
| |afrimgsm_cot_sot_prompt_4 |lm_eval/tasks/afrimgsm/direct_cot/prompt_4/afrimgsm_cot_sot.yaml |generate_until | | |
| |afrimgsm_cot_sot_prompt_5 |lm_eval/tasks/afrimgsm/direct_cot/prompt_5/afrimgsm_cot_sot.yaml |generate_until | | |
| |afrimgsm_cot_swa_prompt_1 |lm_eval/tasks/afrimgsm/direct_cot/prompt_1/afrimgsm_cot_swa.yaml |generate_until | | |
| |afrimgsm_cot_swa_prompt_2 |lm_eval/tasks/afrimgsm/direct_cot/prompt_2/afrimgsm_cot_swa.yaml |generate_until | | |
| |afrimgsm_cot_swa_prompt_3 |lm_eval/tasks/afrimgsm/direct_cot/prompt_3/afrimgsm_cot_swa.yaml |generate_until | | |
| |afrimgsm_cot_swa_prompt_4 |lm_eval/tasks/afrimgsm/direct_cot/prompt_4/afrimgsm_cot_swa.yaml |generate_until | | |
| |afrimgsm_cot_swa_prompt_5 |lm_eval/tasks/afrimgsm/direct_cot/prompt_5/afrimgsm_cot_swa.yaml |generate_until | | |
| |afrimgsm_cot_translate_amh_prompt_1 |lm_eval/tasks/afrimgsm/translate_cot/prompt_1/afrimgsm_cot_translate_amh.yaml |generate_until | | |
| |afrimgsm_cot_translate_amh_prompt_2 |lm_eval/tasks/afrimgsm/translate_cot/prompt_2/afrimgsm_cot_translate_amh.yaml |generate_until | | |
| |afrimgsm_cot_translate_amh_prompt_3 |lm_eval/tasks/afrimgsm/translate_cot/prompt_3/afrimgsm_cot_translate_amh.yaml |generate_until | | |
| |afrimgsm_cot_translate_amh_prompt_4 |lm_eval/tasks/afrimgsm/translate_cot/prompt_4/afrimgsm_cot_translate_amh.yaml |generate_until | | |
| |afrimgsm_cot_translate_amh_prompt_5 |lm_eval/tasks/afrimgsm/translate_cot/prompt_5/afrimgsm_cot_translate_amh.yaml |generate_until | | |
| |afrimgsm_cot_translate_ewe_prompt_1 |lm_eval/tasks/afrimgsm/translate_cot/prompt_1/afrimgsm_cot_translate_ewe.yaml |generate_until | | |
| |afrimgsm_cot_translate_ewe_prompt_2 |lm_eval/tasks/afrimgsm/translate_cot/prompt_2/afrimgsm_cot_translate_ewe.yaml |generate_until | | |
| |afrimgsm_cot_translate_ewe_prompt_3 |lm_eval/tasks/afrimgsm/translate_cot/prompt_3/afrimgsm_cot_translate_ewe.yaml |generate_until | | |
| |afrimgsm_cot_translate_ewe_prompt_4 |lm_eval/tasks/afrimgsm/translate_cot/prompt_4/afrimgsm_cot_translate_ewe.yaml |generate_until | | |
| |afrimgsm_cot_translate_ewe_prompt_5 |lm_eval/tasks/afrimgsm/translate_cot/prompt_5/afrimgsm_cot_translate_ewe.yaml |generate_until | | |
| |afrimgsm_cot_translate_fra_prompt_1 |lm_eval/tasks/afrimgsm/translate_cot/prompt_1/afrimgsm_cot_translate_fra.yaml |generate_until | | |
| |afrimgsm_cot_translate_fra_prompt_2 |lm_eval/tasks/afrimgsm/translate_cot/prompt_2/afrimgsm_cot_translate_fra.yaml |generate_until | | |
| |afrimgsm_cot_translate_fra_prompt_3 |lm_eval/tasks/afrimgsm/translate_cot/prompt_3/afrimgsm_cot_translate_fra.yaml |generate_until | | |
| |afrimgsm_cot_translate_fra_prompt_4 |lm_eval/tasks/afrimgsm/translate_cot/prompt_4/afrimgsm_cot_translate_fra.yaml |generate_until | | |
| |afrimgsm_cot_translate_fra_prompt_5 |lm_eval/tasks/afrimgsm/translate_cot/prompt_5/afrimgsm_cot_translate_fra.yaml |generate_until | | |
| |afrimgsm_cot_translate_hau_prompt_1 |lm_eval/tasks/afrimgsm/translate_cot/prompt_1/afrimgsm_cot_translate_hau.yaml |generate_until | | |
| |afrimgsm_cot_translate_hau_prompt_2 |lm_eval/tasks/afrimgsm/translate_cot/prompt_2/afrimgsm_cot_translate_hau.yaml |generate_until | | |
| |afrimgsm_cot_translate_hau_prompt_3 |lm_eval/tasks/afrimgsm/translate_cot/prompt_3/afrimgsm_cot_translate_hau.yaml |generate_until | | |
| |afrimgsm_cot_translate_hau_prompt_4 |lm_eval/tasks/afrimgsm/translate_cot/prompt_4/afrimgsm_cot_translate_hau.yaml |generate_until | | |
| |afrimgsm_cot_translate_hau_prompt_5 |lm_eval/tasks/afrimgsm/translate_cot/prompt_5/afrimgsm_cot_translate_hau.yaml |generate_until | | |
| |afrimgsm_cot_translate_ibo_prompt_1 |lm_eval/tasks/afrimgsm/translate_cot/prompt_1/afrimgsm_cot_translate_ibo.yaml |generate_until | | |
| |afrimgsm_cot_translate_ibo_prompt_2 |lm_eval/tasks/afrimgsm/translate_cot/prompt_2/afrimgsm_cot_translate_ibo.yaml |generate_until | | |
| |afrimgsm_cot_translate_ibo_prompt_3 |lm_eval/tasks/afrimgsm/translate_cot/prompt_3/afrimgsm_cot_translate_ibo.yaml |generate_until | | |
| |afrimgsm_cot_translate_ibo_prompt_4 |lm_eval/tasks/afrimgsm/translate_cot/prompt_4/afrimgsm_cot_translate_ibo.yaml |generate_until | | |
| |afrimgsm_cot_translate_ibo_prompt_5 |lm_eval/tasks/afrimgsm/translate_cot/prompt_5/afrimgsm_cot_translate_ibo.yaml |generate_until | | |
| |afrimgsm_cot_translate_kin_prompt_1 |lm_eval/tasks/afrimgsm/translate_cot/prompt_1/afrimgsm_cot_translate_kin.yaml |generate_until | | |
| |afrimgsm_cot_translate_kin_prompt_2 |lm_eval/tasks/afrimgsm/translate_cot/prompt_2/afrimgsm_cot_translate_kin.yaml |generate_until | | |
| |afrimgsm_cot_translate_kin_prompt_3 |lm_eval/tasks/afrimgsm/translate_cot/prompt_3/afrimgsm_cot_translate_kin.yaml |generate_until | | |
| |afrimgsm_cot_translate_kin_prompt_4 |lm_eval/tasks/afrimgsm/translate_cot/prompt_4/afrimgsm_cot_translate_kin.yaml |generate_until | | |
| |afrimgsm_cot_translate_kin_prompt_5 |lm_eval/tasks/afrimgsm/translate_cot/prompt_5/afrimgsm_cot_translate_kin.yaml |generate_until | | |
| |afrimgsm_cot_translate_lin_prompt_1 |lm_eval/tasks/afrimgsm/translate_cot/prompt_1/afrimgsm_cot_translate_lin.yaml |generate_until | | |
| |afrimgsm_cot_translate_lin_prompt_2 |lm_eval/tasks/afrimgsm/translate_cot/prompt_2/afrimgsm_cot_translate_lin.yaml |generate_until | | |
| |afrimgsm_cot_translate_lin_prompt_3 |lm_eval/tasks/afrimgsm/translate_cot/prompt_3/afrimgsm_cot_translate_lin.yaml |generate_until | | |
| |afrimgsm_cot_translate_lin_prompt_4 |lm_eval/tasks/afrimgsm/translate_cot/prompt_4/afrimgsm_cot_translate_lin.yaml |generate_until | | |
| |afrimgsm_cot_translate_lin_prompt_5 |lm_eval/tasks/afrimgsm/translate_cot/prompt_5/afrimgsm_cot_translate_lin.yaml |generate_until | | |
| |afrimgsm_cot_translate_lug_prompt_1 |lm_eval/tasks/afrimgsm/translate_cot/prompt_1/afrimgsm_cot_translate_lug.yaml |generate_until | | |
| |afrimgsm_cot_translate_lug_prompt_2 |lm_eval/tasks/afrimgsm/translate_cot/prompt_2/afrimgsm_cot_translate_lug.yaml |generate_until | | |
| |afrimgsm_cot_translate_lug_prompt_3 |lm_eval/tasks/afrimgsm/translate_cot/prompt_3/afrimgsm_cot_translate_lug.yaml |generate_until | | |
| |afrimgsm_cot_translate_lug_prompt_4 |lm_eval/tasks/afrimgsm/translate_cot/prompt_4/afrimgsm_cot_translate_lug.yaml |generate_until | | |
| |afrimgsm_cot_translate_lug_prompt_5 |lm_eval/tasks/afrimgsm/translate_cot/prompt_5/afrimgsm_cot_translate_lug.yaml |generate_until | | |
| |afrimgsm_cot_translate_orm_prompt_1 |lm_eval/tasks/afrimgsm/translate_cot/prompt_1/afrimgsm_cot_translate_orm.yaml |generate_until | | |
| |afrimgsm_cot_translate_orm_prompt_2 |lm_eval/tasks/afrimgsm/translate_cot/prompt_2/afrimgsm_cot_translate_orm.yaml |generate_until | | |
| |afrimgsm_cot_translate_orm_prompt_3 |lm_eval/tasks/afrimgsm/translate_cot/prompt_3/afrimgsm_cot_translate_orm.yaml |generate_until | | |
| |afrimgsm_cot_translate_orm_prompt_4 |lm_eval/tasks/afrimgsm/translate_cot/prompt_4/afrimgsm_cot_translate_orm.yaml |generate_until | | |
| |afrimgsm_cot_translate_orm_prompt_5 |lm_eval/tasks/afrimgsm/translate_cot/prompt_5/afrimgsm_cot_translate_orm.yaml |generate_until | | |
| |afrimgsm_cot_translate_sna_prompt_1 |lm_eval/tasks/afrimgsm/translate_cot/prompt_1/afrimgsm_cot_translate_sna.yaml |generate_until | | |
| |afrimgsm_cot_translate_sna_prompt_2 |lm_eval/tasks/afrimgsm/translate_cot/prompt_2/afrimgsm_cot_translate_sna.yaml |generate_until | | |
| |afrimgsm_cot_translate_sna_prompt_3 |lm_eval/tasks/afrimgsm/translate_cot/prompt_3/afrimgsm_cot_translate_sna.yaml |generate_until | | |
| |afrimgsm_cot_translate_sna_prompt_4 |lm_eval/tasks/afrimgsm/translate_cot/prompt_4/afrimgsm_cot_translate_sna.yaml |generate_until | | |
| |afrimgsm_cot_translate_sna_prompt_5 |lm_eval/tasks/afrimgsm/translate_cot/prompt_5/afrimgsm_cot_translate_sna.yaml |generate_until | | |
| |afrimgsm_cot_translate_sot_prompt_1 |lm_eval/tasks/afrimgsm/translate_cot/prompt_1/afrimgsm_cot_translate_sot.yaml |generate_until | | |
| |afrimgsm_cot_translate_sot_prompt_2 |lm_eval/tasks/afrimgsm/translate_cot/prompt_2/afrimgsm_cot_translate_sot.yaml |generate_until | | |
| |afrimgsm_cot_translate_sot_prompt_3 |lm_eval/tasks/afrimgsm/translate_cot/prompt_3/afrimgsm_cot_translate_sot.yaml |generate_until | | |
| |afrimgsm_cot_translate_sot_prompt_4 |lm_eval/tasks/afrimgsm/translate_cot/prompt_4/afrimgsm_cot_translate_sot.yaml |generate_until | | |
| |afrimgsm_cot_translate_sot_prompt_5 |lm_eval/tasks/afrimgsm/translate_cot/prompt_5/afrimgsm_cot_translate_sot.yaml |generate_until | | |
| |afrimgsm_cot_translate_swa_prompt_1 |lm_eval/tasks/afrimgsm/translate_cot/prompt_1/afrimgsm_cot_translate_swa.yaml |generate_until | | |
| |afrimgsm_cot_translate_swa_prompt_2 |lm_eval/tasks/afrimgsm/translate_cot/prompt_2/afrimgsm_cot_translate_swa.yaml |generate_until | | |
| |afrimgsm_cot_translate_swa_prompt_3 |lm_eval/tasks/afrimgsm/translate_cot/prompt_3/afrimgsm_cot_translate_swa.yaml |generate_until | | |
| |afrimgsm_cot_translate_swa_prompt_4 |lm_eval/tasks/afrimgsm/translate_cot/prompt_4/afrimgsm_cot_translate_swa.yaml |generate_until | | |
| |afrimgsm_cot_translate_swa_prompt_5 |lm_eval/tasks/afrimgsm/translate_cot/prompt_5/afrimgsm_cot_translate_swa.yaml |generate_until | | |
| |afrimgsm_cot_translate_twi_prompt_1 |lm_eval/tasks/afrimgsm/translate_cot/prompt_1/afrimgsm_cot_translate_twi.yaml |generate_until | | |
| |afrimgsm_cot_translate_twi_prompt_2 |lm_eval/tasks/afrimgsm/translate_cot/prompt_2/afrimgsm_cot_translate_twi.yaml |generate_until | | |
| |afrimgsm_cot_translate_twi_prompt_3 |lm_eval/tasks/afrimgsm/translate_cot/prompt_3/afrimgsm_cot_translate_twi.yaml |generate_until | | |
| |afrimgsm_cot_translate_twi_prompt_4 |lm_eval/tasks/afrimgsm/translate_cot/prompt_4/afrimgsm_cot_translate_twi.yaml |generate_until | | |
| |afrimgsm_cot_translate_twi_prompt_5 |lm_eval/tasks/afrimgsm/translate_cot/prompt_5/afrimgsm_cot_translate_twi.yaml |generate_until | | |
| |afrimgsm_cot_translate_vai_prompt_1 |lm_eval/tasks/afrimgsm/translate_cot/prompt_1/afrimgsm_cot_translate_vai.yaml |generate_until | | |
| |afrimgsm_cot_translate_vai_prompt_2 |lm_eval/tasks/afrimgsm/translate_cot/prompt_2/afrimgsm_cot_translate_vai.yaml |generate_until | | |
| |afrimgsm_cot_translate_vai_prompt_3 |lm_eval/tasks/afrimgsm/translate_cot/prompt_3/afrimgsm_cot_translate_vai.yaml |generate_until | | |
| |afrimgsm_cot_translate_vai_prompt_4 |lm_eval/tasks/afrimgsm/translate_cot/prompt_4/afrimgsm_cot_translate_vai.yaml |generate_until | | |
| |afrimgsm_cot_translate_vai_prompt_5 |lm_eval/tasks/afrimgsm/translate_cot/prompt_5/afrimgsm_cot_translate_vai.yaml |generate_until | | |
| |afrimgsm_cot_translate_wol_prompt_1 |lm_eval/tasks/afrimgsm/translate_cot/prompt_1/afrimgsm_cot_translate_wol.yaml |generate_until | | |
| |afrimgsm_cot_translate_wol_prompt_2 |lm_eval/tasks/afrimgsm/translate_cot/prompt_2/afrimgsm_cot_translate_wol.yaml |generate_until | | |
| |afrimgsm_cot_translate_wol_prompt_3 |lm_eval/tasks/afrimgsm/translate_cot/prompt_3/afrimgsm_cot_translate_wol.yaml |generate_until | | |
| |afrimgsm_cot_translate_wol_prompt_4 |lm_eval/tasks/afrimgsm/translate_cot/prompt_4/afrimgsm_cot_translate_wol.yaml |generate_until | | |
| |afrimgsm_cot_translate_wol_prompt_5 |lm_eval/tasks/afrimgsm/translate_cot/prompt_5/afrimgsm_cot_translate_wol.yaml |generate_until | | |
| |afrimgsm_cot_translate_xho_prompt_1 |lm_eval/tasks/afrimgsm/translate_cot/prompt_1/afrimgsm_cot_translate_xho.yaml |generate_until | | |
| |afrimgsm_cot_translate_xho_prompt_2 |lm_eval/tasks/afrimgsm/translate_cot/prompt_2/afrimgsm_cot_translate_xho.yaml |generate_until | | |
| |afrimgsm_cot_translate_xho_prompt_3 |lm_eval/tasks/afrimgsm/translate_cot/prompt_3/afrimgsm_cot_translate_xho.yaml |generate_until | | |
| |afrimgsm_cot_translate_xho_prompt_4 |lm_eval/tasks/afrimgsm/translate_cot/prompt_4/afrimgsm_cot_translate_xho.yaml |generate_until | | |
| |afrimgsm_cot_translate_xho_prompt_5 |lm_eval/tasks/afrimgsm/translate_cot/prompt_5/afrimgsm_cot_translate_xho.yaml |generate_until | | |
| |afrimgsm_cot_translate_yor_prompt_1 |lm_eval/tasks/afrimgsm/translate_cot/prompt_1/afrimgsm_cot_translate_yor.yaml |generate_until | | |
| |afrimgsm_cot_translate_yor_prompt_2 |lm_eval/tasks/afrimgsm/translate_cot/prompt_2/afrimgsm_cot_translate_yor.yaml |generate_until | | |
| |afrimgsm_cot_translate_yor_prompt_3 |lm_eval/tasks/afrimgsm/translate_cot/prompt_3/afrimgsm_cot_translate_yor.yaml |generate_until | | |
| |afrimgsm_cot_translate_yor_prompt_4 |lm_eval/tasks/afrimgsm/translate_cot/prompt_4/afrimgsm_cot_translate_yor.yaml |generate_until | | |
| |afrimgsm_cot_translate_yor_prompt_5 |lm_eval/tasks/afrimgsm/translate_cot/prompt_5/afrimgsm_cot_translate_yor.yaml |generate_until | | |
| |afrimgsm_cot_translate_zul_prompt_1 |lm_eval/tasks/afrimgsm/translate_cot/prompt_1/afrimgsm_cot_translate_zul.yaml |generate_until | | |
| |afrimgsm_cot_translate_zul_prompt_2 |lm_eval/tasks/afrimgsm/translate_cot/prompt_2/afrimgsm_cot_translate_zul.yaml |generate_until | | |
| |afrimgsm_cot_translate_zul_prompt_3 |lm_eval/tasks/afrimgsm/translate_cot/prompt_3/afrimgsm_cot_translate_zul.yaml |generate_until | | |
| |afrimgsm_cot_translate_zul_prompt_4 |lm_eval/tasks/afrimgsm/translate_cot/prompt_4/afrimgsm_cot_translate_zul.yaml |generate_until | | |
| |afrimgsm_cot_translate_zul_prompt_5 |lm_eval/tasks/afrimgsm/translate_cot/prompt_5/afrimgsm_cot_translate_zul.yaml |generate_until | | |
| |afrimgsm_cot_twi_prompt_1 |lm_eval/tasks/afrimgsm/direct_cot/prompt_1/afrimgsm_cot_twi.yaml |generate_until | | |
| |afrimgsm_cot_twi_prompt_2 |lm_eval/tasks/afrimgsm/direct_cot/prompt_2/afrimgsm_cot_twi.yaml |generate_until | | |
| |afrimgsm_cot_twi_prompt_3 |lm_eval/tasks/afrimgsm/direct_cot/prompt_3/afrimgsm_cot_twi.yaml |generate_until | | |
| |afrimgsm_cot_twi_prompt_4 |lm_eval/tasks/afrimgsm/direct_cot/prompt_4/afrimgsm_cot_twi.yaml |generate_until | | |
| |afrimgsm_cot_twi_prompt_5 |lm_eval/tasks/afrimgsm/direct_cot/prompt_5/afrimgsm_cot_twi.yaml |generate_until | | |
| |afrimgsm_cot_vai_prompt_1 |lm_eval/tasks/afrimgsm/direct_cot/prompt_1/afrimgsm_cot_vai.yaml |generate_until | | |
| |afrimgsm_cot_vai_prompt_2 |lm_eval/tasks/afrimgsm/direct_cot/prompt_2/afrimgsm_cot_vai.yaml |generate_until | | |
| |afrimgsm_cot_vai_prompt_3 |lm_eval/tasks/afrimgsm/direct_cot/prompt_3/afrimgsm_cot_vai.yaml |generate_until | | |
| |afrimgsm_cot_vai_prompt_4 |lm_eval/tasks/afrimgsm/direct_cot/prompt_4/afrimgsm_cot_vai.yaml |generate_until | | |
| |afrimgsm_cot_vai_prompt_5 |lm_eval/tasks/afrimgsm/direct_cot/prompt_5/afrimgsm_cot_vai.yaml |generate_until | | |
| |afrimgsm_cot_wol_prompt_1 |lm_eval/tasks/afrimgsm/direct_cot/prompt_1/afrimgsm_cot_wol.yaml |generate_until | | |
| |afrimgsm_cot_wol_prompt_2 |lm_eval/tasks/afrimgsm/direct_cot/prompt_2/afrimgsm_cot_wol.yaml |generate_until | | |
| |afrimgsm_cot_wol_prompt_3 |lm_eval/tasks/afrimgsm/direct_cot/prompt_3/afrimgsm_cot_wol.yaml |generate_until | | |
| |afrimgsm_cot_wol_prompt_4 |lm_eval/tasks/afrimgsm/direct_cot/prompt_4/afrimgsm_cot_wol.yaml |generate_until | | |
| |afrimgsm_cot_wol_prompt_5 |lm_eval/tasks/afrimgsm/direct_cot/prompt_5/afrimgsm_cot_wol.yaml |generate_until | | |
| |afrimgsm_cot_xho_prompt_1 |lm_eval/tasks/afrimgsm/direct_cot/prompt_1/afrimgsm_cot_xho.yaml |generate_until | | |
| |afrimgsm_cot_xho_prompt_2 |lm_eval/tasks/afrimgsm/direct_cot/prompt_2/afrimgsm_cot_xho.yaml |generate_until | | |
| |afrimgsm_cot_xho_prompt_3 |lm_eval/tasks/afrimgsm/direct_cot/prompt_3/afrimgsm_cot_xho.yaml |generate_until | | |
| |afrimgsm_cot_xho_prompt_4 |lm_eval/tasks/afrimgsm/direct_cot/prompt_4/afrimgsm_cot_xho.yaml |generate_until | | |
| |afrimgsm_cot_xho_prompt_5 |lm_eval/tasks/afrimgsm/direct_cot/prompt_5/afrimgsm_cot_xho.yaml |generate_until | | |
| |afrimgsm_cot_yor_prompt_1 |lm_eval/tasks/afrimgsm/direct_cot/prompt_1/afrimgsm_cot_yor.yaml |generate_until | | |
| |afrimgsm_cot_yor_prompt_2 |lm_eval/tasks/afrimgsm/direct_cot/prompt_2/afrimgsm_cot_yor.yaml |generate_until | | |
| |afrimgsm_cot_yor_prompt_3 |lm_eval/tasks/afrimgsm/direct_cot/prompt_3/afrimgsm_cot_yor.yaml |generate_until | | |
| |afrimgsm_cot_yor_prompt_4 |lm_eval/tasks/afrimgsm/direct_cot/prompt_4/afrimgsm_cot_yor.yaml |generate_until | | |
| |afrimgsm_cot_yor_prompt_5 |lm_eval/tasks/afrimgsm/direct_cot/prompt_5/afrimgsm_cot_yor.yaml |generate_until | | |
| |afrimgsm_cot_zul_prompt_1 |lm_eval/tasks/afrimgsm/direct_cot/prompt_1/afrimgsm_cot_zul.yaml |generate_until | | |
| |afrimgsm_cot_zul_prompt_2 |lm_eval/tasks/afrimgsm/direct_cot/prompt_2/afrimgsm_cot_zul.yaml |generate_until | | |
| |afrimgsm_cot_zul_prompt_3 |lm_eval/tasks/afrimgsm/direct_cot/prompt_3/afrimgsm_cot_zul.yaml |generate_until | | |
| |afrimgsm_cot_zul_prompt_4 |lm_eval/tasks/afrimgsm/direct_cot/prompt_4/afrimgsm_cot_zul.yaml |generate_until | | |
| |afrimgsm_cot_zul_prompt_5 |lm_eval/tasks/afrimgsm/direct_cot/prompt_5/afrimgsm_cot_zul.yaml |generate_until | | |
| |afrimgsm_eng_prompt_1 |lm_eval/tasks/afrimgsm/direct/prompt_1/afrimgsm_eng.yaml |generate_until | | |
| |afrimgsm_eng_prompt_2 |lm_eval/tasks/afrimgsm/direct/prompt_2/afrimgsm_eng.yaml |generate_until | | |
| |afrimgsm_eng_prompt_3 |lm_eval/tasks/afrimgsm/direct/prompt_3/afrimgsm_eng.yaml |generate_until | | |
| |afrimgsm_eng_prompt_4 |lm_eval/tasks/afrimgsm/direct/prompt_4/afrimgsm_eng.yaml |generate_until | | |
| |afrimgsm_eng_prompt_5 |lm_eval/tasks/afrimgsm/direct/prompt_5/afrimgsm_eng.yaml |generate_until | | |
| |afrimgsm_ewe_prompt_1 |lm_eval/tasks/afrimgsm/direct/prompt_1/afrimgsm_ewe.yaml |generate_until | | |
| |afrimgsm_ewe_prompt_2 |lm_eval/tasks/afrimgsm/direct/prompt_2/afrimgsm_ewe.yaml |generate_until | | |
| |afrimgsm_ewe_prompt_3 |lm_eval/tasks/afrimgsm/direct/prompt_3/afrimgsm_ewe.yaml |generate_until | | |
| |afrimgsm_ewe_prompt_4 |lm_eval/tasks/afrimgsm/direct/prompt_4/afrimgsm_ewe.yaml |generate_until | | |
| |afrimgsm_ewe_prompt_5 |lm_eval/tasks/afrimgsm/direct/prompt_5/afrimgsm_ewe.yaml |generate_until | | |
| |afrimgsm_fra_prompt_1 |lm_eval/tasks/afrimgsm/direct/prompt_1/afrimgsm_fra.yaml |generate_until | | |
| |afrimgsm_fra_prompt_2 |lm_eval/tasks/afrimgsm/direct/prompt_2/afrimgsm_fra.yaml |generate_until | | |
| |afrimgsm_fra_prompt_3 |lm_eval/tasks/afrimgsm/direct/prompt_3/afrimgsm_fra.yaml |generate_until | | |
| |afrimgsm_fra_prompt_4 |lm_eval/tasks/afrimgsm/direct/prompt_4/afrimgsm_fra.yaml |generate_until | | |
| |afrimgsm_fra_prompt_5 |lm_eval/tasks/afrimgsm/direct/prompt_5/afrimgsm_fra.yaml |generate_until | | |
| |afrimgsm_hau_prompt_1 |lm_eval/tasks/afrimgsm/direct/prompt_1/afrimgsm_hau.yaml |generate_until | | |
| |afrimgsm_hau_prompt_2 |lm_eval/tasks/afrimgsm/direct/prompt_2/afrimgsm_hau.yaml |generate_until | | |
| |afrimgsm_hau_prompt_3 |lm_eval/tasks/afrimgsm/direct/prompt_3/afrimgsm_hau.yaml |generate_until | | |
| |afrimgsm_hau_prompt_4 |lm_eval/tasks/afrimgsm/direct/prompt_4/afrimgsm_hau.yaml |generate_until | | |
| |afrimgsm_hau_prompt_5 |lm_eval/tasks/afrimgsm/direct/prompt_5/afrimgsm_hau.yaml |generate_until | | |
| |afrimgsm_ibo_prompt_1 |lm_eval/tasks/afrimgsm/direct/prompt_1/afrimgsm_ibo.yaml |generate_until | | |
| |afrimgsm_ibo_prompt_2 |lm_eval/tasks/afrimgsm/direct/prompt_2/afrimgsm_ibo.yaml |generate_until | | |
| |afrimgsm_ibo_prompt_3 |lm_eval/tasks/afrimgsm/direct/prompt_3/afrimgsm_ibo.yaml |generate_until | | |
| |afrimgsm_ibo_prompt_4 |lm_eval/tasks/afrimgsm/direct/prompt_4/afrimgsm_ibo.yaml |generate_until | | |
| |afrimgsm_ibo_prompt_5 |lm_eval/tasks/afrimgsm/direct/prompt_5/afrimgsm_ibo.yaml |generate_until | | |
| |afrimgsm_kin_prompt_1 |lm_eval/tasks/afrimgsm/direct/prompt_1/afrimgsm_kin.yaml |generate_until | | |
| |afrimgsm_kin_prompt_2 |lm_eval/tasks/afrimgsm/direct/prompt_2/afrimgsm_kin.yaml |generate_until | | |
| |afrimgsm_kin_prompt_3 |lm_eval/tasks/afrimgsm/direct/prompt_3/afrimgsm_kin.yaml |generate_until | | |
| |afrimgsm_kin_prompt_4 |lm_eval/tasks/afrimgsm/direct/prompt_4/afrimgsm_kin.yaml |generate_until | | |
| |afrimgsm_kin_prompt_5 |lm_eval/tasks/afrimgsm/direct/prompt_5/afrimgsm_kin.yaml |generate_until | | |
| |afrimgsm_lin_prompt_1 |lm_eval/tasks/afrimgsm/direct/prompt_1/afrimgsm_lin.yaml |generate_until | | |
| |afrimgsm_lin_prompt_2 |lm_eval/tasks/afrimgsm/direct/prompt_2/afrimgsm_lin.yaml |generate_until | | |
| |afrimgsm_lin_prompt_3 |lm_eval/tasks/afrimgsm/direct/prompt_3/afrimgsm_lin.yaml |generate_until | | |
| |afrimgsm_lin_prompt_4 |lm_eval/tasks/afrimgsm/direct/prompt_4/afrimgsm_lin.yaml |generate_until | | |
| |afrimgsm_lin_prompt_5 |lm_eval/tasks/afrimgsm/direct/prompt_5/afrimgsm_lin.yaml |generate_until | | |
| |afrimgsm_lug_prompt_1 |lm_eval/tasks/afrimgsm/direct/prompt_1/afrimgsm_lug.yaml |generate_until | | |
| |afrimgsm_lug_prompt_2 |lm_eval/tasks/afrimgsm/direct/prompt_2/afrimgsm_lug.yaml |generate_until | | |
| |afrimgsm_lug_prompt_3 |lm_eval/tasks/afrimgsm/direct/prompt_3/afrimgsm_lug.yaml |generate_until | | |
| |afrimgsm_lug_prompt_4 |lm_eval/tasks/afrimgsm/direct/prompt_4/afrimgsm_lug.yaml |generate_until | | |
| |afrimgsm_lug_prompt_5 |lm_eval/tasks/afrimgsm/direct/prompt_5/afrimgsm_lug.yaml |generate_until | | |
| |afrimgsm_orm_prompt_1 |lm_eval/tasks/afrimgsm/direct/prompt_1/afrimgsm_orm.yaml |generate_until | | |
| |afrimgsm_orm_prompt_2 |lm_eval/tasks/afrimgsm/direct/prompt_2/afrimgsm_orm.yaml |generate_until | | |
| |afrimgsm_orm_prompt_3 |lm_eval/tasks/afrimgsm/direct/prompt_3/afrimgsm_orm.yaml |generate_until | | |
| |afrimgsm_orm_prompt_4 |lm_eval/tasks/afrimgsm/direct/prompt_4/afrimgsm_orm.yaml |generate_until | | |
| |afrimgsm_orm_prompt_5 |lm_eval/tasks/afrimgsm/direct/prompt_5/afrimgsm_orm.yaml |generate_until | | |
| |afrimgsm_sna_prompt_1 |lm_eval/tasks/afrimgsm/direct/prompt_1/afrimgsm_sna.yaml |generate_until | | |
| |afrimgsm_sna_prompt_2 |lm_eval/tasks/afrimgsm/direct/prompt_2/afrimgsm_sna.yaml |generate_until | | |
| |afrimgsm_sna_prompt_3 |lm_eval/tasks/afrimgsm/direct/prompt_3/afrimgsm_sna.yaml |generate_until | | |
| |afrimgsm_sna_prompt_4 |lm_eval/tasks/afrimgsm/direct/prompt_4/afrimgsm_sna.yaml |generate_until | | |
| |afrimgsm_sna_prompt_5 |lm_eval/tasks/afrimgsm/direct/prompt_5/afrimgsm_sna.yaml |generate_until | | |
| |afrimgsm_sot_prompt_1 |lm_eval/tasks/afrimgsm/direct/prompt_1/afrimgsm_sot.yaml |generate_until | | |
| |afrimgsm_sot_prompt_2 |lm_eval/tasks/afrimgsm/direct/prompt_2/afrimgsm_sot.yaml |generate_until | | |
| |afrimgsm_sot_prompt_3 |lm_eval/tasks/afrimgsm/direct/prompt_3/afrimgsm_sot.yaml |generate_until | | |
| |afrimgsm_sot_prompt_4 |lm_eval/tasks/afrimgsm/direct/prompt_4/afrimgsm_sot.yaml |generate_until | | |
| |afrimgsm_sot_prompt_5 |lm_eval/tasks/afrimgsm/direct/prompt_5/afrimgsm_sot.yaml |generate_until | | |
| |afrimgsm_swa_prompt_1 |lm_eval/tasks/afrimgsm/direct/prompt_1/afrimgsm_swa.yaml |generate_until | | |
| |afrimgsm_swa_prompt_2 |lm_eval/tasks/afrimgsm/direct/prompt_2/afrimgsm_swa.yaml |generate_until | | |
| |afrimgsm_swa_prompt_3 |lm_eval/tasks/afrimgsm/direct/prompt_3/afrimgsm_swa.yaml |generate_until | | |
| |afrimgsm_swa_prompt_4 |lm_eval/tasks/afrimgsm/direct/prompt_4/afrimgsm_swa.yaml |generate_until | | |
| |afrimgsm_swa_prompt_5 |lm_eval/tasks/afrimgsm/direct/prompt_5/afrimgsm_swa.yaml |generate_until | | |
| |afrimgsm_translate_amh_prompt_1 |lm_eval/tasks/afrimgsm/translate/prompt_1/afrimgsm_translate_amh.yaml |generate_until | | |
| |afrimgsm_translate_amh_prompt_2 |lm_eval/tasks/afrimgsm/translate/prompt_2/afrimgsm_translate_amh.yaml |generate_until | | |
| |afrimgsm_translate_amh_prompt_3 |lm_eval/tasks/afrimgsm/translate/prompt_3/afrimgsm_translate_amh.yaml |generate_until | | |
| |afrimgsm_translate_amh_prompt_4 |lm_eval/tasks/afrimgsm/translate/prompt_4/afrimgsm_translate_amh.yaml |generate_until | | |
| |afrimgsm_translate_amh_prompt_5 |lm_eval/tasks/afrimgsm/translate/prompt_5/afrimgsm_translate_amh.yaml |generate_until | | |
| |afrimgsm_translate_ewe_prompt_1 |lm_eval/tasks/afrimgsm/translate/prompt_1/afrimgsm_translate_ewe.yaml |generate_until | | |
| |afrimgsm_translate_ewe_prompt_2 |lm_eval/tasks/afrimgsm/translate/prompt_2/afrimgsm_translate_ewe.yaml |generate_until | | |
| |afrimgsm_translate_ewe_prompt_3 |lm_eval/tasks/afrimgsm/translate/prompt_3/afrimgsm_translate_ewe.yaml |generate_until | | |
| |afrimgsm_translate_ewe_prompt_4 |lm_eval/tasks/afrimgsm/translate/prompt_4/afrimgsm_translate_ewe.yaml |generate_until | | |
| |afrimgsm_translate_ewe_prompt_5 |lm_eval/tasks/afrimgsm/translate/prompt_5/afrimgsm_translate_ewe.yaml |generate_until | | |
| |afrimgsm_translate_fra_prompt_1 |lm_eval/tasks/afrimgsm/translate/prompt_1/afrimgsm_translate_fra.yaml |generate_until | | |
| |afrimgsm_translate_fra_prompt_2 |lm_eval/tasks/afrimgsm/translate/prompt_2/afrimgsm_translate_fra.yaml |generate_until | | |
| |afrimgsm_translate_fra_prompt_3 |lm_eval/tasks/afrimgsm/translate/prompt_3/afrimgsm_translate_fra.yaml |generate_until | | |
| |afrimgsm_translate_fra_prompt_4 |lm_eval/tasks/afrimgsm/translate/prompt_4/afrimgsm_translate_fra.yaml |generate_until | | |
| |afrimgsm_translate_fra_prompt_5 |lm_eval/tasks/afrimgsm/translate/prompt_5/afrimgsm_translate_fra.yaml |generate_until | | |
| |afrimgsm_translate_hau_prompt_1 |lm_eval/tasks/afrimgsm/translate/prompt_1/afrimgsm_translate_hau.yaml |generate_until | | |
| |afrimgsm_translate_hau_prompt_2 |lm_eval/tasks/afrimgsm/translate/prompt_2/afrimgsm_translate_hau.yaml |generate_until | | |
| |afrimgsm_translate_hau_prompt_3 |lm_eval/tasks/afrimgsm/translate/prompt_3/afrimgsm_translate_hau.yaml |generate_until | | |
| |afrimgsm_translate_hau_prompt_4 |lm_eval/tasks/afrimgsm/translate/prompt_4/afrimgsm_translate_hau.yaml |generate_until | | |
| |afrimgsm_translate_hau_prompt_5 |lm_eval/tasks/afrimgsm/translate/prompt_5/afrimgsm_translate_hau.yaml |generate_until | | |
| |afrimgsm_translate_ibo_prompt_1 |lm_eval/tasks/afrimgsm/translate/prompt_1/afrimgsm_translate_ibo.yaml |generate_until | | |
| |afrimgsm_translate_ibo_prompt_2 |lm_eval/tasks/afrimgsm/translate/prompt_2/afrimgsm_translate_ibo.yaml |generate_until | | |
| |afrimgsm_translate_ibo_prompt_3 |lm_eval/tasks/afrimgsm/translate/prompt_3/afrimgsm_translate_ibo.yaml |generate_until | | |
| |afrimgsm_translate_ibo_prompt_4 |lm_eval/tasks/afrimgsm/translate/prompt_4/afrimgsm_translate_ibo.yaml |generate_until | | |
| |afrimgsm_translate_ibo_prompt_5 |lm_eval/tasks/afrimgsm/translate/prompt_5/afrimgsm_translate_ibo.yaml |generate_until | | |
| |afrimgsm_translate_kin_prompt_1 |lm_eval/tasks/afrimgsm/translate/prompt_1/afrimgsm_translate_kin.yaml |generate_until | | |
| |afrimgsm_translate_kin_prompt_2 |lm_eval/tasks/afrimgsm/translate/prompt_2/afrimgsm_translate_kin.yaml |generate_until | | |
| |afrimgsm_translate_kin_prompt_3 |lm_eval/tasks/afrimgsm/translate/prompt_3/afrimgsm_translate_kin.yaml |generate_until | | |
| |afrimgsm_translate_kin_prompt_4 |lm_eval/tasks/afrimgsm/translate/prompt_4/afrimgsm_translate_kin.yaml |generate_until | | |
| |afrimgsm_translate_kin_prompt_5 |lm_eval/tasks/afrimgsm/translate/prompt_5/afrimgsm_translate_kin.yaml |generate_until | | |
| |afrimgsm_translate_lin_prompt_1 |lm_eval/tasks/afrimgsm/translate/prompt_1/afrimgsm_translate_lin.yaml |generate_until | | |
| |afrimgsm_translate_lin_prompt_2 |lm_eval/tasks/afrimgsm/translate/prompt_2/afrimgsm_translate_lin.yaml |generate_until | | |
| |afrimgsm_translate_lin_prompt_3 |lm_eval/tasks/afrimgsm/translate/prompt_3/afrimgsm_translate_lin.yaml |generate_until | | |
| |afrimgsm_translate_lin_prompt_4 |lm_eval/tasks/afrimgsm/translate/prompt_4/afrimgsm_translate_lin.yaml |generate_until | | |
| |afrimgsm_translate_lin_prompt_5 |lm_eval/tasks/afrimgsm/translate/prompt_5/afrimgsm_translate_lin.yaml |generate_until | | |
| |afrimgsm_translate_lug_prompt_1 |lm_eval/tasks/afrimgsm/translate/prompt_1/afrimgsm_translate_lug.yaml |generate_until | | |
| |afrimgsm_translate_lug_prompt_2 |lm_eval/tasks/afrimgsm/translate/prompt_2/afrimgsm_translate_lug.yaml |generate_until | | |
| |afrimgsm_translate_lug_prompt_3 |lm_eval/tasks/afrimgsm/translate/prompt_3/afrimgsm_translate_lug.yaml |generate_until | | |
| |afrimgsm_translate_lug_prompt_4 |lm_eval/tasks/afrimgsm/translate/prompt_4/afrimgsm_translate_lug.yaml |generate_until | | |
| |afrimgsm_translate_lug_prompt_5 |lm_eval/tasks/afrimgsm/translate/prompt_5/afrimgsm_translate_lug.yaml |generate_until | | |
| |afrimgsm_translate_orm_prompt_1 |lm_eval/tasks/afrimgsm/translate/prompt_1/afrimgsm_translate_orm.yaml |generate_until | | |
| |afrimgsm_translate_orm_prompt_2 |lm_eval/tasks/afrimgsm/translate/prompt_2/afrimgsm_translate_orm.yaml |generate_until | | |
| |afrimgsm_translate_orm_prompt_3 |lm_eval/tasks/afrimgsm/translate/prompt_3/afrimgsm_translate_orm.yaml |generate_until | | |
| |afrimgsm_translate_orm_prompt_4 |lm_eval/tasks/afrimgsm/translate/prompt_4/afrimgsm_translate_orm.yaml |generate_until | | |
| |afrimgsm_translate_orm_prompt_5 |lm_eval/tasks/afrimgsm/translate/prompt_5/afrimgsm_translate_orm.yaml |generate_until | | |
| |afrimgsm_translate_sna_prompt_1 |lm_eval/tasks/afrimgsm/translate/prompt_1/afrimgsm_translate_sna.yaml |generate_until | | |
| |afrimgsm_translate_sna_prompt_2 |lm_eval/tasks/afrimgsm/translate/prompt_2/afrimgsm_translate_sna.yaml |generate_until | | |
| |afrimgsm_translate_sna_prompt_3 |lm_eval/tasks/afrimgsm/translate/prompt_3/afrimgsm_translate_sna.yaml |generate_until | | |
| |afrimgsm_translate_sna_prompt_4 |lm_eval/tasks/afrimgsm/translate/prompt_4/afrimgsm_translate_sna.yaml |generate_until | | |
| |afrimgsm_translate_sna_prompt_5 |lm_eval/tasks/afrimgsm/translate/prompt_5/afrimgsm_translate_sna.yaml |generate_until | | |
| |afrimgsm_translate_sot_prompt_1 |lm_eval/tasks/afrimgsm/translate/prompt_1/afrimgsm_translate_sot.yaml |generate_until | | |
| |afrimgsm_translate_sot_prompt_2 |lm_eval/tasks/afrimgsm/translate/prompt_2/afrimgsm_translate_sot.yaml |generate_until | | |
| |afrimgsm_translate_sot_prompt_3 |lm_eval/tasks/afrimgsm/translate/prompt_3/afrimgsm_translate_sot.yaml |generate_until | | |
| |afrimgsm_translate_sot_prompt_4 |lm_eval/tasks/afrimgsm/translate/prompt_4/afrimgsm_translate_sot.yaml |generate_until | | |
| |afrimgsm_translate_sot_prompt_5 |lm_eval/tasks/afrimgsm/translate/prompt_5/afrimgsm_translate_sot.yaml |generate_until | | |
| |afrimgsm_translate_swa_prompt_1 |lm_eval/tasks/afrimgsm/translate/prompt_1/afrimgsm_translate_swa.yaml |generate_until | | |
| |afrimgsm_translate_swa_prompt_2 |lm_eval/tasks/afrimgsm/translate/prompt_2/afrimgsm_translate_swa.yaml |generate_until | | |
| |afrimgsm_translate_swa_prompt_3 |lm_eval/tasks/afrimgsm/translate/prompt_3/afrimgsm_translate_swa.yaml |generate_until | | |
| |afrimgsm_translate_swa_prompt_4 |lm_eval/tasks/afrimgsm/translate/prompt_4/afrimgsm_translate_swa.yaml |generate_until | | |
| |afrimgsm_translate_swa_prompt_5 |lm_eval/tasks/afrimgsm/translate/prompt_5/afrimgsm_translate_swa.yaml |generate_until | | |
| |afrimgsm_translate_twi_prompt_1 |lm_eval/tasks/afrimgsm/translate/prompt_1/afrimgsm_translate_twi.yaml |generate_until | | |
| |afrimgsm_translate_twi_prompt_2 |lm_eval/tasks/afrimgsm/translate/prompt_2/afrimgsm_translate_twi.yaml |generate_until | | |
| |afrimgsm_translate_twi_prompt_3 |lm_eval/tasks/afrimgsm/translate/prompt_3/afrimgsm_translate_twi.yaml |generate_until | | |
| |afrimgsm_translate_twi_prompt_4 |lm_eval/tasks/afrimgsm/translate/prompt_4/afrimgsm_translate_twi.yaml |generate_until | | |
| |afrimgsm_translate_twi_prompt_5 |lm_eval/tasks/afrimgsm/translate/prompt_5/afrimgsm_translate_twi.yaml |generate_until | | |
| |afrimgsm_translate_wol_prompt_1 |lm_eval/tasks/afrimgsm/translate/prompt_1/afrimgsm_translate_wol.yaml |generate_until | | |
| |afrimgsm_translate_wol_prompt_2 |lm_eval/tasks/afrimgsm/translate/prompt_2/afrimgsm_translate_wol.yaml |generate_until | | |
| |afrimgsm_translate_wol_prompt_3 |lm_eval/tasks/afrimgsm/translate/prompt_3/afrimgsm_translate_wol.yaml |generate_until | | |
| |afrimgsm_translate_wol_prompt_4 |lm_eval/tasks/afrimgsm/translate/prompt_4/afrimgsm_translate_wol.yaml |generate_until | | |
| |afrimgsm_translate_wol_prompt_5 |lm_eval/tasks/afrimgsm/translate/prompt_5/afrimgsm_translate_wol.yaml |generate_until | | |
| |afrimgsm_translate_xho_prompt_1 |lm_eval/tasks/afrimgsm/translate/prompt_1/afrimgsm_translate_xho.yaml |generate_until | | |
| |afrimgsm_translate_xho_prompt_2 |lm_eval/tasks/afrimgsm/translate/prompt_2/afrimgsm_translate_xho.yaml |generate_until | | |
| |afrimgsm_translate_xho_prompt_3 |lm_eval/tasks/afrimgsm/translate/prompt_3/afrimgsm_translate_xho.yaml |generate_until | | |
| |afrimgsm_translate_xho_prompt_4 |lm_eval/tasks/afrimgsm/translate/prompt_4/afrimgsm_translate_xho.yaml |generate_until | | |
| |afrimgsm_translate_xho_prompt_5 |lm_eval/tasks/afrimgsm/translate/prompt_5/afrimgsm_translate_xho.yaml |generate_until | | |
| |afrimgsm_translate_yor_prompt_1 |lm_eval/tasks/afrimgsm/translate/prompt_1/afrimgsm_translate_yor.yaml |generate_until | | |
| |afrimgsm_translate_yor_prompt_2 |lm_eval/tasks/afrimgsm/translate/prompt_2/afrimgsm_translate_yor.yaml |generate_until | | |
| |afrimgsm_translate_yor_prompt_3 |lm_eval/tasks/afrimgsm/translate/prompt_3/afrimgsm_translate_yor.yaml |generate_until | | |
| |afrimgsm_translate_yor_prompt_4 |lm_eval/tasks/afrimgsm/translate/prompt_4/afrimgsm_translate_yor.yaml |generate_until | | |
| |afrimgsm_translate_yor_prompt_5 |lm_eval/tasks/afrimgsm/translate/prompt_5/afrimgsm_translate_yor.yaml |generate_until | | |
| |afrimgsm_translate_zul_prompt_1 |lm_eval/tasks/afrimgsm/translate/prompt_1/afrimgsm_translate_zul.yaml |generate_until | | |
| |afrimgsm_translate_zul_prompt_2 |lm_eval/tasks/afrimgsm/translate/prompt_2/afrimgsm_translate_zul.yaml |generate_until | | |
| |afrimgsm_translate_zul_prompt_3 |lm_eval/tasks/afrimgsm/translate/prompt_3/afrimgsm_translate_zul.yaml |generate_until | | |
| |afrimgsm_translate_zul_prompt_4 |lm_eval/tasks/afrimgsm/translate/prompt_4/afrimgsm_translate_zul.yaml |generate_until | | |
| |afrimgsm_translate_zul_prompt_5 |lm_eval/tasks/afrimgsm/translate/prompt_5/afrimgsm_translate_zul.yaml |generate_until | | |
| |afrimgsm_twi_prompt_1 |lm_eval/tasks/afrimgsm/direct/prompt_1/afrimgsm_twi.yaml |generate_until | | |
| |afrimgsm_twi_prompt_2 |lm_eval/tasks/afrimgsm/direct/prompt_2/afrimgsm_twi.yaml |generate_until | | |
| |afrimgsm_twi_prompt_3 |lm_eval/tasks/afrimgsm/direct/prompt_3/afrimgsm_twi.yaml |generate_until | | |
| |afrimgsm_twi_prompt_4 |lm_eval/tasks/afrimgsm/direct/prompt_4/afrimgsm_twi.yaml |generate_until | | |
| |afrimgsm_twi_prompt_5 |lm_eval/tasks/afrimgsm/direct/prompt_5/afrimgsm_twi.yaml |generate_until | | |
| |afrimgsm_vai_prompt_1 |lm_eval/tasks/afrimgsm/direct/prompt_1/afrimgsm_vai.yaml |generate_until | | |
| |afrimgsm_vai_prompt_2 |lm_eval/tasks/afrimgsm/direct/prompt_2/afrimgsm_vai.yaml |generate_until | | |
| |afrimgsm_vai_prompt_3 |lm_eval/tasks/afrimgsm/direct/prompt_3/afrimgsm_vai.yaml |generate_until | | |
| |afrimgsm_vai_prompt_4 |lm_eval/tasks/afrimgsm/direct/prompt_4/afrimgsm_vai.yaml |generate_until | | |
| |afrimgsm_vai_prompt_5 |lm_eval/tasks/afrimgsm/direct/prompt_5/afrimgsm_vai.yaml |generate_until | | |
| |afrimgsm_wol_prompt_1 |lm_eval/tasks/afrimgsm/direct/prompt_1/afrimgsm_wol.yaml |generate_until | | |
| |afrimgsm_wol_prompt_2 |lm_eval/tasks/afrimgsm/direct/prompt_2/afrimgsm_wol.yaml |generate_until | | |
| |afrimgsm_wol_prompt_3 |lm_eval/tasks/afrimgsm/direct/prompt_3/afrimgsm_wol.yaml |generate_until | | |
| |afrimgsm_wol_prompt_4 |lm_eval/tasks/afrimgsm/direct/prompt_4/afrimgsm_wol.yaml |generate_until | | |
| |afrimgsm_wol_prompt_5 |lm_eval/tasks/afrimgsm/direct/prompt_5/afrimgsm_wol.yaml |generate_until | | |
| |afrimgsm_xho_prompt_1 |lm_eval/tasks/afrimgsm/direct/prompt_1/afrimgsm_xho.yaml |generate_until | | |
| |afrimgsm_xho_prompt_2 |lm_eval/tasks/afrimgsm/direct/prompt_2/afrimgsm_xho.yaml |generate_until | | |
| |afrimgsm_xho_prompt_3 |lm_eval/tasks/afrimgsm/direct/prompt_3/afrimgsm_xho.yaml |generate_until | | |
| |afrimgsm_xho_prompt_4 |lm_eval/tasks/afrimgsm/direct/prompt_4/afrimgsm_xho.yaml |generate_until | | |
| |afrimgsm_xho_prompt_5 |lm_eval/tasks/afrimgsm/direct/prompt_5/afrimgsm_xho.yaml |generate_until | | |
| |afrimgsm_yor_prompt_1 |lm_eval/tasks/afrimgsm/direct/prompt_1/afrimgsm_yor.yaml |generate_until | | |
| |afrimgsm_yor_prompt_2 |lm_eval/tasks/afrimgsm/direct/prompt_2/afrimgsm_yor.yaml |generate_until | | |
| |afrimgsm_yor_prompt_3 |lm_eval/tasks/afrimgsm/direct/prompt_3/afrimgsm_yor.yaml |generate_until | | |
| |afrimgsm_yor_prompt_4 |lm_eval/tasks/afrimgsm/direct/prompt_4/afrimgsm_yor.yaml |generate_until | | |
| |afrimgsm_yor_prompt_5 |lm_eval/tasks/afrimgsm/direct/prompt_5/afrimgsm_yor.yaml |generate_until | | |
| |afrimgsm_zul_prompt_1 |lm_eval/tasks/afrimgsm/direct/prompt_1/afrimgsm_zul.yaml |generate_until | | |
| |afrimgsm_zul_prompt_2 |lm_eval/tasks/afrimgsm/direct/prompt_2/afrimgsm_zul.yaml |generate_until | | |
| |afrimgsm_zul_prompt_3 |lm_eval/tasks/afrimgsm/direct/prompt_3/afrimgsm_zul.yaml |generate_until | | |
| |afrimgsm_zul_prompt_4 |lm_eval/tasks/afrimgsm/direct/prompt_4/afrimgsm_zul.yaml |generate_until | | |
| |afrimgsm_zul_prompt_5 |lm_eval/tasks/afrimgsm/direct/prompt_5/afrimgsm_zul.yaml |generate_until | | |
| |afrimmlu_direct_amh_prompt_1 |lm_eval/tasks/afrimmlu/direct/prompt_1/afrimmlu_direct_amh.yaml |multiple_choice | | |
| |afrimmlu_direct_amh_prompt_2 |lm_eval/tasks/afrimmlu/direct/prompt_2/afrimmlu_direct_amh.yaml |multiple_choice | | |
| |afrimmlu_direct_amh_prompt_3 |lm_eval/tasks/afrimmlu/direct/prompt_3/afrimmlu_direct_amh.yaml |multiple_choice | | |
| |afrimmlu_direct_amh_prompt_4 |lm_eval/tasks/afrimmlu/direct/prompt_4/afrimmlu_direct_amh.yaml |multiple_choice | | |
| |afrimmlu_direct_amh_prompt_5 |lm_eval/tasks/afrimmlu/direct/prompt_5/afrimmlu_direct_amh.yaml |multiple_choice | | |
| |afrimmlu_direct_eng_prompt_1 |lm_eval/tasks/afrimmlu/direct/prompt_1/afrimmlu_direct_eng.yaml |multiple_choice | | |
| |afrimmlu_direct_eng_prompt_2 |lm_eval/tasks/afrimmlu/direct/prompt_2/afrimmlu_direct_eng.yaml |multiple_choice | | |
| |afrimmlu_direct_eng_prompt_3 |lm_eval/tasks/afrimmlu/direct/prompt_3/afrimmlu_direct_eng.yaml |multiple_choice | | |
| |afrimmlu_direct_eng_prompt_4 |lm_eval/tasks/afrimmlu/direct/prompt_4/afrimmlu_direct_eng.yaml |multiple_choice | | |
| |afrimmlu_direct_eng_prompt_5 |lm_eval/tasks/afrimmlu/direct/prompt_5/afrimmlu_direct_eng.yaml |multiple_choice | | |
| |afrimmlu_direct_ewe_prompt_1 |lm_eval/tasks/afrimmlu/direct/prompt_1/afrimmlu_direct_ewe.yaml |multiple_choice | | |
| |afrimmlu_direct_ewe_prompt_2 |lm_eval/tasks/afrimmlu/direct/prompt_2/afrimmlu_direct_ewe.yaml |multiple_choice | | |
| |afrimmlu_direct_ewe_prompt_3 |lm_eval/tasks/afrimmlu/direct/prompt_3/afrimmlu_direct_ewe.yaml |multiple_choice | | |
| |afrimmlu_direct_ewe_prompt_4 |lm_eval/tasks/afrimmlu/direct/prompt_4/afrimmlu_direct_ewe.yaml |multiple_choice | | |
| |afrimmlu_direct_ewe_prompt_5 |lm_eval/tasks/afrimmlu/direct/prompt_5/afrimmlu_direct_ewe.yaml |multiple_choice | | |
| |afrimmlu_direct_fra_prompt_1 |lm_eval/tasks/afrimmlu/direct/prompt_1/afrimmlu_direct_fra.yaml |multiple_choice | | |
| |afrimmlu_direct_fra_prompt_2 |lm_eval/tasks/afrimmlu/direct/prompt_2/afrimmlu_direct_fra.yaml |multiple_choice | | |
| |afrimmlu_direct_fra_prompt_3 |lm_eval/tasks/afrimmlu/direct/prompt_3/afrimmlu_direct_fra.yaml |multiple_choice | | |
| |afrimmlu_direct_fra_prompt_4 |lm_eval/tasks/afrimmlu/direct/prompt_4/afrimmlu_direct_fra.yaml |multiple_choice | | |
| |afrimmlu_direct_fra_prompt_5 |lm_eval/tasks/afrimmlu/direct/prompt_5/afrimmlu_direct_fra.yaml |multiple_choice | | |
| |afrimmlu_direct_hau_prompt_1 |lm_eval/tasks/afrimmlu/direct/prompt_1/afrimmlu_direct_hau.yaml |multiple_choice | | |
| |afrimmlu_direct_hau_prompt_2 |lm_eval/tasks/afrimmlu/direct/prompt_2/afrimmlu_direct_hau.yaml |multiple_choice | | |
| |afrimmlu_direct_hau_prompt_3 |lm_eval/tasks/afrimmlu/direct/prompt_3/afrimmlu_direct_hau.yaml |multiple_choice | | |
| |afrimmlu_direct_hau_prompt_4 |lm_eval/tasks/afrimmlu/direct/prompt_4/afrimmlu_direct_hau.yaml |multiple_choice | | |
| |afrimmlu_direct_hau_prompt_5 |lm_eval/tasks/afrimmlu/direct/prompt_5/afrimmlu_direct_hau.yaml |multiple_choice | | |
| |afrimmlu_direct_ibo_prompt_1 |lm_eval/tasks/afrimmlu/direct/prompt_1/afrimmlu_direct_ibo.yaml |multiple_choice | | |
| |afrimmlu_direct_ibo_prompt_2 |lm_eval/tasks/afrimmlu/direct/prompt_2/afrimmlu_direct_ibo.yaml |multiple_choice | | |
| |afrimmlu_direct_ibo_prompt_3 |lm_eval/tasks/afrimmlu/direct/prompt_3/afrimmlu_direct_ibo.yaml |multiple_choice | | |
| |afrimmlu_direct_ibo_prompt_4 |lm_eval/tasks/afrimmlu/direct/prompt_4/afrimmlu_direct_ibo.yaml |multiple_choice | | |
| |afrimmlu_direct_ibo_prompt_5 |lm_eval/tasks/afrimmlu/direct/prompt_5/afrimmlu_direct_ibo.yaml |multiple_choice | | |
| |afrimmlu_direct_kin_prompt_1 |lm_eval/tasks/afrimmlu/direct/prompt_1/afrimmlu_direct_kin.yaml |multiple_choice | | |
| |afrimmlu_direct_kin_prompt_2 |lm_eval/tasks/afrimmlu/direct/prompt_2/afrimmlu_direct_kin.yaml |multiple_choice | | |
| |afrimmlu_direct_kin_prompt_3 |lm_eval/tasks/afrimmlu/direct/prompt_3/afrimmlu_direct_kin.yaml |multiple_choice | | |
| |afrimmlu_direct_kin_prompt_4 |lm_eval/tasks/afrimmlu/direct/prompt_4/afrimmlu_direct_kin.yaml |multiple_choice | | |
| |afrimmlu_direct_kin_prompt_5 |lm_eval/tasks/afrimmlu/direct/prompt_5/afrimmlu_direct_kin.yaml |multiple_choice | | |
| |afrimmlu_direct_lin_prompt_1 |lm_eval/tasks/afrimmlu/direct/prompt_1/afrimmlu_direct_lin.yaml |multiple_choice | | |
| |afrimmlu_direct_lin_prompt_2 |lm_eval/tasks/afrimmlu/direct/prompt_2/afrimmlu_direct_lin.yaml |multiple_choice | | |
| |afrimmlu_direct_lin_prompt_3 |lm_eval/tasks/afrimmlu/direct/prompt_3/afrimmlu_direct_lin.yaml |multiple_choice | | |
| |afrimmlu_direct_lin_prompt_4 |lm_eval/tasks/afrimmlu/direct/prompt_4/afrimmlu_direct_lin.yaml |multiple_choice | | |
| |afrimmlu_direct_lin_prompt_5 |lm_eval/tasks/afrimmlu/direct/prompt_5/afrimmlu_direct_lin.yaml |multiple_choice | | |
| |afrimmlu_direct_lug_prompt_1 |lm_eval/tasks/afrimmlu/direct/prompt_1/afrimmlu_direct_lug.yaml |multiple_choice | | |
| |afrimmlu_direct_lug_prompt_2 |lm_eval/tasks/afrimmlu/direct/prompt_2/afrimmlu_direct_lug.yaml |multiple_choice | | |
| |afrimmlu_direct_lug_prompt_3 |lm_eval/tasks/afrimmlu/direct/prompt_3/afrimmlu_direct_lug.yaml |multiple_choice | | |
| |afrimmlu_direct_lug_prompt_4 |lm_eval/tasks/afrimmlu/direct/prompt_4/afrimmlu_direct_lug.yaml |multiple_choice | | |
| |afrimmlu_direct_lug_prompt_5 |lm_eval/tasks/afrimmlu/direct/prompt_5/afrimmlu_direct_lug.yaml |multiple_choice | | |
| |afrimmlu_direct_orm_prompt_1 |lm_eval/tasks/afrimmlu/direct/prompt_1/afrimmlu_direct_orm.yaml |multiple_choice | | |
| |afrimmlu_direct_orm_prompt_2 |lm_eval/tasks/afrimmlu/direct/prompt_2/afrimmlu_direct_orm.yaml |multiple_choice | | |
| |afrimmlu_direct_orm_prompt_3 |lm_eval/tasks/afrimmlu/direct/prompt_3/afrimmlu_direct_orm.yaml |multiple_choice | | |
| |afrimmlu_direct_orm_prompt_4 |lm_eval/tasks/afrimmlu/direct/prompt_4/afrimmlu_direct_orm.yaml |multiple_choice | | |
| |afrimmlu_direct_orm_prompt_5 |lm_eval/tasks/afrimmlu/direct/prompt_5/afrimmlu_direct_orm.yaml |multiple_choice | | |
| |afrimmlu_direct_sna_prompt_1 |lm_eval/tasks/afrimmlu/direct/prompt_1/afrimmlu_direct_sna.yaml |multiple_choice | | |
| |afrimmlu_direct_sna_prompt_2 |lm_eval/tasks/afrimmlu/direct/prompt_2/afrimmlu_direct_sna.yaml |multiple_choice | | |
| |afrimmlu_direct_sna_prompt_3 |lm_eval/tasks/afrimmlu/direct/prompt_3/afrimmlu_direct_sna.yaml |multiple_choice | | |
| |afrimmlu_direct_sna_prompt_4 |lm_eval/tasks/afrimmlu/direct/prompt_4/afrimmlu_direct_sna.yaml |multiple_choice | | |
| |afrimmlu_direct_sna_prompt_5 |lm_eval/tasks/afrimmlu/direct/prompt_5/afrimmlu_direct_sna.yaml |multiple_choice | | |
| |afrimmlu_direct_sot_prompt_1 |lm_eval/tasks/afrimmlu/direct/prompt_1/afrimmlu_direct_sot.yaml |multiple_choice | | |
| |afrimmlu_direct_sot_prompt_2 |lm_eval/tasks/afrimmlu/direct/prompt_2/afrimmlu_direct_sot.yaml |multiple_choice | | |
| |afrimmlu_direct_sot_prompt_3 |lm_eval/tasks/afrimmlu/direct/prompt_3/afrimmlu_direct_sot.yaml |multiple_choice | | |
| |afrimmlu_direct_sot_prompt_4 |lm_eval/tasks/afrimmlu/direct/prompt_4/afrimmlu_direct_sot.yaml |multiple_choice | | |
| |afrimmlu_direct_sot_prompt_5 |lm_eval/tasks/afrimmlu/direct/prompt_5/afrimmlu_direct_sot.yaml |multiple_choice | | |
| |afrimmlu_direct_swa_prompt_1 |lm_eval/tasks/afrimmlu/direct/prompt_1/afrimmlu_direct_swa.yaml |multiple_choice | | |
| |afrimmlu_direct_swa_prompt_2 |lm_eval/tasks/afrimmlu/direct/prompt_2/afrimmlu_direct_swa.yaml |multiple_choice | | |
| |afrimmlu_direct_swa_prompt_3 |lm_eval/tasks/afrimmlu/direct/prompt_3/afrimmlu_direct_swa.yaml |multiple_choice | | |
| |afrimmlu_direct_swa_prompt_4 |lm_eval/tasks/afrimmlu/direct/prompt_4/afrimmlu_direct_swa.yaml |multiple_choice | | |
| |afrimmlu_direct_swa_prompt_5 |lm_eval/tasks/afrimmlu/direct/prompt_5/afrimmlu_direct_swa.yaml |multiple_choice | | |
| |afrimmlu_direct_twi_prompt_1 |lm_eval/tasks/afrimmlu/direct/prompt_1/afrimmlu_direct_twi.yaml |multiple_choice | | |
| |afrimmlu_direct_twi_prompt_2 |lm_eval/tasks/afrimmlu/direct/prompt_2/afrimmlu_direct_twi.yaml |multiple_choice | | |
| |afrimmlu_direct_twi_prompt_3 |lm_eval/tasks/afrimmlu/direct/prompt_3/afrimmlu_direct_twi.yaml |multiple_choice | | |
| |afrimmlu_direct_twi_prompt_4 |lm_eval/tasks/afrimmlu/direct/prompt_4/afrimmlu_direct_twi.yaml |multiple_choice | | |
| |afrimmlu_direct_twi_prompt_5 |lm_eval/tasks/afrimmlu/direct/prompt_5/afrimmlu_direct_twi.yaml |multiple_choice | | |
| |afrimmlu_direct_wol_prompt_1 |lm_eval/tasks/afrimmlu/direct/prompt_1/afrimmlu_direct_wol.yaml |multiple_choice | | |
| |afrimmlu_direct_wol_prompt_2 |lm_eval/tasks/afrimmlu/direct/prompt_2/afrimmlu_direct_wol.yaml |multiple_choice | | |
| |afrimmlu_direct_wol_prompt_3 |lm_eval/tasks/afrimmlu/direct/prompt_3/afrimmlu_direct_wol.yaml |multiple_choice | | |
| |afrimmlu_direct_wol_prompt_4 |lm_eval/tasks/afrimmlu/direct/prompt_4/afrimmlu_direct_wol.yaml |multiple_choice | | |
| |afrimmlu_direct_wol_prompt_5 |lm_eval/tasks/afrimmlu/direct/prompt_5/afrimmlu_direct_wol.yaml |multiple_choice | | |
| |afrimmlu_direct_xho_prompt_1 |lm_eval/tasks/afrimmlu/direct/prompt_1/afrimmlu_direct_xho.yaml |multiple_choice | | |
| |afrimmlu_direct_xho_prompt_2 |lm_eval/tasks/afrimmlu/direct/prompt_2/afrimmlu_direct_xho.yaml |multiple_choice | | |
| |afrimmlu_direct_xho_prompt_3 |lm_eval/tasks/afrimmlu/direct/prompt_3/afrimmlu_direct_xho.yaml |multiple_choice | | |
| |afrimmlu_direct_xho_prompt_4 |lm_eval/tasks/afrimmlu/direct/prompt_4/afrimmlu_direct_xho.yaml |multiple_choice | | |
| |afrimmlu_direct_xho_prompt_5 |lm_eval/tasks/afrimmlu/direct/prompt_5/afrimmlu_direct_xho.yaml |multiple_choice | | |
| |afrimmlu_direct_yor_prompt_1 |lm_eval/tasks/afrimmlu/direct/prompt_1/afrimmlu_direct_yor.yaml |multiple_choice | | |
| |afrimmlu_direct_yor_prompt_2 |lm_eval/tasks/afrimmlu/direct/prompt_2/afrimmlu_direct_yor.yaml |multiple_choice | | |
| |afrimmlu_direct_yor_prompt_3 |lm_eval/tasks/afrimmlu/direct/prompt_3/afrimmlu_direct_yor.yaml |multiple_choice | | |
| |afrimmlu_direct_yor_prompt_4 |lm_eval/tasks/afrimmlu/direct/prompt_4/afrimmlu_direct_yor.yaml |multiple_choice | | |
| |afrimmlu_direct_yor_prompt_5 |lm_eval/tasks/afrimmlu/direct/prompt_5/afrimmlu_direct_yor.yaml |multiple_choice | | |
| |afrimmlu_direct_zul_prompt_1 |lm_eval/tasks/afrimmlu/direct/prompt_1/afrimmlu_direct_zul.yaml |multiple_choice | | |
| |afrimmlu_direct_zul_prompt_2 |lm_eval/tasks/afrimmlu/direct/prompt_2/afrimmlu_direct_zul.yaml |multiple_choice | | |
| |afrimmlu_direct_zul_prompt_3 |lm_eval/tasks/afrimmlu/direct/prompt_3/afrimmlu_direct_zul.yaml |multiple_choice | | |
| |afrimmlu_direct_zul_prompt_4 |lm_eval/tasks/afrimmlu/direct/prompt_4/afrimmlu_direct_zul.yaml |multiple_choice | | |
| |afrimmlu_direct_zul_prompt_5 |lm_eval/tasks/afrimmlu/direct/prompt_5/afrimmlu_direct_zul.yaml |multiple_choice | | |
| |afrimmlu_translate_amh_prompt_1 |lm_eval/tasks/afrimmlu/translate/prompt_1/afrimmlu_translate_amh.yaml |multiple_choice | | |
| |afrimmlu_translate_amh_prompt_2 |lm_eval/tasks/afrimmlu/translate/prompt_2/afrimmlu_translate_amh.yaml |multiple_choice | | |
| |afrimmlu_translate_amh_prompt_3 |lm_eval/tasks/afrimmlu/translate/prompt_3/afrimmlu_translate_amh.yaml |multiple_choice | | |
| |afrimmlu_translate_amh_prompt_4 |lm_eval/tasks/afrimmlu/translate/prompt_4/afrimmlu_translate_amh.yaml |multiple_choice | | |
| |afrimmlu_translate_amh_prompt_5 |lm_eval/tasks/afrimmlu/translate/prompt_5/afrimmlu_translate_amh.yaml |multiple_choice | | |
| |afrimmlu_translate_ewe_prompt_1 |lm_eval/tasks/afrimmlu/translate/prompt_1/afrimmlu_translate_ewe.yaml |multiple_choice | | |
| |afrimmlu_translate_ewe_prompt_2 |lm_eval/tasks/afrimmlu/translate/prompt_2/afrimmlu_translate_ewe.yaml |multiple_choice | | |
| |afrimmlu_translate_ewe_prompt_3 |lm_eval/tasks/afrimmlu/translate/prompt_3/afrimmlu_translate_ewe.yaml |multiple_choice | | |
| |afrimmlu_translate_ewe_prompt_4 |lm_eval/tasks/afrimmlu/translate/prompt_4/afrimmlu_translate_ewe.yaml |multiple_choice | | |
| |afrimmlu_translate_ewe_prompt_5 |lm_eval/tasks/afrimmlu/translate/prompt_5/afrimmlu_translate_ewe.yaml |multiple_choice | | |
| |afrimmlu_translate_fra_prompt_1 |lm_eval/tasks/afrimmlu/translate/prompt_1/afrimmlu_translate_fra.yaml |multiple_choice | | |
| |afrimmlu_translate_fra_prompt_2 |lm_eval/tasks/afrimmlu/translate/prompt_2/afrimmlu_translate_fra.yaml |multiple_choice | | |
| |afrimmlu_translate_fra_prompt_3 |lm_eval/tasks/afrimmlu/translate/prompt_3/afrimmlu_translate_fra.yaml |multiple_choice | | |
| |afrimmlu_translate_fra_prompt_4 |lm_eval/tasks/afrimmlu/translate/prompt_4/afrimmlu_translate_fra.yaml |multiple_choice | | |
| |afrimmlu_translate_fra_prompt_5 |lm_eval/tasks/afrimmlu/translate/prompt_5/afrimmlu_translate_fra.yaml |multiple_choice | | |
| |afrimmlu_translate_hau_prompt_1 |lm_eval/tasks/afrimmlu/translate/prompt_1/afrimmlu_translate_hau.yaml |multiple_choice | | |
| |afrimmlu_translate_hau_prompt_2 |lm_eval/tasks/afrimmlu/translate/prompt_2/afrimmlu_translate_hau.yaml |multiple_choice | | |
| |afrimmlu_translate_hau_prompt_3 |lm_eval/tasks/afrimmlu/translate/prompt_3/afrimmlu_translate_hau.yaml |multiple_choice | | |
| |afrimmlu_translate_hau_prompt_4 |lm_eval/tasks/afrimmlu/translate/prompt_4/afrimmlu_translate_hau.yaml |multiple_choice | | |
| |afrimmlu_translate_hau_prompt_5 |lm_eval/tasks/afrimmlu/translate/prompt_5/afrimmlu_translate_hau.yaml |multiple_choice | | |
| |afrimmlu_translate_ibo_prompt_1 |lm_eval/tasks/afrimmlu/translate/prompt_1/afrimmlu_translate_ibo.yaml |multiple_choice | | |
| |afrimmlu_translate_ibo_prompt_2 |lm_eval/tasks/afrimmlu/translate/prompt_2/afrimmlu_translate_ibo.yaml |multiple_choice | | |
| |afrimmlu_translate_ibo_prompt_3 |lm_eval/tasks/afrimmlu/translate/prompt_3/afrimmlu_translate_ibo.yaml |multiple_choice | | |
| |afrimmlu_translate_ibo_prompt_4 |lm_eval/tasks/afrimmlu/translate/prompt_4/afrimmlu_translate_ibo.yaml |multiple_choice | | |
| |afrimmlu_translate_ibo_prompt_5 |lm_eval/tasks/afrimmlu/translate/prompt_5/afrimmlu_translate_ibo.yaml |multiple_choice | | |
| |afrimmlu_translate_kin_prompt_1 |lm_eval/tasks/afrimmlu/translate/prompt_1/afrimmlu_translate_kin.yaml |multiple_choice | | |
| |afrimmlu_translate_kin_prompt_2 |lm_eval/tasks/afrimmlu/translate/prompt_2/afrimmlu_translate_kin.yaml |multiple_choice | | |
| |afrimmlu_translate_kin_prompt_3 |lm_eval/tasks/afrimmlu/translate/prompt_3/afrimmlu_translate_kin.yaml |multiple_choice | | |
| |afrimmlu_translate_kin_prompt_4 |lm_eval/tasks/afrimmlu/translate/prompt_4/afrimmlu_translate_kin.yaml |multiple_choice | | |
| |afrimmlu_translate_kin_prompt_5 |lm_eval/tasks/afrimmlu/translate/prompt_5/afrimmlu_translate_kin.yaml |multiple_choice | | |
| |afrimmlu_translate_lin_prompt_1 |lm_eval/tasks/afrimmlu/translate/prompt_1/afrimmlu_translate_lin.yaml |multiple_choice | | |
| |afrimmlu_translate_lin_prompt_2 |lm_eval/tasks/afrimmlu/translate/prompt_2/afrimmlu_translate_lin.yaml |multiple_choice | | |
| |afrimmlu_translate_lin_prompt_3 |lm_eval/tasks/afrimmlu/translate/prompt_3/afrimmlu_translate_lin.yaml |multiple_choice | | |
| |afrimmlu_translate_lin_prompt_4 |lm_eval/tasks/afrimmlu/translate/prompt_4/afrimmlu_translate_lin.yaml |multiple_choice | | |
| |afrimmlu_translate_lin_prompt_5 |lm_eval/tasks/afrimmlu/translate/prompt_5/afrimmlu_translate_lin.yaml |multiple_choice | | |
| |afrimmlu_translate_lug_prompt_1 |lm_eval/tasks/afrimmlu/translate/prompt_1/afrimmlu_translate_lug.yaml |multiple_choice | | |
| |afrimmlu_translate_lug_prompt_2 |lm_eval/tasks/afrimmlu/translate/prompt_2/afrimmlu_translate_lug.yaml |multiple_choice | | |
| |afrimmlu_translate_lug_prompt_3 |lm_eval/tasks/afrimmlu/translate/prompt_3/afrimmlu_translate_lug.yaml |multiple_choice | | |
| |afrimmlu_translate_lug_prompt_4 |lm_eval/tasks/afrimmlu/translate/prompt_4/afrimmlu_translate_lug.yaml |multiple_choice | | |
| |afrimmlu_translate_lug_prompt_5 |lm_eval/tasks/afrimmlu/translate/prompt_5/afrimmlu_translate_lug.yaml |multiple_choice | | |
| |afrimmlu_translate_orm_prompt_1 |lm_eval/tasks/afrimmlu/translate/prompt_1/afrimmlu_translate_orm.yaml |multiple_choice | | |
| |afrimmlu_translate_orm_prompt_2 |lm_eval/tasks/afrimmlu/translate/prompt_2/afrimmlu_translate_orm.yaml |multiple_choice | | |
| |afrimmlu_translate_orm_prompt_3 |lm_eval/tasks/afrimmlu/translate/prompt_3/afrimmlu_translate_orm.yaml |multiple_choice | | |
| |afrimmlu_translate_orm_prompt_4 |lm_eval/tasks/afrimmlu/translate/prompt_4/afrimmlu_translate_orm.yaml |multiple_choice | | |
| |afrimmlu_translate_orm_prompt_5 |lm_eval/tasks/afrimmlu/translate/prompt_5/afrimmlu_translate_orm.yaml |multiple_choice | | |
| |afrimmlu_translate_sna_prompt_1 |lm_eval/tasks/afrimmlu/translate/prompt_1/afrimmlu_translate_sna.yaml |multiple_choice | | |
| |afrimmlu_translate_sna_prompt_2 |lm_eval/tasks/afrimmlu/translate/prompt_2/afrimmlu_translate_sna.yaml |multiple_choice | | |
| |afrimmlu_translate_sna_prompt_3 |lm_eval/tasks/afrimmlu/translate/prompt_3/afrimmlu_translate_sna.yaml |multiple_choice | | |
| |afrimmlu_translate_sna_prompt_4 |lm_eval/tasks/afrimmlu/translate/prompt_4/afrimmlu_translate_sna.yaml |multiple_choice | | |
| |afrimmlu_translate_sna_prompt_5 |lm_eval/tasks/afrimmlu/translate/prompt_5/afrimmlu_translate_sna.yaml |multiple_choice | | |
| |afrimmlu_translate_sot_prompt_1 |lm_eval/tasks/afrimmlu/translate/prompt_1/afrimmlu_translate_sot.yaml |multiple_choice | | |
| |afrimmlu_translate_sot_prompt_2 |lm_eval/tasks/afrimmlu/translate/prompt_2/afrimmlu_translate_sot.yaml |multiple_choice | | |
| |afrimmlu_translate_sot_prompt_3 |lm_eval/tasks/afrimmlu/translate/prompt_3/afrimmlu_translate_sot.yaml |multiple_choice | | |
| |afrimmlu_translate_sot_prompt_4 |lm_eval/tasks/afrimmlu/translate/prompt_4/afrimmlu_translate_sot.yaml |multiple_choice | | |
| |afrimmlu_translate_sot_prompt_5 |lm_eval/tasks/afrimmlu/translate/prompt_5/afrimmlu_translate_sot.yaml |multiple_choice | | |
| |afrimmlu_translate_swa_prompt_1 |lm_eval/tasks/afrimmlu/translate/prompt_1/afrimmlu_translate_swa.yaml |multiple_choice | | |
| |afrimmlu_translate_swa_prompt_2 |lm_eval/tasks/afrimmlu/translate/prompt_2/afrimmlu_translate_swa.yaml |multiple_choice | | |
| |afrimmlu_translate_swa_prompt_3 |lm_eval/tasks/afrimmlu/translate/prompt_3/afrimmlu_translate_swa.yaml |multiple_choice | | |
| |afrimmlu_translate_swa_prompt_4 |lm_eval/tasks/afrimmlu/translate/prompt_4/afrimmlu_translate_swa.yaml |multiple_choice | | |
| |afrimmlu_translate_swa_prompt_5 |lm_eval/tasks/afrimmlu/translate/prompt_5/afrimmlu_translate_swa.yaml |multiple_choice | | |
| |afrimmlu_translate_twi_prompt_1 |lm_eval/tasks/afrimmlu/translate/prompt_1/afrimmlu_translate_twi.yaml |multiple_choice | | |
| |afrimmlu_translate_twi_prompt_2 |lm_eval/tasks/afrimmlu/translate/prompt_2/afrimmlu_translate_twi.yaml |multiple_choice | | |
| |afrimmlu_translate_twi_prompt_3 |lm_eval/tasks/afrimmlu/translate/prompt_3/afrimmlu_translate_twi.yaml |multiple_choice | | |
| |afrimmlu_translate_twi_prompt_4 |lm_eval/tasks/afrimmlu/translate/prompt_4/afrimmlu_translate_twi.yaml |multiple_choice | | |
| |afrimmlu_translate_twi_prompt_5 |lm_eval/tasks/afrimmlu/translate/prompt_5/afrimmlu_translate_twi.yaml |multiple_choice | | |
| |afrimmlu_translate_wol_prompt_1 |lm_eval/tasks/afrimmlu/translate/prompt_1/afrimmlu_translate_wol.yaml |multiple_choice | | |
| |afrimmlu_translate_wol_prompt_2 |lm_eval/tasks/afrimmlu/translate/prompt_2/afrimmlu_translate_wol.yaml |multiple_choice | | |
| |afrimmlu_translate_wol_prompt_3 |lm_eval/tasks/afrimmlu/translate/prompt_3/afrimmlu_translate_wol.yaml |multiple_choice | | |
| |afrimmlu_translate_wol_prompt_4 |lm_eval/tasks/afrimmlu/translate/prompt_4/afrimmlu_translate_wol.yaml |multiple_choice | | |
| |afrimmlu_translate_wol_prompt_5 |lm_eval/tasks/afrimmlu/translate/prompt_5/afrimmlu_translate_wol.yaml |multiple_choice | | |
| |afrimmlu_translate_xho_prompt_1 |lm_eval/tasks/afrimmlu/translate/prompt_1/afrimmlu_translate_xho.yaml |multiple_choice | | |
| |afrimmlu_translate_xho_prompt_2 |lm_eval/tasks/afrimmlu/translate/prompt_2/afrimmlu_translate_xho.yaml |multiple_choice | | |
| |afrimmlu_translate_xho_prompt_3 |lm_eval/tasks/afrimmlu/translate/prompt_3/afrimmlu_translate_xho.yaml |multiple_choice | | |
| |afrimmlu_translate_xho_prompt_4 |lm_eval/tasks/afrimmlu/translate/prompt_4/afrimmlu_translate_xho.yaml |multiple_choice | | |
| |afrimmlu_translate_xho_prompt_5 |lm_eval/tasks/afrimmlu/translate/prompt_5/afrimmlu_translate_xho.yaml |multiple_choice | | |
| |afrimmlu_translate_yor_prompt_1 |lm_eval/tasks/afrimmlu/translate/prompt_1/afrimmlu_translate_yor.yaml |multiple_choice | | |
| |afrimmlu_translate_yor_prompt_2 |lm_eval/tasks/afrimmlu/translate/prompt_2/afrimmlu_translate_yor.yaml |multiple_choice | | |
| |afrimmlu_translate_yor_prompt_3 |lm_eval/tasks/afrimmlu/translate/prompt_3/afrimmlu_translate_yor.yaml |multiple_choice | | |
| |afrimmlu_translate_yor_prompt_4 |lm_eval/tasks/afrimmlu/translate/prompt_4/afrimmlu_translate_yor.yaml |multiple_choice | | |
| |afrimmlu_translate_yor_prompt_5 |lm_eval/tasks/afrimmlu/translate/prompt_5/afrimmlu_translate_yor.yaml |multiple_choice | | |
| |afrimmlu_translate_zul_prompt_1 |lm_eval/tasks/afrimmlu/translate/prompt_1/afrimmlu_translate_zul.yaml |multiple_choice | | |
| |afrimmlu_translate_zul_prompt_2 |lm_eval/tasks/afrimmlu/translate/prompt_2/afrimmlu_translate_zul.yaml |multiple_choice | | |
| |afrimmlu_translate_zul_prompt_3 |lm_eval/tasks/afrimmlu/translate/prompt_3/afrimmlu_translate_zul.yaml |multiple_choice | | |
| |afrimmlu_translate_zul_prompt_4 |lm_eval/tasks/afrimmlu/translate/prompt_4/afrimmlu_translate_zul.yaml |multiple_choice | | |
| |afrimmlu_translate_zul_prompt_5 |lm_eval/tasks/afrimmlu/translate/prompt_5/afrimmlu_translate_zul.yaml |multiple_choice | | |
| |afriqa_bem_prompt_1 |lm_eval/tasks/afrobench/afriqa/prompt_1/afriqa_bem.yaml |generate_until | | |
| |afriqa_bem_prompt_2 |lm_eval/tasks/afrobench/afriqa/prompt_2/afriqa_bem.yaml |generate_until | | |
| |afriqa_bem_prompt_3 |lm_eval/tasks/afrobench/afriqa/prompt_3/afriqa_bem.yaml |generate_until | | |
| |afriqa_bem_prompt_4 |lm_eval/tasks/afrobench/afriqa/prompt_4/afriqa_bem.yaml |generate_until | | |
| |afriqa_bem_prompt_5 |lm_eval/tasks/afrobench/afriqa/prompt_5/afriqa_bem.yaml |generate_until | | |
| |afriqa_fon_prompt_1 |lm_eval/tasks/afrobench/afriqa/prompt_1/afriqa_fon.yaml |generate_until | | |
| |afriqa_fon_prompt_2 |lm_eval/tasks/afrobench/afriqa/prompt_2/afriqa_fon.yaml |generate_until | | |
| |afriqa_fon_prompt_3 |lm_eval/tasks/afrobench/afriqa/prompt_3/afriqa_fon.yaml |generate_until | | |
| |afriqa_fon_prompt_4 |lm_eval/tasks/afrobench/afriqa/prompt_4/afriqa_fon.yaml |generate_until | | |
| |afriqa_fon_prompt_5 |lm_eval/tasks/afrobench/afriqa/prompt_5/afriqa_fon.yaml |generate_until | | |
| |afriqa_hau_prompt_1 |lm_eval/tasks/afrobench/afriqa/prompt_1/afriqa_hau.yaml |generate_until | | |
| |afriqa_hau_prompt_2 |lm_eval/tasks/afrobench/afriqa/prompt_2/afriqa_hau.yaml |generate_until | | |
| |afriqa_hau_prompt_3 |lm_eval/tasks/afrobench/afriqa/prompt_3/afriqa_hau.yaml |generate_until | | |
| |afriqa_hau_prompt_4 |lm_eval/tasks/afrobench/afriqa/prompt_4/afriqa_hau.yaml |generate_until | | |
| |afriqa_hau_prompt_5 |lm_eval/tasks/afrobench/afriqa/prompt_5/afriqa_hau.yaml |generate_until | | |
| |afriqa_ibo_prompt_1 |lm_eval/tasks/afrobench/afriqa/prompt_1/afriqa_ibo.yaml |generate_until | | |
| |afriqa_ibo_prompt_2 |lm_eval/tasks/afrobench/afriqa/prompt_2/afriqa_ibo.yaml |generate_until | | |
| |afriqa_ibo_prompt_3 |lm_eval/tasks/afrobench/afriqa/prompt_3/afriqa_ibo.yaml |generate_until | | |
| |afriqa_ibo_prompt_4 |lm_eval/tasks/afrobench/afriqa/prompt_4/afriqa_ibo.yaml |generate_until | | |
| |afriqa_ibo_prompt_5 |lm_eval/tasks/afrobench/afriqa/prompt_5/afriqa_ibo.yaml |generate_until | | |
| |afriqa_kin_prompt_1 |lm_eval/tasks/afrobench/afriqa/prompt_1/afriqa_kin.yaml |generate_until | | |
| |afriqa_kin_prompt_2 |lm_eval/tasks/afrobench/afriqa/prompt_2/afriqa_kin.yaml |generate_until | | |
| |afriqa_kin_prompt_3 |lm_eval/tasks/afrobench/afriqa/prompt_3/afriqa_kin.yaml |generate_until | | |
| |afriqa_kin_prompt_4 |lm_eval/tasks/afrobench/afriqa/prompt_4/afriqa_kin.yaml |generate_until | | |
| |afriqa_kin_prompt_5 |lm_eval/tasks/afrobench/afriqa/prompt_5/afriqa_kin.yaml |generate_until | | |
| |afriqa_swa_prompt_1 |lm_eval/tasks/afrobench/afriqa/prompt_1/afriqa_swa.yaml |generate_until | | |
| |afriqa_swa_prompt_2 |lm_eval/tasks/afrobench/afriqa/prompt_2/afriqa_swa.yaml |generate_until | | |
| |afriqa_swa_prompt_3 |lm_eval/tasks/afrobench/afriqa/prompt_3/afriqa_swa.yaml |generate_until | | |
| |afriqa_swa_prompt_4 |lm_eval/tasks/afrobench/afriqa/prompt_4/afriqa_swa.yaml |generate_until | | |
| |afriqa_swa_prompt_5 |lm_eval/tasks/afrobench/afriqa/prompt_5/afriqa_swa.yaml |generate_until | | |
| |afriqa_twi_prompt_1 |lm_eval/tasks/afrobench/afriqa/prompt_1/afriqa_twi.yaml |generate_until | | |
| |afriqa_twi_prompt_2 |lm_eval/tasks/afrobench/afriqa/prompt_2/afriqa_twi.yaml |generate_until | | |
| |afriqa_twi_prompt_3 |lm_eval/tasks/afrobench/afriqa/prompt_3/afriqa_twi.yaml |generate_until | | |
| |afriqa_twi_prompt_4 |lm_eval/tasks/afrobench/afriqa/prompt_4/afriqa_twi.yaml |generate_until | | |
| |afriqa_twi_prompt_5 |lm_eval/tasks/afrobench/afriqa/prompt_5/afriqa_twi.yaml |generate_until | | |
| |afriqa_yor_prompt_1 |lm_eval/tasks/afrobench/afriqa/prompt_1/afriqa_yor.yaml |generate_until | | |
| |afriqa_yor_prompt_2 |lm_eval/tasks/afrobench/afriqa/prompt_2/afriqa_yor.yaml |generate_until | | |
| |afriqa_yor_prompt_3 |lm_eval/tasks/afrobench/afriqa/prompt_3/afriqa_yor.yaml |generate_until | | |
| |afriqa_yor_prompt_4 |lm_eval/tasks/afrobench/afriqa/prompt_4/afriqa_yor.yaml |generate_until | | |
| |afriqa_yor_prompt_5 |lm_eval/tasks/afrobench/afriqa/prompt_5/afriqa_yor.yaml |generate_until | | |
| |afriqa_zul_prompt_1 |lm_eval/tasks/afrobench/afriqa/prompt_1/afriqa_zul.yaml |generate_until | | |
| |afriqa_zul_prompt_2 |lm_eval/tasks/afrobench/afriqa/prompt_2/afriqa_zul.yaml |generate_until | | |
| |afriqa_zul_prompt_3 |lm_eval/tasks/afrobench/afriqa/prompt_3/afriqa_zul.yaml |generate_until | | |
| |afriqa_zul_prompt_4 |lm_eval/tasks/afrobench/afriqa/prompt_4/afriqa_zul.yaml |generate_until | | |
| |afriqa_zul_prompt_5 |lm_eval/tasks/afrobench/afriqa/prompt_5/afriqa_zul.yaml |generate_until | | |
| |afrisenti_amh_prompt_1 |lm_eval/tasks/afrobench/afrisenti/prompt_1/afrisenti_amh.yaml |multiple_choice | | |
| |afrisenti_amh_prompt_2 |lm_eval/tasks/afrobench/afrisenti/prompt_2/afrisenti_amh.yaml |multiple_choice | | |
| |afrisenti_amh_prompt_3 |lm_eval/tasks/afrobench/afrisenti/prompt_3/afrisenti_amh.yaml |multiple_choice | | |
| |afrisenti_amh_prompt_4 |lm_eval/tasks/afrobench/afrisenti/prompt_4/afrisenti_amh.yaml |multiple_choice | | |
| |afrisenti_amh_prompt_5 |lm_eval/tasks/afrobench/afrisenti/prompt_5/afrisenti_amh.yaml |multiple_choice | | |
| |afrisenti_arq_prompt_1 |lm_eval/tasks/afrobench/afrisenti/prompt_1/afrisenti_arq.yaml |multiple_choice | | |
| |afrisenti_arq_prompt_2 |lm_eval/tasks/afrobench/afrisenti/prompt_2/afrisenti_arq.yaml |multiple_choice | | |
| |afrisenti_arq_prompt_3 |lm_eval/tasks/afrobench/afrisenti/prompt_3/afrisenti_arq.yaml |multiple_choice | | |
| |afrisenti_arq_prompt_4 |lm_eval/tasks/afrobench/afrisenti/prompt_4/afrisenti_arq.yaml |multiple_choice | | |
| |afrisenti_arq_prompt_5 |lm_eval/tasks/afrobench/afrisenti/prompt_5/afrisenti_arq.yaml |multiple_choice | | |
| |afrisenti_ary_prompt_1 |lm_eval/tasks/afrobench/afrisenti/prompt_1/afrisenti_ary.yaml |multiple_choice | | |
| |afrisenti_ary_prompt_2 |lm_eval/tasks/afrobench/afrisenti/prompt_2/afrisenti_ary.yaml |multiple_choice | | |
| |afrisenti_ary_prompt_3 |lm_eval/tasks/afrobench/afrisenti/prompt_3/afrisenti_ary.yaml |multiple_choice | | |
| |afrisenti_ary_prompt_4 |lm_eval/tasks/afrobench/afrisenti/prompt_4/afrisenti_ary.yaml |multiple_choice | | |
| |afrisenti_ary_prompt_5 |lm_eval/tasks/afrobench/afrisenti/prompt_5/afrisenti_ary.yaml |multiple_choice | | |
| |afrisenti_hau_prompt_1 |lm_eval/tasks/afrobench/afrisenti/prompt_1/afrisenti_hau.yaml |multiple_choice | | |
| |afrisenti_hau_prompt_2 |lm_eval/tasks/afrobench/afrisenti/prompt_2/afrisenti_hau.yaml |multiple_choice | | |
| |afrisenti_hau_prompt_3 |lm_eval/tasks/afrobench/afrisenti/prompt_3/afrisenti_hau.yaml |multiple_choice | | |
| |afrisenti_hau_prompt_4 |lm_eval/tasks/afrobench/afrisenti/prompt_4/afrisenti_hau.yaml |multiple_choice | | |
| |afrisenti_hau_prompt_5 |lm_eval/tasks/afrobench/afrisenti/prompt_5/afrisenti_hau.yaml |multiple_choice | | |
| |afrisenti_ibo_prompt_1 |lm_eval/tasks/afrobench/afrisenti/prompt_1/afrisenti_ibo.yaml |multiple_choice | | |
| |afrisenti_ibo_prompt_2 |lm_eval/tasks/afrobench/afrisenti/prompt_2/afrisenti_ibo.yaml |multiple_choice | | |
| |afrisenti_ibo_prompt_3 |lm_eval/tasks/afrobench/afrisenti/prompt_3/afrisenti_ibo.yaml |multiple_choice | | |
| |afrisenti_ibo_prompt_4 |lm_eval/tasks/afrobench/afrisenti/prompt_4/afrisenti_ibo.yaml |multiple_choice | | |
| |afrisenti_ibo_prompt_5 |lm_eval/tasks/afrobench/afrisenti/prompt_5/afrisenti_ibo.yaml |multiple_choice | | |
| |afrisenti_kin_prompt_1 |lm_eval/tasks/afrobench/afrisenti/prompt_1/afrisenti_kin.yaml |multiple_choice | | |
| |afrisenti_kin_prompt_2 |lm_eval/tasks/afrobench/afrisenti/prompt_2/afrisenti_kin.yaml |multiple_choice | | |
| |afrisenti_kin_prompt_3 |lm_eval/tasks/afrobench/afrisenti/prompt_3/afrisenti_kin.yaml |multiple_choice | | |
| |afrisenti_kin_prompt_4 |lm_eval/tasks/afrobench/afrisenti/prompt_4/afrisenti_kin.yaml |multiple_choice | | |
| |afrisenti_kin_prompt_5 |lm_eval/tasks/afrobench/afrisenti/prompt_5/afrisenti_kin.yaml |multiple_choice | | |
| |afrisenti_orm_prompt_1 |lm_eval/tasks/afrobench/afrisenti/prompt_1/afrisenti_orm.yaml |multiple_choice | | |
| |afrisenti_orm_prompt_2 |lm_eval/tasks/afrobench/afrisenti/prompt_2/afrisenti_orm.yaml |multiple_choice | | |
| |afrisenti_orm_prompt_3 |lm_eval/tasks/afrobench/afrisenti/prompt_3/afrisenti_orm.yaml |multiple_choice | | |
| |afrisenti_orm_prompt_4 |lm_eval/tasks/afrobench/afrisenti/prompt_4/afrisenti_orm.yaml |multiple_choice | | |
| |afrisenti_orm_prompt_5 |lm_eval/tasks/afrobench/afrisenti/prompt_5/afrisenti_orm.yaml |multiple_choice | | |
| |afrisenti_pcm_prompt_1 |lm_eval/tasks/afrobench/afrisenti/prompt_1/afrisenti_pcm.yaml |multiple_choice | | |
| |afrisenti_pcm_prompt_2 |lm_eval/tasks/afrobench/afrisenti/prompt_2/afrisenti_pcm.yaml |multiple_choice | | |
| |afrisenti_pcm_prompt_3 |lm_eval/tasks/afrobench/afrisenti/prompt_3/afrisenti_pcm.yaml |multiple_choice | | |
| |afrisenti_pcm_prompt_4 |lm_eval/tasks/afrobench/afrisenti/prompt_4/afrisenti_pcm.yaml |multiple_choice | | |
| |afrisenti_pcm_prompt_5 |lm_eval/tasks/afrobench/afrisenti/prompt_5/afrisenti_pcm.yaml |multiple_choice | | |
| |afrisenti_por_prompt_1 |lm_eval/tasks/afrobench/afrisenti/prompt_1/afrisenti_por.yaml |multiple_choice | | |
| |afrisenti_por_prompt_2 |lm_eval/tasks/afrobench/afrisenti/prompt_2/afrisenti_por.yaml |multiple_choice | | |
| |afrisenti_por_prompt_3 |lm_eval/tasks/afrobench/afrisenti/prompt_3/afrisenti_por.yaml |multiple_choice | | |
| |afrisenti_por_prompt_4 |lm_eval/tasks/afrobench/afrisenti/prompt_4/afrisenti_por.yaml |multiple_choice | | |
| |afrisenti_por_prompt_5 |lm_eval/tasks/afrobench/afrisenti/prompt_5/afrisenti_por.yaml |multiple_choice | | |
| |afrisenti_swa_prompt_1 |lm_eval/tasks/afrobench/afrisenti/prompt_1/afrisenti_swa.yaml |multiple_choice | | |
| |afrisenti_swa_prompt_2 |lm_eval/tasks/afrobench/afrisenti/prompt_2/afrisenti_swa.yaml |multiple_choice | | |
| |afrisenti_swa_prompt_3 |lm_eval/tasks/afrobench/afrisenti/prompt_3/afrisenti_swa.yaml |multiple_choice | | |
| |afrisenti_swa_prompt_4 |lm_eval/tasks/afrobench/afrisenti/prompt_4/afrisenti_swa.yaml |multiple_choice | | |
| |afrisenti_swa_prompt_5 |lm_eval/tasks/afrobench/afrisenti/prompt_5/afrisenti_swa.yaml |multiple_choice | | |
| |afrisenti_tir_prompt_1 |lm_eval/tasks/afrobench/afrisenti/prompt_1/afrisenti_tir.yaml |multiple_choice | | |
| |afrisenti_tir_prompt_2 |lm_eval/tasks/afrobench/afrisenti/prompt_2/afrisenti_tir.yaml |multiple_choice | | |
| |afrisenti_tir_prompt_3 |lm_eval/tasks/afrobench/afrisenti/prompt_3/afrisenti_tir.yaml |multiple_choice | | |
| |afrisenti_tir_prompt_4 |lm_eval/tasks/afrobench/afrisenti/prompt_4/afrisenti_tir.yaml |multiple_choice | | |
| |afrisenti_tir_prompt_5 |lm_eval/tasks/afrobench/afrisenti/prompt_5/afrisenti_tir.yaml |multiple_choice | | |
| |afrisenti_tso_prompt_1 |lm_eval/tasks/afrobench/afrisenti/prompt_1/afrisenti_tso.yaml |multiple_choice | | |
| |afrisenti_tso_prompt_2 |lm_eval/tasks/afrobench/afrisenti/prompt_2/afrisenti_tso.yaml |multiple_choice | | |
| |afrisenti_tso_prompt_3 |lm_eval/tasks/afrobench/afrisenti/prompt_3/afrisenti_tso.yaml |multiple_choice | | |
| |afrisenti_tso_prompt_4 |lm_eval/tasks/afrobench/afrisenti/prompt_4/afrisenti_tso.yaml |multiple_choice | | |
| |afrisenti_tso_prompt_5 |lm_eval/tasks/afrobench/afrisenti/prompt_5/afrisenti_tso.yaml |multiple_choice | | |
| |afrisenti_twi_prompt_1 |lm_eval/tasks/afrobench/afrisenti/prompt_1/afrisenti_twi.yaml |multiple_choice | | |
| |afrisenti_twi_prompt_2 |lm_eval/tasks/afrobench/afrisenti/prompt_2/afrisenti_twi.yaml |multiple_choice | | |
| |afrisenti_twi_prompt_3 |lm_eval/tasks/afrobench/afrisenti/prompt_3/afrisenti_twi.yaml |multiple_choice | | |
| |afrisenti_twi_prompt_4 |lm_eval/tasks/afrobench/afrisenti/prompt_4/afrisenti_twi.yaml |multiple_choice | | |
| |afrisenti_twi_prompt_5 |lm_eval/tasks/afrobench/afrisenti/prompt_5/afrisenti_twi.yaml |multiple_choice | | |
| |afrisenti_yor_prompt_1 |lm_eval/tasks/afrobench/afrisenti/prompt_1/afrisenti_yor.yaml |multiple_choice | | |
| |afrisenti_yor_prompt_2 |lm_eval/tasks/afrobench/afrisenti/prompt_2/afrisenti_yor.yaml |multiple_choice | | |
| |afrisenti_yor_prompt_3 |lm_eval/tasks/afrobench/afrisenti/prompt_3/afrisenti_yor.yaml |multiple_choice | | |
| |afrisenti_yor_prompt_4 |lm_eval/tasks/afrobench/afrisenti/prompt_4/afrisenti_yor.yaml |multiple_choice | | |
| |afrisenti_yor_prompt_5 |lm_eval/tasks/afrobench/afrisenti/prompt_5/afrisenti_yor.yaml |multiple_choice | | |
| |afrixnli_amh_prompt_1 |lm_eval/tasks/afrixnli/direct/prompt_1/afrixnli_amh.yaml |multiple_choice | | |
| |afrixnli_amh_prompt_2 |lm_eval/tasks/afrixnli/direct/prompt_2/afrixnli_amh.yaml |multiple_choice | | |
| |afrixnli_amh_prompt_3 |lm_eval/tasks/afrixnli/direct/prompt_3/afrixnli_amh.yaml |multiple_choice | | |
| |afrixnli_amh_prompt_4 |lm_eval/tasks/afrixnli/direct/prompt_4/afrixnli_amh.yaml |multiple_choice | | |
| |afrixnli_amh_prompt_5 |lm_eval/tasks/afrixnli/direct/prompt_5/afrixnli_amh.yaml |multiple_choice | | |
| |afrixnli_en_direct_amh |lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_amh.yaml |multiple_choice | | |
| |afrixnli_en_direct_eng |lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_eng.yaml |multiple_choice | | |
| |afrixnli_en_direct_ewe |lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_ewe.yaml |multiple_choice | | |
| |afrixnli_en_direct_fra |lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_fra.yaml |multiple_choice | | |
| |afrixnli_en_direct_hau |lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_hau.yaml |multiple_choice | | |
| |afrixnli_en_direct_ibo |lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_ibo.yaml |multiple_choice | | |
| |afrixnli_en_direct_kin |lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_kin.yaml |multiple_choice | | |
| |afrixnli_en_direct_lin |lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_lin.yaml |multiple_choice | | |
| |afrixnli_en_direct_lug |lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_lug.yaml |multiple_choice | | |
| |afrixnli_en_direct_orm |lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_orm.yaml |multiple_choice | | |
| |afrixnli_en_direct_sna |lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_sna.yaml |multiple_choice | | |
| |afrixnli_en_direct_sot |lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_sot.yaml |multiple_choice | | |
| |afrixnli_en_direct_swa |lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_swa.yaml |multiple_choice | | |
| |afrixnli_en_direct_twi |lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_twi.yaml |multiple_choice | | |
| |afrixnli_en_direct_wol |lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_wol.yaml |multiple_choice | | |
| |afrixnli_en_direct_xho |lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_xho.yaml |multiple_choice | | |
| |afrixnli_en_direct_yor |lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_yor.yaml |multiple_choice | | |
| |afrixnli_en_direct_zul |lm_eval/tasks/afrixnli/anli prompt/en-direct/afrixnli_en_direct_zul.yaml |multiple_choice | | |
| |afrixnli_eng_prompt_1 |lm_eval/tasks/afrixnli/direct/prompt_1/afrixnli_eng.yaml |multiple_choice | | |
| |afrixnli_eng_prompt_2 |lm_eval/tasks/afrixnli/direct/prompt_2/afrixnli_eng.yaml |multiple_choice | | |
| |afrixnli_eng_prompt_3 |lm_eval/tasks/afrixnli/direct/prompt_3/afrixnli_eng.yaml |multiple_choice | | |
| |afrixnli_eng_prompt_4 |lm_eval/tasks/afrixnli/direct/prompt_4/afrixnli_eng.yaml |multiple_choice | | |
| |afrixnli_eng_prompt_5 |lm_eval/tasks/afrixnli/direct/prompt_5/afrixnli_eng.yaml |multiple_choice | | |
| |afrixnli_ewe_prompt_1 |lm_eval/tasks/afrixnli/direct/prompt_1/afrixnli_ewe.yaml |multiple_choice | | |
| |afrixnli_ewe_prompt_2 |lm_eval/tasks/afrixnli/direct/prompt_2/afrixnli_ewe.yaml |multiple_choice | | |
| |afrixnli_ewe_prompt_3 |lm_eval/tasks/afrixnli/direct/prompt_3/afrixnli_ewe.yaml |multiple_choice | | |
| |afrixnli_ewe_prompt_4 |lm_eval/tasks/afrixnli/direct/prompt_4/afrixnli_ewe.yaml |multiple_choice | | |
| |afrixnli_ewe_prompt_5 |lm_eval/tasks/afrixnli/direct/prompt_5/afrixnli_ewe.yaml |multiple_choice | | |
| |afrixnli_fra_prompt_1 |lm_eval/tasks/afrixnli/direct/prompt_1/afrixnli_fra.yaml |multiple_choice | | |
| |afrixnli_fra_prompt_2 |lm_eval/tasks/afrixnli/direct/prompt_2/afrixnli_fra.yaml |multiple_choice | | |
| |afrixnli_fra_prompt_3 |lm_eval/tasks/afrixnli/direct/prompt_3/afrixnli_fra.yaml |multiple_choice | | |
| |afrixnli_fra_prompt_4 |lm_eval/tasks/afrixnli/direct/prompt_4/afrixnli_fra.yaml |multiple_choice | | |
| |afrixnli_fra_prompt_5 |lm_eval/tasks/afrixnli/direct/prompt_5/afrixnli_fra.yaml |multiple_choice | | |
| |afrixnli_hau_prompt_1 |lm_eval/tasks/afrixnli/direct/prompt_1/afrixnli_hau.yaml |multiple_choice | | |
| |afrixnli_hau_prompt_2 |lm_eval/tasks/afrixnli/direct/prompt_2/afrixnli_hau.yaml |multiple_choice | | |
| |afrixnli_hau_prompt_3 |lm_eval/tasks/afrixnli/direct/prompt_3/afrixnli_hau.yaml |multiple_choice | | |
| |afrixnli_hau_prompt_4 |lm_eval/tasks/afrixnli/direct/prompt_4/afrixnli_hau.yaml |multiple_choice | | |
| |afrixnli_hau_prompt_5 |lm_eval/tasks/afrixnli/direct/prompt_5/afrixnli_hau.yaml |multiple_choice | | |
| |afrixnli_ibo_prompt_1 |lm_eval/tasks/afrixnli/direct/prompt_1/afrixnli_ibo.yaml |multiple_choice | | |
| |afrixnli_ibo_prompt_2 |lm_eval/tasks/afrixnli/direct/prompt_2/afrixnli_ibo.yaml |multiple_choice | | |
| |afrixnli_ibo_prompt_3 |lm_eval/tasks/afrixnli/direct/prompt_3/afrixnli_ibo.yaml |multiple_choice | | |
| |afrixnli_ibo_prompt_4 |lm_eval/tasks/afrixnli/direct/prompt_4/afrixnli_ibo.yaml |multiple_choice | | |
| |afrixnli_ibo_prompt_5 |lm_eval/tasks/afrixnli/direct/prompt_5/afrixnli_ibo.yaml |multiple_choice | | |
| |afrixnli_kin_prompt_1 |lm_eval/tasks/afrixnli/direct/prompt_1/afrixnli_kin.yaml |multiple_choice | | |
| |afrixnli_kin_prompt_2 |lm_eval/tasks/afrixnli/direct/prompt_2/afrixnli_kin.yaml |multiple_choice | | |
| |afrixnli_kin_prompt_3 |lm_eval/tasks/afrixnli/direct/prompt_3/afrixnli_kin.yaml |multiple_choice | | |
| |afrixnli_kin_prompt_4 |lm_eval/tasks/afrixnli/direct/prompt_4/afrixnli_kin.yaml |multiple_choice | | |
| |afrixnli_kin_prompt_5 |lm_eval/tasks/afrixnli/direct/prompt_5/afrixnli_kin.yaml |multiple_choice | | |
| |afrixnli_lin_prompt_1 |lm_eval/tasks/afrixnli/direct/prompt_1/afrixnli_lin.yaml |multiple_choice | | |
| |afrixnli_lin_prompt_2 |lm_eval/tasks/afrixnli/direct/prompt_2/afrixnli_lin.yaml |multiple_choice | | |
| |afrixnli_lin_prompt_3 |lm_eval/tasks/afrixnli/direct/prompt_3/afrixnli_lin.yaml |multiple_choice | | |
| |afrixnli_lin_prompt_4 |lm_eval/tasks/afrixnli/direct/prompt_4/afrixnli_lin.yaml |multiple_choice | | |
| |afrixnli_lin_prompt_5 |lm_eval/tasks/afrixnli/direct/prompt_5/afrixnli_lin.yaml |multiple_choice | | |
| |afrixnli_lug_prompt_1 |lm_eval/tasks/afrixnli/direct/prompt_1/afrixnli_lug.yaml |multiple_choice | | |
| |afrixnli_lug_prompt_2 |lm_eval/tasks/afrixnli/direct/prompt_2/afrixnli_lug.yaml |multiple_choice | | |
| |afrixnli_lug_prompt_3 |lm_eval/tasks/afrixnli/direct/prompt_3/afrixnli_lug.yaml |multiple_choice | | |
| |afrixnli_lug_prompt_4 |lm_eval/tasks/afrixnli/direct/prompt_4/afrixnli_lug.yaml |multiple_choice | | |
| |afrixnli_lug_prompt_5 |lm_eval/tasks/afrixnli/direct/prompt_5/afrixnli_lug.yaml |multiple_choice | | |
| |afrixnli_manual_direct_amh |lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_amh.yaml |multiple_choice | | |
| |afrixnli_manual_direct_eng |lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_eng.yaml |multiple_choice | | |
| |afrixnli_manual_direct_ewe |lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_ewe.yaml |multiple_choice | | |
| |afrixnli_manual_direct_fra |lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_fra.yaml |multiple_choice | | |
| |afrixnli_manual_direct_hau |lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_hau.yaml |multiple_choice | | |
| |afrixnli_manual_direct_ibo |lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_ibo.yaml |multiple_choice | | |
| |afrixnli_manual_direct_kin |lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_kin.yaml |multiple_choice | | |
| |afrixnli_manual_direct_lin |lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_lin.yaml |multiple_choice | | |
| |afrixnli_manual_direct_lug |lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_lug.yaml |multiple_choice | | |
| |afrixnli_manual_direct_orm |lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_orm.yaml |multiple_choice | | |
| |afrixnli_manual_direct_sna |lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_sna.yaml |multiple_choice | | |
| |afrixnli_manual_direct_sot |lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_sot.yaml |multiple_choice | | |
| |afrixnli_manual_direct_swa |lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_swa.yaml |multiple_choice | | |
| |afrixnli_manual_direct_twi |lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_twi.yaml |multiple_choice | | |
| |afrixnli_manual_direct_wol |lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_wol.yaml |multiple_choice | | |
| |afrixnli_manual_direct_xho |lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_xho.yaml |multiple_choice | | |
| |afrixnli_manual_direct_yor |lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_yor.yaml |multiple_choice | | |
| |afrixnli_manual_direct_zul |lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_zul.yaml |multiple_choice | | |
| |afrixnli_manual_translate_amh |lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_amh.yaml |multiple_choice | | |
| |afrixnli_manual_translate_ewe |lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_ewe.yaml |multiple_choice | | |
| |afrixnli_manual_translate_fra |lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_fra.yaml |multiple_choice | | |
| |afrixnli_manual_translate_hau |lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_hau.yaml |multiple_choice | | |
| |afrixnli_manual_translate_ibo |lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_ibo.yaml |multiple_choice | | |
| |afrixnli_manual_translate_kin |lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_kin.yaml |multiple_choice | | |
| |afrixnli_manual_translate_lin |lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_lin.yaml |multiple_choice | | |
| |afrixnli_manual_translate_lug |lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_lug.yaml |multiple_choice | | |
| |afrixnli_manual_translate_orm |lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_orm.yaml |multiple_choice | | |
| |afrixnli_manual_translate_sna |lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_sna.yaml |multiple_choice | | |
| |afrixnli_manual_translate_sot |lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_sot.yaml |multiple_choice | | |
| |afrixnli_manual_translate_swa |lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_swa.yaml |multiple_choice | | |
| |afrixnli_manual_translate_twi |lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_twi.yaml |multiple_choice | | |
| |afrixnli_manual_translate_wol |lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_wol.yaml |multiple_choice | | |
| |afrixnli_manual_translate_xho |lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_xho.yaml |multiple_choice | | |
| |afrixnli_manual_translate_yor |lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_yor.yaml |multiple_choice | | |
| |afrixnli_manual_translate_zul |lm_eval/tasks/afrixnli/lai prompt/translate/afrixnli_manual_translate_zul.yaml |multiple_choice | | |
| |afrixnli_native_direct_amh |lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_amh.yaml |multiple_choice | | |
| |afrixnli_native_direct_eng |lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_eng.yaml |multiple_choice | | |
| |afrixnli_native_direct_ewe |lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_ewe.yaml |multiple_choice | | |
| |afrixnli_native_direct_fra |lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_fra.yaml |multiple_choice | | |
| |afrixnli_native_direct_hau |lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_hau.yaml |multiple_choice | | |
| |afrixnli_native_direct_ibo |lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_ibo.yaml |multiple_choice | | |
| |afrixnli_native_direct_kin |lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_kin.yaml |multiple_choice | | |
| |afrixnli_native_direct_lin |lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_lin.yaml |multiple_choice | | |
| |afrixnli_native_direct_lug |lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_lug.yaml |multiple_choice | | |
| |afrixnli_native_direct_orm |lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_orm.yaml |multiple_choice | | |
| |afrixnli_native_direct_sna |lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_sna.yaml |multiple_choice | | |
| |afrixnli_native_direct_sot |lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_sot.yaml |multiple_choice | | |
| |afrixnli_native_direct_swa |lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_swa.yaml |multiple_choice | | |
| |afrixnli_native_direct_twi |lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_twi.yaml |multiple_choice | | |
| |afrixnli_native_direct_wol |lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_wol.yaml |multiple_choice | | |
| |afrixnli_native_direct_xho |lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_xho.yaml |multiple_choice | | |
| |afrixnli_native_direct_yor |lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_yor.yaml |multiple_choice | | |
| |afrixnli_native_direct_zul |lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_zul.yaml |multiple_choice | | |
| |afrixnli_orm_prompt_1 |lm_eval/tasks/afrixnli/direct/prompt_1/afrixnli_orm.yaml |multiple_choice | | |
| |afrixnli_orm_prompt_2 |lm_eval/tasks/afrixnli/direct/prompt_2/afrixnli_orm.yaml |multiple_choice | | |
| |afrixnli_orm_prompt_3 |lm_eval/tasks/afrixnli/direct/prompt_3/afrixnli_orm.yaml |multiple_choice | | |
| |afrixnli_orm_prompt_4 |lm_eval/tasks/afrixnli/direct/prompt_4/afrixnli_orm.yaml |multiple_choice | | |
| |afrixnli_orm_prompt_5 |lm_eval/tasks/afrixnli/direct/prompt_5/afrixnli_orm.yaml |multiple_choice | | |
| |afrixnli_sna_prompt_1 |lm_eval/tasks/afrixnli/direct/prompt_1/afrixnli_sna.yaml |multiple_choice | | |
| |afrixnli_sna_prompt_2 |lm_eval/tasks/afrixnli/direct/prompt_2/afrixnli_sna.yaml |multiple_choice | | |
| |afrixnli_sna_prompt_3 |lm_eval/tasks/afrixnli/direct/prompt_3/afrixnli_sna.yaml |multiple_choice | | |
| |afrixnli_sna_prompt_4 |lm_eval/tasks/afrixnli/direct/prompt_4/afrixnli_sna.yaml |multiple_choice | | |
| |afrixnli_sna_prompt_5 |lm_eval/tasks/afrixnli/direct/prompt_5/afrixnli_sna.yaml |multiple_choice | | |
| |afrixnli_sot_prompt_1 |lm_eval/tasks/afrixnli/direct/prompt_1/afrixnli_sot.yaml |multiple_choice | | |
| |afrixnli_sot_prompt_2 |lm_eval/tasks/afrixnli/direct/prompt_2/afrixnli_sot.yaml |multiple_choice | | |
| |afrixnli_sot_prompt_3 |lm_eval/tasks/afrixnli/direct/prompt_3/afrixnli_sot.yaml |multiple_choice | | |
| |afrixnli_sot_prompt_4 |lm_eval/tasks/afrixnli/direct/prompt_4/afrixnli_sot.yaml |multiple_choice | | |
| |afrixnli_sot_prompt_5 |lm_eval/tasks/afrixnli/direct/prompt_5/afrixnli_sot.yaml |multiple_choice | | |
| |afrixnli_swa_prompt_1 |lm_eval/tasks/afrixnli/direct/prompt_1/afrixnli_swa.yaml |multiple_choice | | |
| |afrixnli_swa_prompt_2 |lm_eval/tasks/afrixnli/direct/prompt_2/afrixnli_swa.yaml |multiple_choice | | |
| |afrixnli_swa_prompt_3 |lm_eval/tasks/afrixnli/direct/prompt_3/afrixnli_swa.yaml |multiple_choice | | |
| |afrixnli_swa_prompt_4 |lm_eval/tasks/afrixnli/direct/prompt_4/afrixnli_swa.yaml |multiple_choice | | |
| |afrixnli_swa_prompt_5 |lm_eval/tasks/afrixnli/direct/prompt_5/afrixnli_swa.yaml |multiple_choice | | |
| |afrixnli_translate_amh |lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_amh.yaml |multiple_choice | | |
| |afrixnli_translate_amh_prompt_1 |lm_eval/tasks/afrixnli/translate/prompt_1/afrixnli_translate_amh.yaml |multiple_choice | | |
| |afrixnli_translate_amh_prompt_2 |lm_eval/tasks/afrixnli/translate/prompt_2/afrixnli_translate_amh.yaml |multiple_choice | | |
| |afrixnli_translate_amh_prompt_3 |lm_eval/tasks/afrixnli/translate/prompt_3/afrixnli_translate_amh.yaml |multiple_choice | | |
| |afrixnli_translate_amh_prompt_4 |lm_eval/tasks/afrixnli/translate/prompt_4/afrixnli_translate_amh.yaml |multiple_choice | | |
| |afrixnli_translate_amh_prompt_5 |lm_eval/tasks/afrixnli/translate/prompt_5/afrixnli_translate_amh.yaml |multiple_choice | | |
| |afrixnli_translate_ewe |lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_ewe.yaml |multiple_choice | | |
| |afrixnli_translate_ewe_prompt_1 |lm_eval/tasks/afrixnli/translate/prompt_1/afrixnli_translate_ewe.yaml |multiple_choice | | |
| |afrixnli_translate_ewe_prompt_2 |lm_eval/tasks/afrixnli/translate/prompt_2/afrixnli_translate_ewe.yaml |multiple_choice | | |
| |afrixnli_translate_ewe_prompt_3 |lm_eval/tasks/afrixnli/translate/prompt_3/afrixnli_translate_ewe.yaml |multiple_choice | | |
| |afrixnli_translate_ewe_prompt_4 |lm_eval/tasks/afrixnli/translate/prompt_4/afrixnli_translate_ewe.yaml |multiple_choice | | |
| |afrixnli_translate_ewe_prompt_5 |lm_eval/tasks/afrixnli/translate/prompt_5/afrixnli_translate_ewe.yaml |multiple_choice | | |
| |afrixnli_translate_fra |lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_fra.yaml |multiple_choice | | |
| |afrixnli_translate_fra_prompt_1 |lm_eval/tasks/afrixnli/translate/prompt_1/afrixnli_translate_fra.yaml |multiple_choice | | |
| |afrixnli_translate_fra_prompt_2 |lm_eval/tasks/afrixnli/translate/prompt_2/afrixnli_translate_fra.yaml |multiple_choice | | |
| |afrixnli_translate_fra_prompt_3 |lm_eval/tasks/afrixnli/translate/prompt_3/afrixnli_translate_fra.yaml |multiple_choice | | |
| |afrixnli_translate_fra_prompt_4 |lm_eval/tasks/afrixnli/translate/prompt_4/afrixnli_translate_fra.yaml |multiple_choice | | |
| |afrixnli_translate_fra_prompt_5 |lm_eval/tasks/afrixnli/translate/prompt_5/afrixnli_translate_fra.yaml |multiple_choice | | |
| |afrixnli_translate_hau |lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_hau.yaml |multiple_choice | | |
| |afrixnli_translate_hau_prompt_1 |lm_eval/tasks/afrixnli/translate/prompt_1/afrixnli_translate_hau.yaml |multiple_choice | | |
| |afrixnli_translate_hau_prompt_2 |lm_eval/tasks/afrixnli/translate/prompt_2/afrixnli_translate_hau.yaml |multiple_choice | | |
| |afrixnli_translate_hau_prompt_3 |lm_eval/tasks/afrixnli/translate/prompt_3/afrixnli_translate_hau.yaml |multiple_choice | | |
| |afrixnli_translate_hau_prompt_4 |lm_eval/tasks/afrixnli/translate/prompt_4/afrixnli_translate_hau.yaml |multiple_choice | | |
| |afrixnli_translate_hau_prompt_5 |lm_eval/tasks/afrixnli/translate/prompt_5/afrixnli_translate_hau.yaml |multiple_choice | | |
| |afrixnli_translate_ibo |lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_ibo.yaml |multiple_choice | | |
| |afrixnli_translate_ibo_prompt_1 |lm_eval/tasks/afrixnli/translate/prompt_1/afrixnli_translate_ibo.yaml |multiple_choice | | |
| |afrixnli_translate_ibo_prompt_2 |lm_eval/tasks/afrixnli/translate/prompt_2/afrixnli_translate_ibo.yaml |multiple_choice | | |
| |afrixnli_translate_ibo_prompt_3 |lm_eval/tasks/afrixnli/translate/prompt_3/afrixnli_translate_ibo.yaml |multiple_choice | | |
| |afrixnli_translate_ibo_prompt_4 |lm_eval/tasks/afrixnli/translate/prompt_4/afrixnli_translate_ibo.yaml |multiple_choice | | |
| |afrixnli_translate_ibo_prompt_5 |lm_eval/tasks/afrixnli/translate/prompt_5/afrixnli_translate_ibo.yaml |multiple_choice | | |
| |afrixnli_translate_kin |lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_kin.yaml |multiple_choice | | |
| |afrixnli_translate_kin_prompt_1 |lm_eval/tasks/afrixnli/translate/prompt_1/afrixnli_translate_kin.yaml |multiple_choice | | |
| |afrixnli_translate_kin_prompt_2 |lm_eval/tasks/afrixnli/translate/prompt_2/afrixnli_translate_kin.yaml |multiple_choice | | |
| |afrixnli_translate_kin_prompt_3 |lm_eval/tasks/afrixnli/translate/prompt_3/afrixnli_translate_kin.yaml |multiple_choice | | |
| |afrixnli_translate_kin_prompt_4 |lm_eval/tasks/afrixnli/translate/prompt_4/afrixnli_translate_kin.yaml |multiple_choice | | |
| |afrixnli_translate_kin_prompt_5 |lm_eval/tasks/afrixnli/translate/prompt_5/afrixnli_translate_kin.yaml |multiple_choice | | |
| |afrixnli_translate_lin |lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_lin.yaml |multiple_choice | | |
| |afrixnli_translate_lin_prompt_1 |lm_eval/tasks/afrixnli/translate/prompt_1/afrixnli_translate_lin.yaml |multiple_choice | | |
| |afrixnli_translate_lin_prompt_2 |lm_eval/tasks/afrixnli/translate/prompt_2/afrixnli_translate_lin.yaml |multiple_choice | | |
| |afrixnli_translate_lin_prompt_3 |lm_eval/tasks/afrixnli/translate/prompt_3/afrixnli_translate_lin.yaml |multiple_choice | | |
| |afrixnli_translate_lin_prompt_4 |lm_eval/tasks/afrixnli/translate/prompt_4/afrixnli_translate_lin.yaml |multiple_choice | | |
| |afrixnli_translate_lin_prompt_5 |lm_eval/tasks/afrixnli/translate/prompt_5/afrixnli_translate_lin.yaml |multiple_choice | | |
| |afrixnli_translate_lug |lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_lug.yaml |multiple_choice | | |
| |afrixnli_translate_lug_prompt_1 |lm_eval/tasks/afrixnli/translate/prompt_1/afrixnli_translate_lug.yaml |multiple_choice | | |
| |afrixnli_translate_lug_prompt_2 |lm_eval/tasks/afrixnli/translate/prompt_2/afrixnli_translate_lug.yaml |multiple_choice | | |
| |afrixnli_translate_lug_prompt_3 |lm_eval/tasks/afrixnli/translate/prompt_3/afrixnli_translate_lug.yaml |multiple_choice | | |
| |afrixnli_translate_lug_prompt_4 |lm_eval/tasks/afrixnli/translate/prompt_4/afrixnli_translate_lug.yaml |multiple_choice | | |
| |afrixnli_translate_lug_prompt_5 |lm_eval/tasks/afrixnli/translate/prompt_5/afrixnli_translate_lug.yaml |multiple_choice | | |
| |afrixnli_translate_orm |lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_orm.yaml |multiple_choice | | |
| |afrixnli_translate_orm_prompt_1 |lm_eval/tasks/afrixnli/translate/prompt_1/afrixnli_translate_orm.yaml |multiple_choice | | |
| |afrixnli_translate_orm_prompt_2 |lm_eval/tasks/afrixnli/translate/prompt_2/afrixnli_translate_orm.yaml |multiple_choice | | |
| |afrixnli_translate_orm_prompt_3 |lm_eval/tasks/afrixnli/translate/prompt_3/afrixnli_translate_orm.yaml |multiple_choice | | |
| |afrixnli_translate_orm_prompt_4 |lm_eval/tasks/afrixnli/translate/prompt_4/afrixnli_translate_orm.yaml |multiple_choice | | |
| |afrixnli_translate_orm_prompt_5 |lm_eval/tasks/afrixnli/translate/prompt_5/afrixnli_translate_orm.yaml |multiple_choice | | |
| |afrixnli_translate_sna |lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_sna.yaml |multiple_choice | | |
| |afrixnli_translate_sna_prompt_1 |lm_eval/tasks/afrixnli/translate/prompt_1/afrixnli_translate_sna.yaml |multiple_choice | | |
| |afrixnli_translate_sna_prompt_2 |lm_eval/tasks/afrixnli/translate/prompt_2/afrixnli_translate_sna.yaml |multiple_choice | | |
| |afrixnli_translate_sna_prompt_3 |lm_eval/tasks/afrixnli/translate/prompt_3/afrixnli_translate_sna.yaml |multiple_choice | | |
| |afrixnli_translate_sna_prompt_4 |lm_eval/tasks/afrixnli/translate/prompt_4/afrixnli_translate_sna.yaml |multiple_choice | | |
| |afrixnli_translate_sna_prompt_5 |lm_eval/tasks/afrixnli/translate/prompt_5/afrixnli_translate_sna.yaml |multiple_choice | | |
| |afrixnli_translate_sot |lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_sot.yaml |multiple_choice | | |
| |afrixnli_translate_sot_prompt_1 |lm_eval/tasks/afrixnli/translate/prompt_1/afrixnli_translate_sot.yaml |multiple_choice | | |
| |afrixnli_translate_sot_prompt_2 |lm_eval/tasks/afrixnli/translate/prompt_2/afrixnli_translate_sot.yaml |multiple_choice | | |
| |afrixnli_translate_sot_prompt_3 |lm_eval/tasks/afrixnli/translate/prompt_3/afrixnli_translate_sot.yaml |multiple_choice | | |
| |afrixnli_translate_sot_prompt_4 |lm_eval/tasks/afrixnli/translate/prompt_4/afrixnli_translate_sot.yaml |multiple_choice | | |
| |afrixnli_translate_sot_prompt_5 |lm_eval/tasks/afrixnli/translate/prompt_5/afrixnli_translate_sot.yaml |multiple_choice | | |
| |afrixnli_translate_swa |lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_swa.yaml |multiple_choice | | |
| |afrixnli_translate_swa_prompt_1 |lm_eval/tasks/afrixnli/translate/prompt_1/afrixnli_translate_swa.yaml |multiple_choice | | |
| |afrixnli_translate_swa_prompt_2 |lm_eval/tasks/afrixnli/translate/prompt_2/afrixnli_translate_swa.yaml |multiple_choice | | |
| |afrixnli_translate_swa_prompt_3 |lm_eval/tasks/afrixnli/translate/prompt_3/afrixnli_translate_swa.yaml |multiple_choice | | |
| |afrixnli_translate_swa_prompt_4 |lm_eval/tasks/afrixnli/translate/prompt_4/afrixnli_translate_swa.yaml |multiple_choice | | |
| |afrixnli_translate_swa_prompt_5 |lm_eval/tasks/afrixnli/translate/prompt_5/afrixnli_translate_swa.yaml |multiple_choice | | |
| |afrixnli_translate_twi |lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_twi.yaml |multiple_choice | | |
| |afrixnli_translate_twi_prompt_1 |lm_eval/tasks/afrixnli/translate/prompt_1/afrixnli_translate_twi.yaml |multiple_choice | | |
| |afrixnli_translate_twi_prompt_2 |lm_eval/tasks/afrixnli/translate/prompt_2/afrixnli_translate_twi.yaml |multiple_choice | | |
| |afrixnli_translate_twi_prompt_3 |lm_eval/tasks/afrixnli/translate/prompt_3/afrixnli_translate_twi.yaml |multiple_choice | | |
| |afrixnli_translate_twi_prompt_4 |lm_eval/tasks/afrixnli/translate/prompt_4/afrixnli_translate_twi.yaml |multiple_choice | | |
| |afrixnli_translate_twi_prompt_5 |lm_eval/tasks/afrixnli/translate/prompt_5/afrixnli_translate_twi.yaml |multiple_choice | | |
| |afrixnli_translate_wol |lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_wol.yaml |multiple_choice | | |
| |afrixnli_translate_wol_prompt_1 |lm_eval/tasks/afrixnli/translate/prompt_1/afrixnli_translate_wol.yaml |multiple_choice | | |
| |afrixnli_translate_wol_prompt_2 |lm_eval/tasks/afrixnli/translate/prompt_2/afrixnli_translate_wol.yaml |multiple_choice | | |
| |afrixnli_translate_wol_prompt_3 |lm_eval/tasks/afrixnli/translate/prompt_3/afrixnli_translate_wol.yaml |multiple_choice | | |
| |afrixnli_translate_wol_prompt_4 |lm_eval/tasks/afrixnli/translate/prompt_4/afrixnli_translate_wol.yaml |multiple_choice | | |
| |afrixnli_translate_wol_prompt_5 |lm_eval/tasks/afrixnli/translate/prompt_5/afrixnli_translate_wol.yaml |multiple_choice | | |
| |afrixnli_translate_xho |lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_xho.yaml |multiple_choice | | |
| |afrixnli_translate_xho_prompt_1 |lm_eval/tasks/afrixnli/translate/prompt_1/afrixnli_translate_xho.yaml |multiple_choice | | |
| |afrixnli_translate_xho_prompt_2 |lm_eval/tasks/afrixnli/translate/prompt_2/afrixnli_translate_xho.yaml |multiple_choice | | |
| |afrixnli_translate_xho_prompt_3 |lm_eval/tasks/afrixnli/translate/prompt_3/afrixnli_translate_xho.yaml |multiple_choice | | |
| |afrixnli_translate_xho_prompt_4 |lm_eval/tasks/afrixnli/translate/prompt_4/afrixnli_translate_xho.yaml |multiple_choice | | |
| |afrixnli_translate_xho_prompt_5 |lm_eval/tasks/afrixnli/translate/prompt_5/afrixnli_translate_xho.yaml |multiple_choice | | |
| |afrixnli_translate_yor |lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_yor.yaml |multiple_choice | | |
| |afrixnli_translate_yor_prompt_1 |lm_eval/tasks/afrixnli/translate/prompt_1/afrixnli_translate_yor.yaml |multiple_choice | | |
| |afrixnli_translate_yor_prompt_2 |lm_eval/tasks/afrixnli/translate/prompt_2/afrixnli_translate_yor.yaml |multiple_choice | | |
| |afrixnli_translate_yor_prompt_3 |lm_eval/tasks/afrixnli/translate/prompt_3/afrixnli_translate_yor.yaml |multiple_choice | | |
| |afrixnli_translate_yor_prompt_4 |lm_eval/tasks/afrixnli/translate/prompt_4/afrixnli_translate_yor.yaml |multiple_choice | | |
| |afrixnli_translate_yor_prompt_5 |lm_eval/tasks/afrixnli/translate/prompt_5/afrixnli_translate_yor.yaml |multiple_choice | | |
| |afrixnli_translate_zul |lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_zul.yaml |multiple_choice | | |
| |afrixnli_translate_zul_prompt_1 |lm_eval/tasks/afrixnli/translate/prompt_1/afrixnli_translate_zul.yaml |multiple_choice | | |
| |afrixnli_translate_zul_prompt_2 |lm_eval/tasks/afrixnli/translate/prompt_2/afrixnli_translate_zul.yaml |multiple_choice | | |
| |afrixnli_translate_zul_prompt_3 |lm_eval/tasks/afrixnli/translate/prompt_3/afrixnli_translate_zul.yaml |multiple_choice | | |
| |afrixnli_translate_zul_prompt_4 |lm_eval/tasks/afrixnli/translate/prompt_4/afrixnli_translate_zul.yaml |multiple_choice | | |
| |afrixnli_translate_zul_prompt_5 |lm_eval/tasks/afrixnli/translate/prompt_5/afrixnli_translate_zul.yaml |multiple_choice | | |
| |afrixnli_twi_prompt_1 |lm_eval/tasks/afrixnli/direct/prompt_1/afrixnli_twi.yaml |multiple_choice | | |
| |afrixnli_twi_prompt_2 |lm_eval/tasks/afrixnli/direct/prompt_2/afrixnli_twi.yaml |multiple_choice | | |
| |afrixnli_twi_prompt_3 |lm_eval/tasks/afrixnli/direct/prompt_3/afrixnli_twi.yaml |multiple_choice | | |
| |afrixnli_twi_prompt_4 |lm_eval/tasks/afrixnli/direct/prompt_4/afrixnli_twi.yaml |multiple_choice | | |
| |afrixnli_twi_prompt_5 |lm_eval/tasks/afrixnli/direct/prompt_5/afrixnli_twi.yaml |multiple_choice | | |
| |afrixnli_wol_prompt_1 |lm_eval/tasks/afrixnli/direct/prompt_1/afrixnli_wol.yaml |multiple_choice | | |
| |afrixnli_wol_prompt_2 |lm_eval/tasks/afrixnli/direct/prompt_2/afrixnli_wol.yaml |multiple_choice | | |
| |afrixnli_wol_prompt_3 |lm_eval/tasks/afrixnli/direct/prompt_3/afrixnli_wol.yaml |multiple_choice | | |
| |afrixnli_wol_prompt_4 |lm_eval/tasks/afrixnli/direct/prompt_4/afrixnli_wol.yaml |multiple_choice | | |
| |afrixnli_wol_prompt_5 |lm_eval/tasks/afrixnli/direct/prompt_5/afrixnli_wol.yaml |multiple_choice | | |
| |afrixnli_xho_prompt_1 |lm_eval/tasks/afrixnli/direct/prompt_1/afrixnli_xho.yaml |multiple_choice | | |
| |afrixnli_xho_prompt_2 |lm_eval/tasks/afrixnli/direct/prompt_2/afrixnli_xho.yaml |multiple_choice | | |
| |afrixnli_xho_prompt_3 |lm_eval/tasks/afrixnli/direct/prompt_3/afrixnli_xho.yaml |multiple_choice | | |
| |afrixnli_xho_prompt_4 |lm_eval/tasks/afrixnli/direct/prompt_4/afrixnli_xho.yaml |multiple_choice | | |
| |afrixnli_xho_prompt_5 |lm_eval/tasks/afrixnli/direct/prompt_5/afrixnli_xho.yaml |multiple_choice | | |
| |afrixnli_yor_prompt_1 |lm_eval/tasks/afrixnli/direct/prompt_1/afrixnli_yor.yaml |multiple_choice | | |
| |afrixnli_yor_prompt_2 |lm_eval/tasks/afrixnli/direct/prompt_2/afrixnli_yor.yaml |multiple_choice | | |
| |afrixnli_yor_prompt_3 |lm_eval/tasks/afrixnli/direct/prompt_3/afrixnli_yor.yaml |multiple_choice | | |
| |afrixnli_yor_prompt_4 |lm_eval/tasks/afrixnli/direct/prompt_4/afrixnli_yor.yaml |multiple_choice | | |
| |afrixnli_yor_prompt_5 |lm_eval/tasks/afrixnli/direct/prompt_5/afrixnli_yor.yaml |multiple_choice | | |
| |afrixnli_zul_prompt_1 |lm_eval/tasks/afrixnli/direct/prompt_1/afrixnli_zul.yaml |multiple_choice | | |
| |afrixnli_zul_prompt_2 |lm_eval/tasks/afrixnli/direct/prompt_2/afrixnli_zul.yaml |multiple_choice | | |
| |afrixnli_zul_prompt_3 |lm_eval/tasks/afrixnli/direct/prompt_3/afrixnli_zul.yaml |multiple_choice | | |
| |afrixnli_zul_prompt_4 |lm_eval/tasks/afrixnli/direct/prompt_4/afrixnli_zul.yaml |multiple_choice | | |
| |afrixnli_zul_prompt_5 |lm_eval/tasks/afrixnli/direct/prompt_5/afrixnli_zul.yaml |multiple_choice | | |
| |ag_news |lm_eval/tasks/unitxt/ag_news.yaml | | | |
| |agieval_aqua_rat |lm_eval/tasks/agieval/aqua-rat.yaml |multiple_choice | | |
| |agieval_gaokao_biology |lm_eval/tasks/agieval/gaokao-biology.yaml |multiple_choice | | |
| |agieval_gaokao_chemistry |lm_eval/tasks/agieval/gaokao-chemistry.yaml |multiple_choice | | |
| |agieval_gaokao_chinese |lm_eval/tasks/agieval/gaokao-chinese.yaml |multiple_choice | | |
| |agieval_gaokao_english |lm_eval/tasks/agieval/gaokao-english.yaml |multiple_choice | | |
| |agieval_gaokao_geography |lm_eval/tasks/agieval/gaokao-geography.yaml |multiple_choice | | |
| |agieval_gaokao_history |lm_eval/tasks/agieval/gaokao-history.yaml |multiple_choice | | |
| |agieval_gaokao_mathcloze |lm_eval/tasks/agieval/gaokao-mathcloze.yaml |generate_until | | |
| |agieval_gaokao_mathqa |lm_eval/tasks/agieval/gaokao-mathqa.yaml |multiple_choice | | |
| |agieval_gaokao_physics |lm_eval/tasks/agieval/gaokao-physics.yaml |multiple_choice | | |
| |agieval_jec_qa_ca |lm_eval/tasks/agieval/jec-qa-ca.yaml |multiple_choice | | |
| |agieval_jec_qa_kd |lm_eval/tasks/agieval/jec-qa-kd.yaml |multiple_choice | | |
| |agieval_logiqa_en |lm_eval/tasks/agieval/logiqa-en.yaml |multiple_choice | | |
| |agieval_logiqa_zh |lm_eval/tasks/agieval/logiqa-zh.yaml |multiple_choice | | |
| |agieval_lsat_ar |lm_eval/tasks/agieval/lsat-ar.yaml |multiple_choice | | |
| |agieval_lsat_lr |lm_eval/tasks/agieval/lsat-lr.yaml |multiple_choice | | |
| |agieval_lsat_rc |lm_eval/tasks/agieval/lsat-rc.yaml |multiple_choice | | |
| |agieval_math |lm_eval/tasks/agieval/math.yaml |generate_until | | |
| |agieval_sat_en |lm_eval/tasks/agieval/sat-en.yaml |multiple_choice | | |
| |agieval_sat_en_without_passage |lm_eval/tasks/agieval/sat-en-without-passage.yaml |multiple_choice | | |
| |agieval_sat_math |lm_eval/tasks/agieval/sat-math.yaml |multiple_choice | | |
| |anagrams1 |lm_eval/tasks/unscramble/anagrams1.yaml |generate_until | | |
| |anagrams2 |lm_eval/tasks/unscramble/anagrams2.yaml |generate_until | | |
| |anli_r1 |lm_eval/tasks/anli/anli_r1.yaml |multiple_choice | | |
| |anli_r2 |lm_eval/tasks/anli/anli_r2.yaml |multiple_choice | | |
| |anli_r3 |lm_eval/tasks/anli/anli_r3.yaml |multiple_choice | | |
| |arab_culture_algeria |lm_eval/tasks/arab_culture/arab_culture_algeria.yaml |multiple_choice | | |
| |arab_culture_completion_algeria |lm_eval/tasks/arab_culture_completion/arab_culture_completion_algeria.yaml |multiple_choice | | |
| |arab_culture_completion_egypt |lm_eval/tasks/arab_culture_completion/arab_culture_completion_egypt.yaml |multiple_choice | | |
| |arab_culture_completion_jordan |lm_eval/tasks/arab_culture_completion/arab_culture_completion_jordan.yaml |multiple_choice | | |
| |arab_culture_completion_ksa |lm_eval/tasks/arab_culture_completion/arab_culture_completion_ksa.yaml |multiple_choice | | |
| |arab_culture_completion_lebanon |lm_eval/tasks/arab_culture_completion/arab_culture_completion_lebanon.yaml |multiple_choice | | |
| |arab_culture_completion_libya |lm_eval/tasks/arab_culture_completion/arab_culture_completion_libya.yaml |multiple_choice | | |
| |arab_culture_completion_morocco |lm_eval/tasks/arab_culture_completion/arab_culture_completion_morocco.yaml |multiple_choice | | |
| |arab_culture_completion_palestine |lm_eval/tasks/arab_culture_completion/arab_culture_completion_palestine.yaml |multiple_choice | | |
| |arab_culture_completion_sudan |lm_eval/tasks/arab_culture_completion/arab_culture_completion_sudan.yaml |multiple_choice | | |
| |arab_culture_completion_syria |lm_eval/tasks/arab_culture_completion/arab_culture_completion_syria.yaml |multiple_choice | | |
| |arab_culture_completion_tunisia |lm_eval/tasks/arab_culture_completion/arab_culture_completion_tunisia.yaml |multiple_choice | | |
| |arab_culture_completion_uae |lm_eval/tasks/arab_culture_completion/arab_culture_completion_uae.yaml |multiple_choice | | |
| |arab_culture_completion_yemen |lm_eval/tasks/arab_culture_completion/arab_culture_completion_yemen.yaml |multiple_choice | | |
| |arab_culture_egypt |lm_eval/tasks/arab_culture/arab_culture_egypt.yaml |multiple_choice | | |
| |arab_culture_jordan |lm_eval/tasks/arab_culture/arab_culture_jordan.yaml |multiple_choice | | |
| |arab_culture_ksa |lm_eval/tasks/arab_culture/arab_culture_ksa.yaml |multiple_choice | | |
| |arab_culture_lebanon |lm_eval/tasks/arab_culture/arab_culture_lebanon.yaml |multiple_choice | | |
| |arab_culture_libya |lm_eval/tasks/arab_culture/arab_culture_libya.yaml |multiple_choice | | |
| |arab_culture_morocco |lm_eval/tasks/arab_culture/arab_culture_morocco.yaml |multiple_choice | | |
| |arab_culture_palestine |lm_eval/tasks/arab_culture/arab_culture_palestine.yaml |multiple_choice | | |
| |arab_culture_sudan |lm_eval/tasks/arab_culture/arab_culture_sudan.yaml |multiple_choice | | |
| |arab_culture_syria |lm_eval/tasks/arab_culture/arab_culture_syria.yaml |multiple_choice | | |
| |arab_culture_tunisia |lm_eval/tasks/arab_culture/arab_culture_tunisia.yaml |multiple_choice | | |
| |arab_culture_uae |lm_eval/tasks/arab_culture/arab_culture_uae.yaml |multiple_choice | | |
| |arab_culture_yemen |lm_eval/tasks/arab_culture/arab_culture_yemen.yaml |multiple_choice | | |
| |arabic_exams |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_exams/arabic_exams.yaml |multiple_choice | | |
| |arabic_exams_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_exams_light/arabic_exams_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Algeria |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Algeria.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Algeria_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Algeria_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Ancient_Egypt |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Ancient_Egypt.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Ancient_Egypt_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Ancient_Egypt_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arab_Empire |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arab_Empire.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arab_Empire_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arab_Empire_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Architecture |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Architecture.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Architecture_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Architecture_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Art |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Art.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Art_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Art_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Astronomy |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Astronomy.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Astronomy_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Astronomy_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Calligraphy |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Calligraphy.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Calligraphy_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Calligraphy_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Ceremony |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Ceremony.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Ceremony_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Ceremony_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Clothing |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Clothing.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Clothing_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Clothing_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Culture |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Culture.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Culture_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Culture_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Food |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Food.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Food_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Food_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Funeral |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Funeral.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Funeral_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Funeral_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Geography |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Geography.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Geography_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Geography_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_History |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_History.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_History_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_History_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Language_Origin |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Language_Origin.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Language_Origin_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Language_Origin_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Literature |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Literature.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Literature_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Literature_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Math |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Math.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Math_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Math_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Medicine |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Medicine.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Medicine_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Medicine_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Music |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Music.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Music_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Music_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Ornament |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Ornament.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Ornament_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Ornament_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Philosophy |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Philosophy.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Philosophy_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Philosophy_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Physics_and_Chemistry |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Physics_and_Chemistry.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Physics_and_Chemistry_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Physics_and_Chemistry_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Wedding |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Arabic_Wedding.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Arabic_Wedding_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Arabic_Wedding_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Bahrain |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Bahrain.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Bahrain_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Bahrain_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Comoros |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Comoros.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Comoros_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Comoros_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Egypt_modern |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Egypt_modern.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Egypt_modern_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Egypt_modern_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_InfluenceFromAncientEgypt |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_InfluenceFromAncientEgypt.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_InfluenceFromAncientEgypt_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_InfluenceFromAncientEgypt_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_InfluenceFromByzantium |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_InfluenceFromByzantium.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_InfluenceFromByzantium_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_InfluenceFromByzantium_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_InfluenceFromChina |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_InfluenceFromChina.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_InfluenceFromChina_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_InfluenceFromChina_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_InfluenceFromGreece |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_InfluenceFromGreece.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_InfluenceFromGreece_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_InfluenceFromGreece_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_InfluenceFromIslam |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_InfluenceFromIslam.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_InfluenceFromIslam_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_InfluenceFromIslam_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_InfluenceFromPersia |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_InfluenceFromPersia.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_InfluenceFromPersia_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_InfluenceFromPersia_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_InfluenceFromRome |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_InfluenceFromRome.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_InfluenceFromRome_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_InfluenceFromRome_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Iraq |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Iraq.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Iraq_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Iraq_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Islam_Education |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Islam_Education.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Islam_Education_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Islam_Education_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Islam_branches_and_schools |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Islam_branches_and_schools.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Islam_branches_and_schools_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Islam_branches_and_schools_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Islamic_law_system |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Islamic_law_system.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Islamic_law_system_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Islamic_law_system_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Jordan |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Jordan.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Jordan_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Jordan_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Kuwait |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Kuwait.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Kuwait_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Kuwait_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Lebanon |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Lebanon.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Lebanon_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Lebanon_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Libya |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Libya.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Libya_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Libya_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Mauritania |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Mauritania.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Mauritania_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Mauritania_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Mesopotamia_civilization |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Mesopotamia_civilization.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Mesopotamia_civilization_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Mesopotamia_civilization_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Morocco |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Morocco.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Morocco_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Morocco_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Oman |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Oman.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Oman_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Oman_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Palestine |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Palestine.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Palestine_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Palestine_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Qatar |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Qatar.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Qatar_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Qatar_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Saudi_Arabia |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Saudi_Arabia.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Saudi_Arabia_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Saudi_Arabia_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Somalia |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Somalia.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Somalia_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Somalia_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Sudan |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Sudan.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Sudan_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Sudan_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Syria |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Syria.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Syria_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Syria_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Tunisia |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Tunisia.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Tunisia_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Tunisia_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_United_Arab_Emirates |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_United_Arab_Emirates.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_United_Arab_Emirates_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_United_Arab_Emirates_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Yemen |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_Yemen.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_Yemen_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_Yemen_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_communication |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_communication.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_communication_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_communication_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_computer_and_phone |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_computer_and_phone.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_computer_and_phone_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_computer_and_phone_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_daily_life |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_daily_life.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_daily_life_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_daily_life_light.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_entertainment |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_avca/arabic_leaderboard_acva_entertainment.yaml |multiple_choice | | |
| |arabic_leaderboard_acva_entertainment_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_avca_light/arabic_leaderboard_acva_entertainment_light.yaml |multiple_choice | | |
| |arabic_leaderboard_alghafa_mcq_exams_test_ar |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_alghafa/arabic_leaderboard_alghafa_mcq_exams_test_ar.yaml |multiple_choice | | |
| |arabic_leaderboard_alghafa_mcq_exams_test_ar_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_alghafa_light/arabic_leaderboard_alghafa_mcq_exams_test_ar_light.yaml |multiple_choice | | |
| |arabic_leaderboard_alghafa_meta_ar_dialects |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_alghafa/arabic_leaderboard_alghafa_meta_ar_dialects.yaml |multiple_choice | | |
| |arabic_leaderboard_alghafa_meta_ar_dialects_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_alghafa_light/arabic_leaderboard_alghafa_meta_ar_dialects_light.yaml |multiple_choice | | |
| |arabic_leaderboard_alghafa_meta_ar_msa |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_alghafa/arabic_leaderboard_alghafa_meta_ar_msa.yaml |multiple_choice | | |
| |arabic_leaderboard_alghafa_meta_ar_msa_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_alghafa_light/arabic_leaderboard_alghafa_meta_ar_msa_light.yaml |multiple_choice | | |
| |arabic_leaderboard_alghafa_multiple_choice_facts_truefalse_balanced_task |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_alghafa/arabic_leaderboard_alghafa_multiple_choice_facts_truefalse_balanced_task.yaml |multiple_choice | | |
| |arabic_leaderboard_alghafa_multiple_choice_facts_truefalse_balanced_task_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_alghafa_light/arabic_leaderboard_alghafa_multiple_choice_facts_truefalse_balanced_task_light.yaml |multiple_choice | | |
| |arabic_leaderboard_alghafa_multiple_choice_grounded_statement_soqal_task |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_alghafa/arabic_leaderboard_alghafa_multiple_choice_grounded_statement_soqal_task.yaml |multiple_choice | | |
| |arabic_leaderboard_alghafa_multiple_choice_grounded_statement_soqal_task_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_alghafa_light/arabic_leaderboard_alghafa_multiple_choice_grounded_statement_soqal_task_light.yaml |multiple_choice | | |
| |arabic_leaderboard_alghafa_multiple_choice_grounded_statement_xglue_mlqa_task |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_alghafa/arabic_leaderboard_alghafa_multiple_choice_grounded_statement_xglue_mlqa_task.yaml |multiple_choice | | |
| |arabic_leaderboard_alghafa_multiple_choice_grounded_statement_xglue_mlqa_task_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_alghafa_light/arabic_leaderboard_alghafa_multiple_choice_grounded_statement_xglue_mlqa_task_light.yaml|multiple_choice | | |
| |arabic_leaderboard_alghafa_multiple_choice_rating_sentiment_no_neutral_task |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_alghafa/arabic_leaderboard_alghafa_multiple_choice_rating_sentiment_no_neutral_task.yaml |multiple_choice | | |
| |arabic_leaderboard_alghafa_multiple_choice_rating_sentiment_no_neutral_task_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_alghafa_light/arabic_leaderboard_alghafa_multiple_choice_rating_sentiment_no_neutral_task_light.yaml |multiple_choice | | |
| |arabic_leaderboard_alghafa_multiple_choice_rating_sentiment_task |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_alghafa/arabic_leaderboard_alghafa_multiple_choice_rating_sentiment_task.yaml |multiple_choice | | |
| |arabic_leaderboard_alghafa_multiple_choice_rating_sentiment_task_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_alghafa_light/arabic_leaderboard_alghafa_multiple_choice_rating_sentiment_task_light.yaml |multiple_choice | | |
| |arabic_leaderboard_alghafa_multiple_choice_sentiment_task |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_alghafa/arabic_leaderboard_alghafa_multiple_choice_sentiment_task.yaml |multiple_choice | | |
| |arabic_leaderboard_alghafa_multiple_choice_sentiment_task_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_alghafa_light/arabic_leaderboard_alghafa_multiple_choice_sentiment_task_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_abstract_algebra |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_abstract_algebra.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_abstract_algebra_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_abstract_algebra_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_anatomy |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_anatomy.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_anatomy_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_anatomy_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_astronomy |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_astronomy.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_astronomy_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_astronomy_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_business_ethics |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_business_ethics.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_business_ethics_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_business_ethics_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_clinical_knowledge |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_clinical_knowledge.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_clinical_knowledge_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_clinical_knowledge_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_college_biology |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_college_biology.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_college_biology_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_college_biology_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_college_chemistry |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_college_chemistry.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_college_chemistry_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_college_chemistry_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_college_computer_science |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_college_computer_science.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_college_computer_science_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_college_computer_science_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_college_mathematics |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_college_mathematics.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_college_mathematics_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_college_mathematics_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_college_medicine |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_college_medicine.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_college_medicine_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_college_medicine_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_college_physics |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_college_physics.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_college_physics_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_college_physics_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_computer_security |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_computer_security.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_computer_security_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_computer_security_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_conceptual_physics |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_conceptual_physics.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_conceptual_physics_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_conceptual_physics_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_econometrics |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_econometrics.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_econometrics_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_econometrics_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_electrical_engineering |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_electrical_engineering.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_electrical_engineering_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_electrical_engineering_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_elementary_mathematics |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_elementary_mathematics.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_elementary_mathematics_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_elementary_mathematics_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_formal_logic |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_formal_logic.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_formal_logic_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_formal_logic_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_global_facts |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_global_facts.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_global_facts_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_global_facts_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_high_school_biology |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_high_school_biology.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_high_school_biology_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_high_school_biology_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_high_school_chemistry |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_high_school_chemistry.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_high_school_chemistry_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_high_school_chemistry_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_high_school_computer_science |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_high_school_computer_science.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_high_school_computer_science_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_high_school_computer_science_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_high_school_european_history |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_high_school_european_history.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_high_school_european_history_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_high_school_european_history_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_high_school_geography |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_high_school_geography.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_high_school_geography_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_high_school_geography_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_high_school_government_and_politics |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_high_school_government_and_politics.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_high_school_government_and_politics_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_high_school_government_and_politics_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_high_school_macroeconomics |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_high_school_macroeconomics.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_high_school_macroeconomics_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_high_school_macroeconomics_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_high_school_mathematics |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_high_school_mathematics.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_high_school_mathematics_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_high_school_mathematics_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_high_school_microeconomics |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_high_school_microeconomics.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_high_school_microeconomics_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_high_school_microeconomics_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_high_school_physics |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_high_school_physics.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_high_school_physics_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_high_school_physics_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_high_school_psychology |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_high_school_psychology.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_high_school_psychology_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_high_school_psychology_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_high_school_statistics |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_high_school_statistics.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_high_school_statistics_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_high_school_statistics_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_high_school_us_history |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_high_school_us_history.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_high_school_us_history_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_high_school_us_history_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_high_school_world_history |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_high_school_world_history.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_high_school_world_history_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_high_school_world_history_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_human_aging |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_human_aging.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_human_aging_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_human_aging_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_human_sexuality |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_human_sexuality.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_human_sexuality_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_human_sexuality_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_international_law |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_international_law.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_international_law_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_international_law_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_jurisprudence |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_jurisprudence.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_jurisprudence_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_jurisprudence_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_logical_fallacies |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_logical_fallacies.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_logical_fallacies_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_logical_fallacies_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_machine_learning |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_machine_learning.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_machine_learning_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_machine_learning_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_management |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_management.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_management_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_management_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_marketing |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_marketing.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_marketing_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_marketing_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_medical_genetics |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_medical_genetics.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_medical_genetics_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_medical_genetics_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_miscellaneous |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_miscellaneous.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_miscellaneous_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_miscellaneous_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_moral_disputes |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_moral_disputes.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_moral_disputes_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_moral_disputes_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_moral_scenarios |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_moral_scenarios.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_moral_scenarios_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_moral_scenarios_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_nutrition |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_nutrition.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_nutrition_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_nutrition_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_philosophy |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_philosophy.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_philosophy_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_philosophy_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_prehistory |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_prehistory.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_prehistory_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_prehistory_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_professional_accounting |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_professional_accounting.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_professional_accounting_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_professional_accounting_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_professional_law |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_professional_law.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_professional_law_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_professional_law_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_professional_medicine |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_professional_medicine.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_professional_medicine_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_professional_medicine_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_professional_psychology |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_professional_psychology.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_professional_psychology_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_professional_psychology_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_public_relations |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_public_relations.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_public_relations_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_public_relations_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_security_studies |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_security_studies.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_security_studies_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_security_studies_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_sociology |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_sociology.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_sociology_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_sociology_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_us_foreign_policy |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_us_foreign_policy.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_us_foreign_policy_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_us_foreign_policy_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_virology |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_virology.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_virology_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_virology_light.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_world_religions |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mmlu/arabic_leaderboard_arabic_mmlu_world_religions.yaml |multiple_choice | | |
| |arabic_leaderboard_arabic_mmlu_world_religions_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mmlu_light/arabic_leaderboard_arabic_mmlu_world_religions_light.yaml |multiple_choice | | |
| |arabic_mt_arc_challenge |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_arc_challenge/arabic_mt_arc_challenge.yaml |multiple_choice | | |
| |arabic_mt_arc_challenge_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_arc_challenge_light/arabic_mt_arc_challenge_light.yaml |multiple_choice | | |
| |arabic_mt_arc_easy |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_arc_easy/arabic_mt_arc_easy.yaml |multiple_choice | | |
| |arabic_mt_arc_easy_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_arc_easy_light/arabic_mt_arc_easy_light.yaml |multiple_choice | | |
| |arabic_mt_boolq |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_boolq/arabic_mt_boolq.yaml |multiple_choice | | |
| |arabic_mt_boolq_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_boolq_light/arabic_mt_boolq_light.yaml |multiple_choice | | |
| |arabic_mt_copa |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_copa/arabic_mt_copa.yaml |multiple_choice | | |
| |arabic_mt_copa_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_copa_light/arabic_mt_copa_light.yaml |multiple_choice | | |
| |arabic_mt_hellaswag |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_hellaswag/arabic_mt_hellaswag.yaml |multiple_choice | | |
| |arabic_mt_hellaswag_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_hellaswag_light/arabic_mt_hellaswag_light.yaml |multiple_choice | | |
| |arabic_mt_mmlu |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_mmlu/arabic_mt_mmlu.yaml |multiple_choice | | |
| |arabic_mt_mmlu_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_mmlu_light/arabic_mt_mmlu_light.yaml |multiple_choice | | |
| |arabic_mt_openbook_qa |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_openbook_qa/arabic_mt_openbook_qa.yaml |multiple_choice | | |
| |arabic_mt_openbook_qa_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_openbook_qa_light/arabic_mt_openbook_qa_light.yaml |multiple_choice | | |
| |arabic_mt_piqa |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_piqa/arabic_mt_piqa.yaml |multiple_choice | | |
| |arabic_mt_piqa_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_piqa_light/arabic_mt_piqa_light.yaml |multiple_choice | | |
| |arabic_mt_race |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_race/arabic_mt_race.yaml |multiple_choice | | |
| |arabic_mt_race_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_race_light/arabic_mt_race_light.yaml |multiple_choice | | |
| |arabic_mt_sciq |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_sciq/arabic_mt_sciq.yaml |multiple_choice | | |
| |arabic_mt_sciq_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_sciq_light/arabic_mt_sciq_light.yaml |multiple_choice | | |
| |arabic_mt_toxigen |lm_eval/tasks/arabic_leaderboard_complete/arabic_leaderboard_arabic_mt_toxigen/arabic_mt_toxigen.yaml |multiple_choice | | |
| |arabic_mt_toxigen_light |lm_eval/tasks/arabic_leaderboard_light/arabic_leaderboard_arabic_mt_toxigen_light/arabic_mt_toxigen_light.yaml |multiple_choice | | |
| |arabicmmlu_accounting_university |lm_eval/tasks/arabicmmlu/arabicmmlu_accounting_university.yaml |multiple_choice | | |
| |arabicmmlu_arabic_language_general |lm_eval/tasks/arabicmmlu/arabicmmlu_arabic_language_general.yaml |multiple_choice | | |
| |arabicmmlu_arabic_language_grammar |lm_eval/tasks/arabicmmlu/arabicmmlu_arabic_language_grammar.yaml |multiple_choice | | |
| |arabicmmlu_arabic_language_high_school |lm_eval/tasks/arabicmmlu/arabicmmlu_arabic_language_high_school.yaml |multiple_choice | | |
| |arabicmmlu_arabic_language_middle_school |lm_eval/tasks/arabicmmlu/arabicmmlu_arabic_language_middle_school.yaml |multiple_choice | | |
| |arabicmmlu_arabic_language_primary_school |lm_eval/tasks/arabicmmlu/arabicmmlu_arabic_language_primary_school.yaml |multiple_choice | | |
| |arabicmmlu_biology_high_school |lm_eval/tasks/arabicmmlu/arabicmmlu_biology_high_school.yaml |multiple_choice | | |
| |arabicmmlu_civics_high_school |lm_eval/tasks/arabicmmlu/arabicmmlu_civics_high_school.yaml |multiple_choice | | |
| |arabicmmlu_civics_middle_school |lm_eval/tasks/arabicmmlu/arabicmmlu_civics_middle_school.yaml |multiple_choice | | |
| |arabicmmlu_computer_science_high_school |lm_eval/tasks/arabicmmlu/arabicmmlu_computer_science_high_school.yaml |multiple_choice | | |
| |arabicmmlu_computer_science_middle_school |lm_eval/tasks/arabicmmlu/arabicmmlu_computer_science_middle_school.yaml |multiple_choice | | |
| |arabicmmlu_computer_science_primary_school |lm_eval/tasks/arabicmmlu/arabicmmlu_computer_science_primary_school.yaml |multiple_choice | | |
| |arabicmmlu_computer_science_university |lm_eval/tasks/arabicmmlu/arabicmmlu_computer_science_university.yaml |multiple_choice | | |
| |arabicmmlu_driving_test |lm_eval/tasks/arabicmmlu/arabicmmlu_driving_test.yaml |multiple_choice | | |
| |arabicmmlu_economics_high_school |lm_eval/tasks/arabicmmlu/arabicmmlu_economics_high_school.yaml |multiple_choice | | |
| |arabicmmlu_economics_middle_school |lm_eval/tasks/arabicmmlu/arabicmmlu_economics_middle_school.yaml |multiple_choice | | |
| |arabicmmlu_economics_university |lm_eval/tasks/arabicmmlu/arabicmmlu_economics_university.yaml |multiple_choice | | |
| |arabicmmlu_general_knowledge |lm_eval/tasks/arabicmmlu/arabicmmlu_general_knowledge.yaml |multiple_choice | | |
| |arabicmmlu_general_knowledge_middle_school |lm_eval/tasks/arabicmmlu/arabicmmlu_general_knowledge_middle_school.yaml |multiple_choice | | |
| |arabicmmlu_general_knowledge_primary_school |lm_eval/tasks/arabicmmlu/arabicmmlu_general_knowledge_primary_school.yaml |multiple_choice | | |
| |arabicmmlu_geography_high_school |lm_eval/tasks/arabicmmlu/arabicmmlu_geography_high_school.yaml |multiple_choice | | |
| |arabicmmlu_geography_middle_school |lm_eval/tasks/arabicmmlu/arabicmmlu_geography_middle_school.yaml |multiple_choice | | |
| |arabicmmlu_geography_primary_school |lm_eval/tasks/arabicmmlu/arabicmmlu_geography_primary_school.yaml |multiple_choice | | |
| |arabicmmlu_history_high_school |lm_eval/tasks/arabicmmlu/arabicmmlu_history_high_school.yaml |multiple_choice | | |
| |arabicmmlu_history_middle_school |lm_eval/tasks/arabicmmlu/arabicmmlu_history_middle_school.yaml |multiple_choice | | |
| |arabicmmlu_history_primary_school |lm_eval/tasks/arabicmmlu/arabicmmlu_history_primary_school.yaml |multiple_choice | | |
| |arabicmmlu_islamic_studies |lm_eval/tasks/arabicmmlu/arabicmmlu_islamic_studies.yaml |multiple_choice | | |
| |arabicmmlu_islamic_studies_high_school |lm_eval/tasks/arabicmmlu/arabicmmlu_islamic_studies_high_school.yaml |multiple_choice | | |
| |arabicmmlu_islamic_studies_middle_school |lm_eval/tasks/arabicmmlu/arabicmmlu_islamic_studies_middle_school.yaml |multiple_choice | | |
| |arabicmmlu_islamic_studies_primary_school |lm_eval/tasks/arabicmmlu/arabicmmlu_islamic_studies_primary_school.yaml |multiple_choice | | |
| |arabicmmlu_law_professional |lm_eval/tasks/arabicmmlu/arabicmmlu_law_professional.yaml |multiple_choice | | |
| |arabicmmlu_management_university |lm_eval/tasks/arabicmmlu/arabicmmlu_management_university.yaml |multiple_choice | | |
| |arabicmmlu_math_primary_school |lm_eval/tasks/arabicmmlu/arabicmmlu_math_primary_school.yaml |multiple_choice | | |
| |arabicmmlu_natural_science_middle_school |lm_eval/tasks/arabicmmlu/arabicmmlu_natural_science_middle_school.yaml |multiple_choice | | |
| |arabicmmlu_natural_science_primary_school |lm_eval/tasks/arabicmmlu/arabicmmlu_natural_science_primary_school.yaml |multiple_choice | | |
| |arabicmmlu_philosophy_high_school |lm_eval/tasks/arabicmmlu/arabicmmlu_philosophy_high_school.yaml |multiple_choice | | |
| |arabicmmlu_physics_high_school |lm_eval/tasks/arabicmmlu/arabicmmlu_physics_high_school.yaml |multiple_choice | | |
| |arabicmmlu_political_science_university |lm_eval/tasks/arabicmmlu/arabicmmlu_political_science_university.yaml |multiple_choice | | |
| |arabicmmlu_social_science_middle_school |lm_eval/tasks/arabicmmlu/arabicmmlu_social_science_middle_school.yaml |multiple_choice | | |
| |arabicmmlu_social_science_primary_school |lm_eval/tasks/arabicmmlu/arabicmmlu_social_science_primary_school.yaml |multiple_choice | | |
| |arc_ar |lm_eval/tasks/okapi/arc_multilingual/arc_ar.yaml |multiple_choice | | |
| |arc_bn |lm_eval/tasks/okapi/arc_multilingual/arc_bn.yaml |multiple_choice | | |
| |arc_ca |lm_eval/tasks/okapi/arc_multilingual/arc_ca.yaml |multiple_choice | | |
| |arc_ca_challenge |lm_eval/tasks/catalan_bench/arc_ca_challenge.yaml |multiple_choice | | |
| |arc_ca_easy |lm_eval/tasks/catalan_bench/arc_ca_easy.yaml |multiple_choice | | |
| |arc_challenge |lm_eval/tasks/arc/arc_challenge.yaml |multiple_choice | | |
| |arc_challenge_chat |lm_eval/tasks/arc/arc_challenge_chat.yaml |generate_until | | |
| |arc_challenge_llama |lm_eval/tasks/llama3/instruct/arc_challenge/arc_challenge_llama.yaml |generate_until | | |
| |arc_challenge_mt_da |lm_eval/tasks/arc_mt/arc_challenge_mt_da.yaml |multiple_choice | | |
| |arc_challenge_mt_de |lm_eval/tasks/arc_mt/arc_challenge_mt_de.yaml |multiple_choice | | |
| |arc_challenge_mt_el |lm_eval/tasks/arc_mt/arc_challenge_mt_el.yaml |multiple_choice | | |
| |arc_challenge_mt_es |lm_eval/tasks/arc_mt/arc_challenge_mt_es.yaml |multiple_choice | | |
| |arc_challenge_mt_fi |lm_eval/tasks/arc_mt/arc_challenge_mt_fi.yaml |multiple_choice | | |
| |arc_challenge_mt_hu |lm_eval/tasks/arc_mt/arc_challenge_mt_hu.yaml |multiple_choice | | |
| |arc_challenge_mt_is |lm_eval/tasks/arc_mt/arc_challenge_mt_is.yaml |multiple_choice | | |
| |arc_challenge_mt_it |lm_eval/tasks/arc_mt/arc_challenge_mt_it.yaml |multiple_choice | | |
| |arc_challenge_mt_nb |lm_eval/tasks/arc_mt/arc_challenge_mt_nb.yaml |multiple_choice | | |
| |arc_challenge_mt_pl |lm_eval/tasks/arc_mt/arc_challenge_mt_pl.yaml |multiple_choice | | |
| |arc_challenge_mt_pt |lm_eval/tasks/arc_mt/arc_challenge_mt_pt.yaml |multiple_choice | | |
| |arc_challenge_mt_sv |lm_eval/tasks/arc_mt/arc_challenge_mt_sv.yaml |multiple_choice | | |
| |arc_da |lm_eval/tasks/okapi/arc_multilingual/arc_da.yaml |multiple_choice | | |
| |arc_de |lm_eval/tasks/okapi/arc_multilingual/arc_de.yaml |multiple_choice | | |
| |arc_easy |lm_eval/tasks/arc/arc_easy.yaml |multiple_choice | | |
| |arc_es |lm_eval/tasks/okapi/arc_multilingual/arc_es.yaml |multiple_choice | | |
| |arc_eu |lm_eval/tasks/okapi/arc_multilingual/arc_eu.yaml |multiple_choice | | |
| |arc_eu_challenge |lm_eval/tasks/basque_bench/arc_eu_challenge.yaml |multiple_choice | | |
| |arc_eu_easy |lm_eval/tasks/basque_bench/arc_eu_easy.yaml |multiple_choice | | |
| |arc_fr |lm_eval/tasks/okapi/arc_multilingual/arc_fr.yaml |multiple_choice | | |
| |arc_gu |lm_eval/tasks/okapi/arc_multilingual/arc_gu.yaml |multiple_choice | | |
| |arc_hi |lm_eval/tasks/okapi/arc_multilingual/arc_hi.yaml |multiple_choice | | |
| |arc_hr |lm_eval/tasks/okapi/arc_multilingual/arc_hr.yaml |multiple_choice | | |
| |arc_hu |lm_eval/tasks/okapi/arc_multilingual/arc_hu.yaml |multiple_choice | | |
| |arc_hy |lm_eval/tasks/okapi/arc_multilingual/arc_hy.yaml |multiple_choice | | |
| |arc_id |lm_eval/tasks/okapi/arc_multilingual/arc_id.yaml |multiple_choice | | |
| |arc_it |lm_eval/tasks/okapi/arc_multilingual/arc_it.yaml |multiple_choice | | |
| |arc_kn |lm_eval/tasks/okapi/arc_multilingual/arc_kn.yaml |multiple_choice | | |
| |arc_ml |lm_eval/tasks/okapi/arc_multilingual/arc_ml.yaml |multiple_choice | | |
| |arc_mr |lm_eval/tasks/okapi/arc_multilingual/arc_mr.yaml |multiple_choice | | |
| |arc_ne |lm_eval/tasks/okapi/arc_multilingual/arc_ne.yaml |multiple_choice | | |
| |arc_nl |lm_eval/tasks/okapi/arc_multilingual/arc_nl.yaml |multiple_choice | | |
| |arc_pt |lm_eval/tasks/okapi/arc_multilingual/arc_pt.yaml |multiple_choice | | |
| |arc_ro |lm_eval/tasks/okapi/arc_multilingual/arc_ro.yaml |multiple_choice | | |
| |arc_ru |lm_eval/tasks/okapi/arc_multilingual/arc_ru.yaml |multiple_choice | | |
| |arc_sk |lm_eval/tasks/okapi/arc_multilingual/arc_sk.yaml |multiple_choice | | |
| |arc_sr |lm_eval/tasks/okapi/arc_multilingual/arc_sr.yaml |multiple_choice | | |
| |arc_sv |lm_eval/tasks/okapi/arc_multilingual/arc_sv.yaml |multiple_choice | | |
| |arc_ta |lm_eval/tasks/okapi/arc_multilingual/arc_ta.yaml |multiple_choice | | |
| |arc_te |lm_eval/tasks/okapi/arc_multilingual/arc_te.yaml |multiple_choice | | |
| |arc_uk |lm_eval/tasks/okapi/arc_multilingual/arc_uk.yaml |multiple_choice | | |
| |arc_vi |lm_eval/tasks/okapi/arc_multilingual/arc_vi.yaml |multiple_choice | | |
| |arc_zh |lm_eval/tasks/okapi/arc_multilingual/arc_zh.yaml |multiple_choice | | |
| |argument_topic |lm_eval/tasks/unitxt/argument_topic.yaml | | | |
| |arithmetic_1dc |lm_eval/tasks/arithmetic/arithmetic_1dc.yaml |loglikelihood | | |
| |arithmetic_2da |lm_eval/tasks/arithmetic/arithmetic_2da.yaml |loglikelihood | | |
| |arithmetic_2dm |lm_eval/tasks/arithmetic/arithmetic_2dm.yaml |loglikelihood | | |
| |arithmetic_2ds |lm_eval/tasks/arithmetic/arithmetic_2ds.yaml |loglikelihood | | |
| |arithmetic_3da |lm_eval/tasks/arithmetic/arithmetic_3da.yaml |loglikelihood | | |
| |arithmetic_3ds |lm_eval/tasks/arithmetic/arithmetic_3ds.yaml |loglikelihood | | |
| |arithmetic_4da |lm_eval/tasks/arithmetic/arithmetic_4da.yaml |loglikelihood | | |
| |arithmetic_4ds |lm_eval/tasks/arithmetic/arithmetic_4ds.yaml |loglikelihood | | |
| |arithmetic_5da |lm_eval/tasks/arithmetic/arithmetic_5da.yaml |loglikelihood | | |
| |arithmetic_5ds |lm_eval/tasks/arithmetic/arithmetic_5ds.yaml |loglikelihood | | |
| |asdiv |lm_eval/tasks/asdiv/default.yaml |loglikelihood | | |
| |asdiv_cot_llama |lm_eval/tasks/asdiv/asdiv-cot-llama.yaml |generate_until | | |
| |ask_gec_p0 |lm_eval/tasks/noreval/ask_gec/ask_gec_p0.yaml |generate_until | | |
| |ask_gec_p1 |lm_eval/tasks/noreval/ask_gec/ask_gec_p1.yaml |generate_until | | |
| |ask_gec_p2 |lm_eval/tasks/noreval/ask_gec/ask_gec_p2.yaml |generate_until | | |
| |ask_gec_p3 |lm_eval/tasks/noreval/ask_gec/ask_gec_p3.yaml |generate_until | | |
| |ask_gec_p4 |lm_eval/tasks/noreval/ask_gec/ask_gec_p4.yaml |generate_until | | |
| |assin_entailment |lm_eval/tasks/portuguese_bench/assin_entailment.yaml |multiple_choice | | |
| |assin_paraphrase |lm_eval/tasks/portuguese_bench/assin_paraphrase.yaml |multiple_choice | | |
| |atis |lm_eval/tasks/unitxt/atis.yaml | | | |
| |babi |lm_eval/tasks/babi/babi.yaml |generate_until | | |
| |banking77 |lm_eval/tasks/unitxt/banking77.yaml | | | |
| |bbh_cot_fewshot_boolean_expressions |lm_eval/tasks/bbh/cot_fewshot/boolean_expressions.yaml |generate_until | | |
| |bbh_cot_fewshot_causal_judgement |lm_eval/tasks/bbh/cot_fewshot/causal_judgement.yaml |generate_until | | |
| |bbh_cot_fewshot_date_understanding |lm_eval/tasks/bbh/cot_fewshot/date_understanding.yaml |generate_until | | |
| |bbh_cot_fewshot_disambiguation_qa |lm_eval/tasks/bbh/cot_fewshot/disambiguation_qa.yaml |generate_until | | |
| |bbh_cot_fewshot_dyck_languages |lm_eval/tasks/bbh/cot_fewshot/dyck_languages.yaml |generate_until | | |
| |bbh_cot_fewshot_formal_fallacies |lm_eval/tasks/bbh/cot_fewshot/formal_fallacies.yaml |generate_until | | |
| |bbh_cot_fewshot_geometric_shapes |lm_eval/tasks/bbh/cot_fewshot/geometric_shapes.yaml |generate_until | | |
| |bbh_cot_fewshot_hyperbaton |lm_eval/tasks/bbh/cot_fewshot/hyperbaton.yaml |generate_until | | |
| |bbh_cot_fewshot_logical_deduction_five_objects |lm_eval/tasks/bbh/cot_fewshot/logical_deduction_five_objects.yaml |generate_until | | |
| |bbh_cot_fewshot_logical_deduction_seven_objects |lm_eval/tasks/bbh/cot_fewshot/logical_deduction_seven_objects.yaml |generate_until | | |
| |bbh_cot_fewshot_logical_deduction_three_objects |lm_eval/tasks/bbh/cot_fewshot/logical_deduction_three_objects.yaml |generate_until | | |
| |bbh_cot_fewshot_movie_recommendation |lm_eval/tasks/bbh/cot_fewshot/movie_recommendation.yaml |generate_until | | |
| |bbh_cot_fewshot_multistep_arithmetic_two |lm_eval/tasks/bbh/cot_fewshot/multistep_arithmetic_two.yaml |generate_until | | |
| |bbh_cot_fewshot_navigate |lm_eval/tasks/bbh/cot_fewshot/navigate.yaml |generate_until | | |
| |bbh_cot_fewshot_object_counting |lm_eval/tasks/bbh/cot_fewshot/object_counting.yaml |generate_until | | |
| |bbh_cot_fewshot_penguins_in_a_table |lm_eval/tasks/bbh/cot_fewshot/penguins_in_a_table.yaml |generate_until | | |
| |bbh_cot_fewshot_reasoning_about_colored_objects |lm_eval/tasks/bbh/cot_fewshot/reasoning_about_colored_objects.yaml |generate_until | | |
| |bbh_cot_fewshot_ruin_names |lm_eval/tasks/bbh/cot_fewshot/ruin_names.yaml |generate_until | | |
| |bbh_cot_fewshot_salient_translation_error_detection |lm_eval/tasks/bbh/cot_fewshot/salient_translation_error_detection.yaml |generate_until | | |
| |bbh_cot_fewshot_snarks |lm_eval/tasks/bbh/cot_fewshot/snarks.yaml |generate_until | | |
| |bbh_cot_fewshot_sports_understanding |lm_eval/tasks/bbh/cot_fewshot/sports_understanding.yaml |generate_until | | |
| |bbh_cot_fewshot_temporal_sequences |lm_eval/tasks/bbh/cot_fewshot/temporal_sequences.yaml |generate_until | | |
| |bbh_cot_fewshot_tracking_shuffled_objects_five_objects |lm_eval/tasks/bbh/cot_fewshot/tracking_shuffled_objects_five_objects.yaml |generate_until | | |
| |bbh_cot_fewshot_tracking_shuffled_objects_seven_objects |lm_eval/tasks/bbh/cot_fewshot/tracking_shuffled_objects_seven_objects.yaml |generate_until | | |
| |bbh_cot_fewshot_tracking_shuffled_objects_three_objects |lm_eval/tasks/bbh/cot_fewshot/tracking_shuffled_objects_three_objects.yaml |generate_until | | |
| |bbh_cot_fewshot_web_of_lies |lm_eval/tasks/bbh/cot_fewshot/web_of_lies.yaml |generate_until | | |
| |bbh_cot_fewshot_word_sorting |lm_eval/tasks/bbh/cot_fewshot/word_sorting.yaml |generate_until | | |
| |bbh_cot_zeroshot_boolean_expressions |lm_eval/tasks/bbh/cot_zeroshot/boolean_expressions.yaml |generate_until | | |
| |bbh_cot_zeroshot_causal_judgement |lm_eval/tasks/bbh/cot_zeroshot/causal_judgement.yaml |generate_until | | |
| |bbh_cot_zeroshot_date_understanding |lm_eval/tasks/bbh/cot_zeroshot/date_understanding.yaml |generate_until | | |
| |bbh_cot_zeroshot_disambiguation_qa |lm_eval/tasks/bbh/cot_zeroshot/disambiguation_qa.yaml |generate_until | | |
| |bbh_cot_zeroshot_dyck_languages |lm_eval/tasks/bbh/cot_zeroshot/dyck_languages.yaml |generate_until | | |
| |bbh_cot_zeroshot_formal_fallacies |lm_eval/tasks/bbh/cot_zeroshot/formal_fallacies.yaml |generate_until | | |
| |bbh_cot_zeroshot_geometric_shapes |lm_eval/tasks/bbh/cot_zeroshot/geometric_shapes.yaml |generate_until | | |
| |bbh_cot_zeroshot_hyperbaton |lm_eval/tasks/bbh/cot_zeroshot/hyperbaton.yaml |generate_until | | |
| |bbh_cot_zeroshot_logical_deduction_five_objects |lm_eval/tasks/bbh/cot_zeroshot/logical_deduction_five_objects.yaml |generate_until | | |
| |bbh_cot_zeroshot_logical_deduction_seven_objects |lm_eval/tasks/bbh/cot_zeroshot/logical_deduction_seven_objects.yaml |generate_until | | |
| |bbh_cot_zeroshot_logical_deduction_three_objects |lm_eval/tasks/bbh/cot_zeroshot/logical_deduction_three_objects.yaml |generate_until | | |
| |bbh_cot_zeroshot_movie_recommendation |lm_eval/tasks/bbh/cot_zeroshot/movie_recommendation.yaml |generate_until | | |
| |bbh_cot_zeroshot_multistep_arithmetic_two |lm_eval/tasks/bbh/cot_zeroshot/multistep_arithmetic_two.yaml |generate_until | | |
| |bbh_cot_zeroshot_navigate |lm_eval/tasks/bbh/cot_zeroshot/navigate.yaml |generate_until | | |
| |bbh_cot_zeroshot_object_counting |lm_eval/tasks/bbh/cot_zeroshot/object_counting.yaml |generate_until | | |
| |bbh_cot_zeroshot_penguins_in_a_table |lm_eval/tasks/bbh/cot_zeroshot/penguins_in_a_table.yaml |generate_until | | |
| |bbh_cot_zeroshot_reasoning_about_colored_objects |lm_eval/tasks/bbh/cot_zeroshot/reasoning_about_colored_objects.yaml |generate_until | | |
| |bbh_cot_zeroshot_ruin_names |lm_eval/tasks/bbh/cot_zeroshot/ruin_names.yaml |generate_until | | |
| |bbh_cot_zeroshot_salient_translation_error_detection |lm_eval/tasks/bbh/cot_zeroshot/salient_translation_error_detection.yaml |generate_until | | |
| |bbh_cot_zeroshot_snarks |lm_eval/tasks/bbh/cot_zeroshot/snarks.yaml |generate_until | | |
| |bbh_cot_zeroshot_sports_understanding |lm_eval/tasks/bbh/cot_zeroshot/sports_understanding.yaml |generate_until | | |
| |bbh_cot_zeroshot_temporal_sequences |lm_eval/tasks/bbh/cot_zeroshot/temporal_sequences.yaml |generate_until | | |
| |bbh_cot_zeroshot_tracking_shuffled_objects_five_objects |lm_eval/tasks/bbh/cot_zeroshot/tracking_shuffled_objects_five_objects.yaml |generate_until | | |
| |bbh_cot_zeroshot_tracking_shuffled_objects_seven_objects |lm_eval/tasks/bbh/cot_zeroshot/tracking_shuffled_objects_seven_objects.yaml |generate_until | | |
| |bbh_cot_zeroshot_tracking_shuffled_objects_three_objects |lm_eval/tasks/bbh/cot_zeroshot/tracking_shuffled_objects_three_objects.yaml |generate_until | | |
| |bbh_cot_zeroshot_web_of_lies |lm_eval/tasks/bbh/cot_zeroshot/web_of_lies.yaml |generate_until | | |
| |bbh_cot_zeroshot_word_sorting |lm_eval/tasks/bbh/cot_zeroshot/word_sorting.yaml |generate_until | | |
| |bbh_fewshot_boolean_expressions |lm_eval/tasks/bbh/fewshot/boolean_expressions.yaml |generate_until | | |
| |bbh_fewshot_causal_judgement |lm_eval/tasks/bbh/fewshot/causal_judgement.yaml |generate_until | | |
| |bbh_fewshot_date_understanding |lm_eval/tasks/bbh/fewshot/date_understanding.yaml |generate_until | | |
| |bbh_fewshot_disambiguation_qa |lm_eval/tasks/bbh/fewshot/disambiguation_qa.yaml |generate_until | | |
| |bbh_fewshot_dyck_languages |lm_eval/tasks/bbh/fewshot/dyck_languages.yaml |generate_until | | |
| |bbh_fewshot_formal_fallacies |lm_eval/tasks/bbh/fewshot/formal_fallacies.yaml |generate_until | | |
| |bbh_fewshot_geometric_shapes |lm_eval/tasks/bbh/fewshot/geometric_shapes.yaml |generate_until | | |
| |bbh_fewshot_hyperbaton |lm_eval/tasks/bbh/fewshot/hyperbaton.yaml |generate_until | | |
| |bbh_fewshot_logical_deduction_five_objects |lm_eval/tasks/bbh/fewshot/logical_deduction_five_objects.yaml |generate_until | | |
| |bbh_fewshot_logical_deduction_seven_objects |lm_eval/tasks/bbh/fewshot/logical_deduction_seven_objects.yaml |generate_until | | |
| |bbh_fewshot_logical_deduction_three_objects |lm_eval/tasks/bbh/fewshot/logical_deduction_three_objects.yaml |generate_until | | |
| |bbh_fewshot_movie_recommendation |lm_eval/tasks/bbh/fewshot/movie_recommendation.yaml |generate_until | | |
| |bbh_fewshot_multistep_arithmetic_two |lm_eval/tasks/bbh/fewshot/multistep_arithmetic_two.yaml |generate_until | | |
| |bbh_fewshot_navigate |lm_eval/tasks/bbh/fewshot/navigate.yaml |generate_until | | |
| |bbh_fewshot_object_counting |lm_eval/tasks/bbh/fewshot/object_counting.yaml |generate_until | | |
| |bbh_fewshot_penguins_in_a_table |lm_eval/tasks/bbh/fewshot/penguins_in_a_table.yaml |generate_until | | |
| |bbh_fewshot_reasoning_about_colored_objects |lm_eval/tasks/bbh/fewshot/reasoning_about_colored_objects.yaml |generate_until | | |
| |bbh_fewshot_ruin_names |lm_eval/tasks/bbh/fewshot/ruin_names.yaml |generate_until | | |
| |bbh_fewshot_salient_translation_error_detection |lm_eval/tasks/bbh/fewshot/salient_translation_error_detection.yaml |generate_until | | |
| |bbh_fewshot_snarks |lm_eval/tasks/bbh/fewshot/snarks.yaml |generate_until | | |
| |bbh_fewshot_sports_understanding |lm_eval/tasks/bbh/fewshot/sports_understanding.yaml |generate_until | | |
| |bbh_fewshot_temporal_sequences |lm_eval/tasks/bbh/fewshot/temporal_sequences.yaml |generate_until | | |
| |bbh_fewshot_tracking_shuffled_objects_five_objects |lm_eval/tasks/bbh/fewshot/tracking_shuffled_objects_five_objects.yaml |generate_until | | |
| |bbh_fewshot_tracking_shuffled_objects_seven_objects |lm_eval/tasks/bbh/fewshot/tracking_shuffled_objects_seven_objects.yaml |generate_until | | |
| |bbh_fewshot_tracking_shuffled_objects_three_objects |lm_eval/tasks/bbh/fewshot/tracking_shuffled_objects_three_objects.yaml |generate_until | | |
| |bbh_fewshot_web_of_lies |lm_eval/tasks/bbh/fewshot/web_of_lies.yaml |generate_until | | |
| |bbh_fewshot_word_sorting |lm_eval/tasks/bbh/fewshot/word_sorting.yaml |generate_until | | |
| |bbh_zeroshot_boolean_expressions |lm_eval/tasks/bbh/zeroshot/boolean_expressions.yaml |generate_until | | |
| |bbh_zeroshot_causal_judgement |lm_eval/tasks/bbh/zeroshot/causal_judgement.yaml |generate_until | | |
| |bbh_zeroshot_date_understanding |lm_eval/tasks/bbh/zeroshot/date_understanding.yaml |generate_until | | |
| |bbh_zeroshot_disambiguation_qa |lm_eval/tasks/bbh/zeroshot/disambiguation_qa.yaml |generate_until | | |
| |bbh_zeroshot_dyck_languages |lm_eval/tasks/bbh/zeroshot/dyck_languages.yaml |generate_until | | |
| |bbh_zeroshot_formal_fallacies |lm_eval/tasks/bbh/zeroshot/formal_fallacies.yaml |generate_until | | |
| |bbh_zeroshot_geometric_shapes |lm_eval/tasks/bbh/zeroshot/geometric_shapes.yaml |generate_until | | |
| |bbh_zeroshot_hyperbaton |lm_eval/tasks/bbh/zeroshot/hyperbaton.yaml |generate_until | | |
| |bbh_zeroshot_logical_deduction_five_objects |lm_eval/tasks/bbh/zeroshot/logical_deduction_five_objects.yaml |generate_until | | |
| |bbh_zeroshot_logical_deduction_seven_objects |lm_eval/tasks/bbh/zeroshot/logical_deduction_seven_objects.yaml |generate_until | | |
| |bbh_zeroshot_logical_deduction_three_objects |lm_eval/tasks/bbh/zeroshot/logical_deduction_three_objects.yaml |generate_until | | |
| |bbh_zeroshot_movie_recommendation |lm_eval/tasks/bbh/zeroshot/movie_recommendation.yaml |generate_until | | |
| |bbh_zeroshot_multistep_arithmetic_two |lm_eval/tasks/bbh/zeroshot/multistep_arithmetic_two.yaml |generate_until | | |
| |bbh_zeroshot_navigate |lm_eval/tasks/bbh/zeroshot/navigate.yaml |generate_until | | |
| |bbh_zeroshot_object_counting |lm_eval/tasks/bbh/zeroshot/object_counting.yaml |generate_until | | |
| |bbh_zeroshot_penguins_in_a_table |lm_eval/tasks/bbh/zeroshot/penguins_in_a_table.yaml |generate_until | | |
| |bbh_zeroshot_reasoning_about_colored_objects |lm_eval/tasks/bbh/zeroshot/reasoning_about_colored_objects.yaml |generate_until | | |
| |bbh_zeroshot_ruin_names |lm_eval/tasks/bbh/zeroshot/ruin_names.yaml |generate_until | | |
| |bbh_zeroshot_salient_translation_error_detection |lm_eval/tasks/bbh/zeroshot/salient_translation_error_detection.yaml |generate_until | | |
| |bbh_zeroshot_snarks |lm_eval/tasks/bbh/zeroshot/snarks.yaml |generate_until | | |
| |bbh_zeroshot_sports_understanding |lm_eval/tasks/bbh/zeroshot/sports_understanding.yaml |generate_until | | |
| |bbh_zeroshot_temporal_sequences |lm_eval/tasks/bbh/zeroshot/temporal_sequences.yaml |generate_until | | |
| |bbh_zeroshot_tracking_shuffled_objects_five_objects |lm_eval/tasks/bbh/zeroshot/tracking_shuffled_objects_five_objects.yaml |generate_until | | |
| |bbh_zeroshot_tracking_shuffled_objects_seven_objects |lm_eval/tasks/bbh/zeroshot/tracking_shuffled_objects_seven_objects.yaml |generate_until | | |
| |bbh_zeroshot_tracking_shuffled_objects_three_objects |lm_eval/tasks/bbh/zeroshot/tracking_shuffled_objects_three_objects.yaml |generate_until | | |
| |bbh_zeroshot_web_of_lies |lm_eval/tasks/bbh/zeroshot/web_of_lies.yaml |generate_until | | |
| |bbh_zeroshot_word_sorting |lm_eval/tasks/bbh/zeroshot/word_sorting.yaml |generate_until | | |
| |bbq |lm_eval/tasks/bbq/bbq_multiple_choice.yaml |multiple_choice | | |
| |bbq_ambig |lm_eval/tasks/bbq/bbq_multiple_choice_ambig.yaml |multiple_choice | | |
| |bbq_disambig |lm_eval/tasks/bbq/bbq_multiple_choice_disambig.yaml |multiple_choice | | |
| |bbq_generate |lm_eval/tasks/bbq/bbq_generate.yaml |generate_until | | |
| |bbq_generate_ambig |lm_eval/tasks/bbq/bbq_generate_ambig.yaml |generate_until | | |
| |bbq_generate_disambig |lm_eval/tasks/bbq/bbq_generate_disambig.yaml |generate_until | | |
| |bec2016eu |lm_eval/tasks/basqueglue/bec.yaml |multiple_choice | | |
| |belebele_acm_Arab |lm_eval/tasks/belebele/belebele_acm_Arab.yaml |multiple_choice | | |
| |belebele_afr_Latn |lm_eval/tasks/belebele/belebele_afr_Latn.yaml |multiple_choice | | |
| |belebele_afr_prompt_1 |lm_eval/tasks/afrobench/belebele/prompt_1/belebele_afr.yaml |multiple_choice | | |
| |belebele_afr_prompt_2 |lm_eval/tasks/afrobench/belebele/prompt_2/belebele_afr.yaml |multiple_choice | | |
| |belebele_afr_prompt_3 |lm_eval/tasks/afrobench/belebele/prompt_3/belebele_afr.yaml |multiple_choice | | |
| |belebele_afr_prompt_4 |lm_eval/tasks/afrobench/belebele/prompt_4/belebele_afr.yaml |multiple_choice | | |
| |belebele_afr_prompt_5 |lm_eval/tasks/afrobench/belebele/prompt_5/belebele_afr.yaml |multiple_choice | | |
| |belebele_als_Latn |lm_eval/tasks/belebele/belebele_als_Latn.yaml |multiple_choice | | |
| |belebele_amh_Ethi |lm_eval/tasks/belebele/belebele_amh_Ethi.yaml |multiple_choice | | |
| |belebele_amh_prompt_1 |lm_eval/tasks/afrobench/belebele/prompt_1/belebele_amh.yaml |multiple_choice | | |
| |belebele_amh_prompt_2 |lm_eval/tasks/afrobench/belebele/prompt_2/belebele_amh.yaml |multiple_choice | | |
| |belebele_amh_prompt_3 |lm_eval/tasks/afrobench/belebele/prompt_3/belebele_amh.yaml |multiple_choice | | |
| |belebele_amh_prompt_4 |lm_eval/tasks/afrobench/belebele/prompt_4/belebele_amh.yaml |multiple_choice | | |
| |belebele_amh_prompt_5 |lm_eval/tasks/afrobench/belebele/prompt_5/belebele_amh.yaml |multiple_choice | | |
| |belebele_apc_Arab |lm_eval/tasks/belebele/belebele_apc_Arab.yaml |multiple_choice | | |
| |belebele_arb_Arab |lm_eval/tasks/belebele/belebele_arb_Arab.yaml |multiple_choice | | |
| |belebele_arb_Latn |lm_eval/tasks/belebele/belebele_arb_Latn.yaml |multiple_choice | | |
| |belebele_ars_Arab |lm_eval/tasks/belebele/belebele_ars_Arab.yaml |multiple_choice | | |
| |belebele_ary_Arab |lm_eval/tasks/belebele/belebele_ary_Arab.yaml |multiple_choice | | |
| |belebele_ary_prompt_1 |lm_eval/tasks/afrobench/belebele/prompt_1/belebele_ary.yaml |multiple_choice | | |
| |belebele_ary_prompt_2 |lm_eval/tasks/afrobench/belebele/prompt_2/belebele_ary.yaml |multiple_choice | | |
| |belebele_ary_prompt_3 |lm_eval/tasks/afrobench/belebele/prompt_3/belebele_ary.yaml |multiple_choice | | |
| |belebele_ary_prompt_4 |lm_eval/tasks/afrobench/belebele/prompt_4/belebele_ary.yaml |multiple_choice | | |
| |belebele_ary_prompt_5 |lm_eval/tasks/afrobench/belebele/prompt_5/belebele_ary.yaml |multiple_choice | | |
| |belebele_arz_Arab |lm_eval/tasks/belebele/belebele_arz_Arab.yaml |multiple_choice | | |
| |belebele_arz_prompt_1 |lm_eval/tasks/afrobench/belebele/prompt_1/belebele_arz.yaml |multiple_choice | | |
| |belebele_arz_prompt_2 |lm_eval/tasks/afrobench/belebele/prompt_2/belebele_arz.yaml |multiple_choice | | |
| |belebele_arz_prompt_3 |lm_eval/tasks/afrobench/belebele/prompt_3/belebele_arz.yaml |multiple_choice | | |
| |belebele_arz_prompt_4 |lm_eval/tasks/afrobench/belebele/prompt_4/belebele_arz.yaml |multiple_choice | | |
| |belebele_arz_prompt_5 |lm_eval/tasks/afrobench/belebele/prompt_5/belebele_arz.yaml |multiple_choice | | |
| |belebele_asm_Beng |lm_eval/tasks/belebele/belebele_asm_Beng.yaml |multiple_choice | | |
| |belebele_azj_Latn |lm_eval/tasks/belebele/belebele_azj_Latn.yaml |multiple_choice | | |
| |belebele_bam_Latn |lm_eval/tasks/belebele/belebele_bam_Latn.yaml |multiple_choice | | |
| |belebele_bam_prompt_1 |lm_eval/tasks/afrobench/belebele/prompt_1/belebele_bam.yaml |multiple_choice | | |
| |belebele_bam_prompt_2 |lm_eval/tasks/afrobench/belebele/prompt_2/belebele_bam.yaml |multiple_choice | | |
| |belebele_bam_prompt_3 |lm_eval/tasks/afrobench/belebele/prompt_3/belebele_bam.yaml |multiple_choice | | |
| |belebele_bam_prompt_4 |lm_eval/tasks/afrobench/belebele/prompt_4/belebele_bam.yaml |multiple_choice | | |
| |belebele_bam_prompt_5 |lm_eval/tasks/afrobench/belebele/prompt_5/belebele_bam.yaml |multiple_choice | | |
| |belebele_ben_Beng |lm_eval/tasks/belebele/belebele_ben_Beng.yaml |multiple_choice | | |
| |belebele_ben_Latn |lm_eval/tasks/belebele/belebele_ben_Latn.yaml |multiple_choice | | |
| |belebele_bod_Tibt |lm_eval/tasks/belebele/belebele_bod_Tibt.yaml |multiple_choice | | |
| |belebele_bul_Cyrl |lm_eval/tasks/belebele/belebele_bul_Cyrl.yaml |multiple_choice | | |
| |belebele_cat_Latn |lm_eval/tasks/belebele/belebele_cat_Latn.yaml |multiple_choice | | |
| |belebele_ceb_Latn |lm_eval/tasks/belebele/belebele_ceb_Latn.yaml |multiple_choice | | |
| |belebele_ces_Latn |lm_eval/tasks/belebele/belebele_ces_Latn.yaml |multiple_choice | | |
| |belebele_ckb_Arab |lm_eval/tasks/belebele/belebele_ckb_Arab.yaml |multiple_choice | | |
| |belebele_dan_Latn |lm_eval/tasks/belebele/belebele_dan_Latn.yaml |multiple_choice | | |
| |belebele_deu_Latn |lm_eval/tasks/belebele/belebele_deu_Latn.yaml |multiple_choice | | |
| |belebele_ell_Grek |lm_eval/tasks/belebele/belebele_ell_Grek.yaml |multiple_choice | | |
| |belebele_eng_Latn |lm_eval/tasks/belebele/belebele_eng_Latn.yaml |multiple_choice | | |
| |belebele_eng_prompt_1 |lm_eval/tasks/afrobench/belebele/prompt_1/belebele_eng.yaml |multiple_choice | | |
| |belebele_eng_prompt_2 |lm_eval/tasks/afrobench/belebele/prompt_2/belebele_eng.yaml |multiple_choice | | |
| |belebele_eng_prompt_3 |lm_eval/tasks/afrobench/belebele/prompt_3/belebele_eng.yaml |multiple_choice | | |
| |belebele_eng_prompt_4 |lm_eval/tasks/afrobench/belebele/prompt_4/belebele_eng.yaml |multiple_choice | | |
| |belebele_eng_prompt_5 |lm_eval/tasks/afrobench/belebele/prompt_5/belebele_eng.yaml |multiple_choice | | |
| |belebele_est_Latn |lm_eval/tasks/belebele/belebele_est_Latn.yaml |multiple_choice | | |
| |belebele_eus_Latn |lm_eval/tasks/belebele/belebele_eus_Latn.yaml |multiple_choice | | |
| |belebele_fin_Latn |lm_eval/tasks/belebele/belebele_fin_Latn.yaml |multiple_choice | | |
| |belebele_fra_Latn |lm_eval/tasks/belebele/belebele_fra_Latn.yaml |multiple_choice | | |
| |belebele_fra_prompt_1 |lm_eval/tasks/afrobench/belebele/prompt_1/belebele_fra.yaml |multiple_choice | | |
| |belebele_fra_prompt_2 |lm_eval/tasks/afrobench/belebele/prompt_2/belebele_fra.yaml |multiple_choice | | |
| |belebele_fra_prompt_3 |lm_eval/tasks/afrobench/belebele/prompt_3/belebele_fra.yaml |multiple_choice | | |
| |belebele_fra_prompt_4 |lm_eval/tasks/afrobench/belebele/prompt_4/belebele_fra.yaml |multiple_choice | | |
| |belebele_fra_prompt_5 |lm_eval/tasks/afrobench/belebele/prompt_5/belebele_fra.yaml |multiple_choice | | |
| |belebele_fuv_Latn |lm_eval/tasks/belebele/belebele_fuv_Latn.yaml |multiple_choice | | |
| |belebele_fuv_prompt_1 |lm_eval/tasks/afrobench/belebele/prompt_1/belebele_fuv.yaml |multiple_choice | | |
| |belebele_fuv_prompt_2 |lm_eval/tasks/afrobench/belebele/prompt_2/belebele_fuv.yaml |multiple_choice | | |
| |belebele_fuv_prompt_3 |lm_eval/tasks/afrobench/belebele/prompt_3/belebele_fuv.yaml |multiple_choice | | |
| |belebele_fuv_prompt_4 |lm_eval/tasks/afrobench/belebele/prompt_4/belebele_fuv.yaml |multiple_choice | | |
| |belebele_fuv_prompt_5 |lm_eval/tasks/afrobench/belebele/prompt_5/belebele_fuv.yaml |multiple_choice | | |
| |belebele_gaz_Latn |lm_eval/tasks/belebele/belebele_gaz_Latn.yaml |multiple_choice | | |
| |belebele_gaz_prompt_1 |lm_eval/tasks/afrobench/belebele/prompt_1/belebele_gaz.yaml |multiple_choice | | |
| |belebele_gaz_prompt_2 |lm_eval/tasks/afrobench/belebele/prompt_2/belebele_gaz.yaml |multiple_choice | | |
| |belebele_gaz_prompt_3 |lm_eval/tasks/afrobench/belebele/prompt_3/belebele_gaz.yaml |multiple_choice | | |
| |belebele_gaz_prompt_4 |lm_eval/tasks/afrobench/belebele/prompt_4/belebele_gaz.yaml |multiple_choice | | |
| |belebele_gaz_prompt_5 |lm_eval/tasks/afrobench/belebele/prompt_5/belebele_gaz.yaml |multiple_choice | | |
| |belebele_glg_Latn |lm_eval/tasks/galician_bench/belebele_glg_Latn.yaml |multiple_choice | | |
| |belebele_grn_Latn |lm_eval/tasks/belebele/belebele_grn_Latn.yaml |multiple_choice | | |
| |belebele_guj_Gujr |lm_eval/tasks/belebele/belebele_guj_Gujr.yaml |multiple_choice | | |
| |belebele_hat_Latn |lm_eval/tasks/belebele/belebele_hat_Latn.yaml |multiple_choice | | |
| |belebele_hau_Latn |lm_eval/tasks/belebele/belebele_hau_Latn.yaml |multiple_choice | | |
| |belebele_hau_prompt_1 |lm_eval/tasks/afrobench/belebele/prompt_1/belebele_hau.yaml |multiple_choice | | |
| |belebele_hau_prompt_2 |lm_eval/tasks/afrobench/belebele/prompt_2/belebele_hau.yaml |multiple_choice | | |
| |belebele_hau_prompt_3 |lm_eval/tasks/afrobench/belebele/prompt_3/belebele_hau.yaml |multiple_choice | | |
| |belebele_hau_prompt_4 |lm_eval/tasks/afrobench/belebele/prompt_4/belebele_hau.yaml |multiple_choice | | |
| |belebele_hau_prompt_5 |lm_eval/tasks/afrobench/belebele/prompt_5/belebele_hau.yaml |multiple_choice | | |
| |belebele_heb_Hebr |lm_eval/tasks/belebele/belebele_heb_Hebr.yaml |multiple_choice | | |
| |belebele_hin_Deva |lm_eval/tasks/belebele/belebele_hin_Deva.yaml |multiple_choice | | |
| |belebele_hin_Latn |lm_eval/tasks/belebele/belebele_hin_Latn.yaml |multiple_choice | | |
| |belebele_hrv_Latn |lm_eval/tasks/belebele/belebele_hrv_Latn.yaml |multiple_choice | | |
| |belebele_hun_Latn |lm_eval/tasks/belebele/belebele_hun_Latn.yaml |multiple_choice | | |
| |belebele_hye_Armn |lm_eval/tasks/belebele/belebele_hye_Armn.yaml |multiple_choice | | |
| |belebele_ibo_Latn |lm_eval/tasks/belebele/belebele_ibo_Latn.yaml |multiple_choice | | |
| |belebele_ibo_prompt_1 |lm_eval/tasks/afrobench/belebele/prompt_1/belebele_ibo.yaml |multiple_choice | | |
| |belebele_ibo_prompt_2 |lm_eval/tasks/afrobench/belebele/prompt_2/belebele_ibo.yaml |multiple_choice | | |
| |belebele_ibo_prompt_3 |lm_eval/tasks/afrobench/belebele/prompt_3/belebele_ibo.yaml |multiple_choice | | |
| |belebele_ibo_prompt_4 |lm_eval/tasks/afrobench/belebele/prompt_4/belebele_ibo.yaml |multiple_choice | | |
| |belebele_ibo_prompt_5 |lm_eval/tasks/afrobench/belebele/prompt_5/belebele_ibo.yaml |multiple_choice | | |
| |belebele_ilo_Latn |lm_eval/tasks/belebele/belebele_ilo_Latn.yaml |multiple_choice | | |
| |belebele_ind_Latn |lm_eval/tasks/belebele/belebele_ind_Latn.yaml |multiple_choice | | |
| |belebele_isl_Latn |lm_eval/tasks/belebele/belebele_isl_Latn.yaml |multiple_choice | | |
| |belebele_ita_Latn |lm_eval/tasks/belebele/belebele_ita_Latn.yaml |multiple_choice | | |
| |belebele_jav_Latn |lm_eval/tasks/belebele/belebele_jav_Latn.yaml |multiple_choice | | |
| |belebele_jpn_Jpan |lm_eval/tasks/belebele/belebele_jpn_Jpan.yaml |multiple_choice | | |
| |belebele_kac_Latn |lm_eval/tasks/belebele/belebele_kac_Latn.yaml |multiple_choice | | |
| |belebele_kan_Knda |lm_eval/tasks/belebele/belebele_kan_Knda.yaml |multiple_choice | | |
| |belebele_kat_Geor |lm_eval/tasks/belebele/belebele_kat_Geor.yaml |multiple_choice | | |
| |belebele_kaz_Cyrl |lm_eval/tasks/belebele/belebele_kaz_Cyrl.yaml |multiple_choice | | |
| |belebele_kea_Latn |lm_eval/tasks/belebele/belebele_kea_Latn.yaml |multiple_choice | | |
| |belebele_kea_prompt_1 |lm_eval/tasks/afrobench/belebele/prompt_1/belebele_kea.yaml |multiple_choice | | |
| |belebele_kea_prompt_2 |lm_eval/tasks/afrobench/belebele/prompt_2/belebele_kea.yaml |multiple_choice | | |
| |belebele_kea_prompt_3 |lm_eval/tasks/afrobench/belebele/prompt_3/belebele_kea.yaml |multiple_choice | | |
| |belebele_kea_prompt_4 |lm_eval/tasks/afrobench/belebele/prompt_4/belebele_kea.yaml |multiple_choice | | |
| |belebele_kea_prompt_5 |lm_eval/tasks/afrobench/belebele/prompt_5/belebele_kea.yaml |multiple_choice | | |
| |belebele_khk_Cyrl |lm_eval/tasks/belebele/belebele_khk_Cyrl.yaml |multiple_choice | | |
| |belebele_khm_Khmr |lm_eval/tasks/belebele/belebele_khm_Khmr.yaml |multiple_choice | | |
| |belebele_kin_Latn |lm_eval/tasks/belebele/belebele_kin_Latn.yaml |multiple_choice | | |
| |belebele_kin_prompt_1 |lm_eval/tasks/afrobench/belebele/prompt_1/belebele_kin.yaml |multiple_choice | | |
| |belebele_kin_prompt_2 |lm_eval/tasks/afrobench/belebele/prompt_2/belebele_kin.yaml |multiple_choice | | |
| |belebele_kin_prompt_3 |lm_eval/tasks/afrobench/belebele/prompt_3/belebele_kin.yaml |multiple_choice | | |
| |belebele_kin_prompt_4 |lm_eval/tasks/afrobench/belebele/prompt_4/belebele_kin.yaml |multiple_choice | | |
| |belebele_kin_prompt_5 |lm_eval/tasks/afrobench/belebele/prompt_5/belebele_kin.yaml |multiple_choice | | |
| |belebele_kir_Cyrl |lm_eval/tasks/belebele/belebele_kir_Cyrl.yaml |multiple_choice | | |
| |belebele_kor_Hang |lm_eval/tasks/belebele/belebele_kor_Hang.yaml |multiple_choice | | |
| |belebele_lao_Laoo |lm_eval/tasks/belebele/belebele_lao_Laoo.yaml |multiple_choice | | |
| |belebele_lin_Latn |lm_eval/tasks/belebele/belebele_lin_Latn.yaml |multiple_choice | | |
| |belebele_lin_prompt_1 |lm_eval/tasks/afrobench/belebele/prompt_1/belebele_lin.yaml |multiple_choice | | |
| |belebele_lin_prompt_2 |lm_eval/tasks/afrobench/belebele/prompt_2/belebele_lin.yaml |multiple_choice | | |
| |belebele_lin_prompt_3 |lm_eval/tasks/afrobench/belebele/prompt_3/belebele_lin.yaml |multiple_choice | | |
| |belebele_lin_prompt_4 |lm_eval/tasks/afrobench/belebele/prompt_4/belebele_lin.yaml |multiple_choice | | |
| |belebele_lin_prompt_5 |lm_eval/tasks/afrobench/belebele/prompt_5/belebele_lin.yaml |multiple_choice | | |
| |belebele_lit_Latn |lm_eval/tasks/belebele/belebele_lit_Latn.yaml |multiple_choice | | |
| |belebele_lug_Latn |lm_eval/tasks/belebele/belebele_lug_Latn.yaml |multiple_choice | | |
| |belebele_lug_prompt_1 |lm_eval/tasks/afrobench/belebele/prompt_1/belebele_lug.yaml |multiple_choice | | |
| |belebele_lug_prompt_2 |lm_eval/tasks/afrobench/belebele/prompt_2/belebele_lug.yaml |multiple_choice | | |
| |belebele_lug_prompt_3 |lm_eval/tasks/afrobench/belebele/prompt_3/belebele_lug.yaml |multiple_choice | | |
| |belebele_lug_prompt_4 |lm_eval/tasks/afrobench/belebele/prompt_4/belebele_lug.yaml |multiple_choice | | |
| |belebele_lug_prompt_5 |lm_eval/tasks/afrobench/belebele/prompt_5/belebele_lug.yaml |multiple_choice | | |
| |belebele_luo_Latn |lm_eval/tasks/belebele/belebele_luo_Latn.yaml |multiple_choice | | |
| |belebele_luo_prompt_1 |lm_eval/tasks/afrobench/belebele/prompt_1/belebele_luo.yaml |multiple_choice | | |
| |belebele_luo_prompt_2 |lm_eval/tasks/afrobench/belebele/prompt_2/belebele_luo.yaml |multiple_choice | | |
| |belebele_luo_prompt_3 |lm_eval/tasks/afrobench/belebele/prompt_3/belebele_luo.yaml |multiple_choice | | |
| |belebele_luo_prompt_4 |lm_eval/tasks/afrobench/belebele/prompt_4/belebele_luo.yaml |multiple_choice | | |
| |belebele_luo_prompt_5 |lm_eval/tasks/afrobench/belebele/prompt_5/belebele_luo.yaml |multiple_choice | | |
| |belebele_lvs_Latn |lm_eval/tasks/belebele/belebele_lvs_Latn.yaml |multiple_choice | | |
| |belebele_mal_Mlym |lm_eval/tasks/belebele/belebele_mal_Mlym.yaml |multiple_choice | | |
| |belebele_mar_Deva |lm_eval/tasks/belebele/belebele_mar_Deva.yaml |multiple_choice | | |
| |belebele_mkd_Cyrl |lm_eval/tasks/belebele/belebele_mkd_Cyrl.yaml |multiple_choice | | |
| |belebele_mlt_Latn |lm_eval/tasks/belebele/belebele_mlt_Latn.yaml |multiple_choice | | |
| |belebele_mri_Latn |lm_eval/tasks/belebele/belebele_mri_Latn.yaml |multiple_choice | | |
| |belebele_mya_Mymr |lm_eval/tasks/belebele/belebele_mya_Mymr.yaml |multiple_choice | | |
| |belebele_nld_Latn |lm_eval/tasks/belebele/belebele_nld_Latn.yaml |multiple_choice | | |
| |belebele_nob_Latn |lm_eval/tasks/belebele/belebele_nob_Latn.yaml |multiple_choice | | |
| |belebele_npi_Deva |lm_eval/tasks/belebele/belebele_npi_Deva.yaml |multiple_choice | | |
| |belebele_npi_Latn |lm_eval/tasks/belebele/belebele_npi_Latn.yaml |multiple_choice | | |
| |belebele_nso_Latn |lm_eval/tasks/belebele/belebele_nso_Latn.yaml |multiple_choice | | |
| |belebele_nya_Latn |lm_eval/tasks/belebele/belebele_nya_Latn.yaml |multiple_choice | | |
| |belebele_nya_prompt_1 |lm_eval/tasks/afrobench/belebele/prompt_1/belebele_nya.yaml |multiple_choice | | |
| |belebele_nya_prompt_2 |lm_eval/tasks/afrobench/belebele/prompt_2/belebele_nya.yaml |multiple_choice | | |
| |belebele_nya_prompt_3 |lm_eval/tasks/afrobench/belebele/prompt_3/belebele_nya.yaml |multiple_choice | | |
| |belebele_nya_prompt_4 |lm_eval/tasks/afrobench/belebele/prompt_4/belebele_nya.yaml |multiple_choice | | |
| |belebele_nya_prompt_5 |lm_eval/tasks/afrobench/belebele/prompt_5/belebele_nya.yaml |multiple_choice | | |
| |belebele_ory_Orya |lm_eval/tasks/belebele/belebele_ory_Orya.yaml |multiple_choice | | |
| |belebele_pan_Guru |lm_eval/tasks/belebele/belebele_pan_Guru.yaml |multiple_choice | | |
| |belebele_pbt_Arab |lm_eval/tasks/belebele/belebele_pbt_Arab.yaml |multiple_choice | | |
| |belebele_pes_Arab |lm_eval/tasks/belebele/belebele_pes_Arab.yaml |multiple_choice | | |
| |belebele_plt_Latn |lm_eval/tasks/belebele/belebele_plt_Latn.yaml |multiple_choice | | |
| |belebele_plt_prompt_1 |lm_eval/tasks/afrobench/belebele/prompt_1/belebele_plt.yaml |multiple_choice | | |
| |belebele_plt_prompt_2 |lm_eval/tasks/afrobench/belebele/prompt_2/belebele_plt.yaml |multiple_choice | | |
| |belebele_plt_prompt_3 |lm_eval/tasks/afrobench/belebele/prompt_3/belebele_plt.yaml |multiple_choice | | |
| |belebele_plt_prompt_4 |lm_eval/tasks/afrobench/belebele/prompt_4/belebele_plt.yaml |multiple_choice | | |
| |belebele_plt_prompt_5 |lm_eval/tasks/afrobench/belebele/prompt_5/belebele_plt.yaml |multiple_choice | | |
| |belebele_pol_Latn |lm_eval/tasks/belebele/belebele_pol_Latn.yaml |multiple_choice | | |
| |belebele_por_Latn |lm_eval/tasks/belebele/belebele_por_Latn.yaml |multiple_choice | | |
| |belebele_por_prompt_1 |lm_eval/tasks/afrobench/belebele/prompt_1/belebele_por.yaml |multiple_choice | | |
| |belebele_por_prompt_2 |lm_eval/tasks/afrobench/belebele/prompt_2/belebele_por.yaml |multiple_choice | | |
| |belebele_por_prompt_3 |lm_eval/tasks/afrobench/belebele/prompt_3/belebele_por.yaml |multiple_choice | | |
| |belebele_por_prompt_4 |lm_eval/tasks/afrobench/belebele/prompt_4/belebele_por.yaml |multiple_choice | | |
| |belebele_por_prompt_5 |lm_eval/tasks/afrobench/belebele/prompt_5/belebele_por.yaml |multiple_choice | | |
| |belebele_ron_Latn |lm_eval/tasks/belebele/belebele_ron_Latn.yaml |multiple_choice | | |
| |belebele_rus_Cyrl |lm_eval/tasks/belebele/belebele_rus_Cyrl.yaml |multiple_choice | | |
| |belebele_shn_Mymr |lm_eval/tasks/belebele/belebele_shn_Mymr.yaml |multiple_choice | | |
| |belebele_sin_Latn |lm_eval/tasks/belebele/belebele_sin_Latn.yaml |multiple_choice | | |
| |belebele_sin_Sinh |lm_eval/tasks/belebele/belebele_sin_Sinh.yaml |multiple_choice | | |
| |belebele_slk_Latn |lm_eval/tasks/belebele/belebele_slk_Latn.yaml |multiple_choice | | |
| |belebele_slv_Latn |lm_eval/tasks/belebele/belebele_slv_Latn.yaml |multiple_choice | | |
| |belebele_sna_Latn |lm_eval/tasks/belebele/belebele_sna_Latn.yaml |multiple_choice | | |
| |belebele_sna_prompt_1 |lm_eval/tasks/afrobench/belebele/prompt_1/belebele_sna.yaml |multiple_choice | | |
| |belebele_sna_prompt_2 |lm_eval/tasks/afrobench/belebele/prompt_2/belebele_sna.yaml |multiple_choice | | |
| |belebele_sna_prompt_3 |lm_eval/tasks/afrobench/belebele/prompt_3/belebele_sna.yaml |multiple_choice | | |
| |belebele_sna_prompt_4 |lm_eval/tasks/afrobench/belebele/prompt_4/belebele_sna.yaml |multiple_choice | | |
| |belebele_sna_prompt_5 |lm_eval/tasks/afrobench/belebele/prompt_5/belebele_sna.yaml |multiple_choice | | |
| |belebele_snd_Arab |lm_eval/tasks/belebele/belebele_snd_Arab.yaml |multiple_choice | | |
| |belebele_som_Latn |lm_eval/tasks/belebele/belebele_som_Latn.yaml |multiple_choice | | |
| |belebele_som_prompt_1 |lm_eval/tasks/afrobench/belebele/prompt_1/belebele_som.yaml |multiple_choice | | |
| |belebele_som_prompt_2 |lm_eval/tasks/afrobench/belebele/prompt_2/belebele_som.yaml |multiple_choice | | |
| |belebele_som_prompt_3 |lm_eval/tasks/afrobench/belebele/prompt_3/belebele_som.yaml |multiple_choice | | |
| |belebele_som_prompt_4 |lm_eval/tasks/afrobench/belebele/prompt_4/belebele_som.yaml |multiple_choice | | |
| |belebele_som_prompt_5 |lm_eval/tasks/afrobench/belebele/prompt_5/belebele_som.yaml |multiple_choice | | |
| |belebele_sot_Latn |lm_eval/tasks/belebele/belebele_sot_Latn.yaml |multiple_choice | | |
| |belebele_sot_prompt_1 |lm_eval/tasks/afrobench/belebele/prompt_1/belebele_sot.yaml |multiple_choice | | |
| |belebele_sot_prompt_2 |lm_eval/tasks/afrobench/belebele/prompt_2/belebele_sot.yaml |multiple_choice | | |
| |belebele_sot_prompt_3 |lm_eval/tasks/afrobench/belebele/prompt_3/belebele_sot.yaml |multiple_choice | | |
| |belebele_sot_prompt_4 |lm_eval/tasks/afrobench/belebele/prompt_4/belebele_sot.yaml |multiple_choice | | |
| |belebele_sot_prompt_5 |lm_eval/tasks/afrobench/belebele/prompt_5/belebele_sot.yaml |multiple_choice | | |
| |belebele_spa_Latn |lm_eval/tasks/belebele/belebele_spa_Latn.yaml |multiple_choice | | |
| |belebele_srp_Cyrl |lm_eval/tasks/belebele/belebele_srp_Cyrl.yaml |multiple_choice | | |
| |belebele_ssw_Latn |lm_eval/tasks/belebele/belebele_ssw_Latn.yaml |multiple_choice | | |
| |belebele_ssw_prompt_1 |lm_eval/tasks/afrobench/belebele/prompt_1/belebele_ssw.yaml |multiple_choice | | |
| |belebele_ssw_prompt_2 |lm_eval/tasks/afrobench/belebele/prompt_2/belebele_ssw.yaml |multiple_choice | | |
| |belebele_ssw_prompt_3 |lm_eval/tasks/afrobench/belebele/prompt_3/belebele_ssw.yaml |multiple_choice | | |
| |belebele_ssw_prompt_4 |lm_eval/tasks/afrobench/belebele/prompt_4/belebele_ssw.yaml |multiple_choice | | |
| |belebele_ssw_prompt_5 |lm_eval/tasks/afrobench/belebele/prompt_5/belebele_ssw.yaml |multiple_choice | | |
| |belebele_sun_Latn |lm_eval/tasks/belebele/belebele_sun_Latn.yaml |multiple_choice | | |
| |belebele_swa_prompt_1 |lm_eval/tasks/afrobench/belebele/prompt_1/belebele_swa.yaml |multiple_choice | | |
| |belebele_swa_prompt_2 |lm_eval/tasks/afrobench/belebele/prompt_2/belebele_swa.yaml |multiple_choice | | |
| |belebele_swa_prompt_3 |lm_eval/tasks/afrobench/belebele/prompt_3/belebele_swa.yaml |multiple_choice | | |
| |belebele_swa_prompt_4 |lm_eval/tasks/afrobench/belebele/prompt_4/belebele_swa.yaml |multiple_choice | | |
| |belebele_swa_prompt_5 |lm_eval/tasks/afrobench/belebele/prompt_5/belebele_swa.yaml |multiple_choice | | |
| |belebele_swe_Latn |lm_eval/tasks/belebele/belebele_swe_Latn.yaml |multiple_choice | | |
| |belebele_swh_Latn |lm_eval/tasks/belebele/belebele_swh_Latn.yaml |multiple_choice | | |
| |belebele_tam_Taml |lm_eval/tasks/belebele/belebele_tam_Taml.yaml |multiple_choice | | |
| |belebele_tel_Telu |lm_eval/tasks/belebele/belebele_tel_Telu.yaml |multiple_choice | | |
| |belebele_tgk_Cyrl |lm_eval/tasks/belebele/belebele_tgk_Cyrl.yaml |multiple_choice | | |
| |belebele_tgl_Latn |lm_eval/tasks/belebele/belebele_tgl_Latn.yaml |multiple_choice | | |
| |belebele_tha_Thai |lm_eval/tasks/belebele/belebele_tha_Thai.yaml |multiple_choice | | |
| |belebele_tir_Ethi |lm_eval/tasks/belebele/belebele_tir_Ethi.yaml |multiple_choice | | |
| |belebele_tir_prompt_1 |lm_eval/tasks/afrobench/belebele/prompt_1/belebele_tir.yaml |multiple_choice | | |
| |belebele_tir_prompt_2 |lm_eval/tasks/afrobench/belebele/prompt_2/belebele_tir.yaml |multiple_choice | | |
| |belebele_tir_prompt_3 |lm_eval/tasks/afrobench/belebele/prompt_3/belebele_tir.yaml |multiple_choice | | |
| |belebele_tir_prompt_4 |lm_eval/tasks/afrobench/belebele/prompt_4/belebele_tir.yaml |multiple_choice | | |
| |belebele_tir_prompt_5 |lm_eval/tasks/afrobench/belebele/prompt_5/belebele_tir.yaml |multiple_choice | | |
| |belebele_tsn_Latn |lm_eval/tasks/belebele/belebele_tsn_Latn.yaml |multiple_choice | | |
| |belebele_tsn_prompt_1 |lm_eval/tasks/afrobench/belebele/prompt_1/belebele_tsn.yaml |multiple_choice | | |
| |belebele_tsn_prompt_2 |lm_eval/tasks/afrobench/belebele/prompt_2/belebele_tsn.yaml |multiple_choice | | |
| |belebele_tsn_prompt_3 |lm_eval/tasks/afrobench/belebele/prompt_3/belebele_tsn.yaml |multiple_choice | | |
| |belebele_tsn_prompt_4 |lm_eval/tasks/afrobench/belebele/prompt_4/belebele_tsn.yaml |multiple_choice | | |
| |belebele_tsn_prompt_5 |lm_eval/tasks/afrobench/belebele/prompt_5/belebele_tsn.yaml |multiple_choice | | |
| |belebele_tso_Latn |lm_eval/tasks/belebele/belebele_tso_Latn.yaml |multiple_choice | | |
| |belebele_tso_prompt_1 |lm_eval/tasks/afrobench/belebele/prompt_1/belebele_tso.yaml |multiple_choice | | |
| |belebele_tso_prompt_2 |lm_eval/tasks/afrobench/belebele/prompt_2/belebele_tso.yaml |multiple_choice | | |
| |belebele_tso_prompt_3 |lm_eval/tasks/afrobench/belebele/prompt_3/belebele_tso.yaml |multiple_choice | | |
| |belebele_tso_prompt_4 |lm_eval/tasks/afrobench/belebele/prompt_4/belebele_tso.yaml |multiple_choice | | |
| |belebele_tso_prompt_5 |lm_eval/tasks/afrobench/belebele/prompt_5/belebele_tso.yaml |multiple_choice | | |
| |belebele_tur_Latn |lm_eval/tasks/belebele/belebele_tur_Latn.yaml |multiple_choice | | |
| |belebele_ukr_Cyrl |lm_eval/tasks/belebele/belebele_ukr_Cyrl.yaml |multiple_choice | | |
| |belebele_urd_Arab |lm_eval/tasks/belebele/belebele_urd_Arab.yaml |multiple_choice | | |
| |belebele_urd_Latn |lm_eval/tasks/belebele/belebele_urd_Latn.yaml |multiple_choice | | |
| |belebele_uzn_Latn |lm_eval/tasks/belebele/belebele_uzn_Latn.yaml |multiple_choice | | |
| |belebele_vie_Latn |lm_eval/tasks/belebele/belebele_vie_Latn.yaml |multiple_choice | | |
| |belebele_war_Latn |lm_eval/tasks/belebele/belebele_war_Latn.yaml |multiple_choice | | |
| |belebele_wol_Latn |lm_eval/tasks/belebele/belebele_wol_Latn.yaml |multiple_choice | | |
| |belebele_wol_prompt_1 |lm_eval/tasks/afrobench/belebele/prompt_1/belebele_wol.yaml |multiple_choice | | |
| |belebele_wol_prompt_2 |lm_eval/tasks/afrobench/belebele/prompt_2/belebele_wol.yaml |multiple_choice | | |
| |belebele_wol_prompt_3 |lm_eval/tasks/afrobench/belebele/prompt_3/belebele_wol.yaml |multiple_choice | | |
| |belebele_wol_prompt_4 |lm_eval/tasks/afrobench/belebele/prompt_4/belebele_wol.yaml |multiple_choice | | |
| |belebele_wol_prompt_5 |lm_eval/tasks/afrobench/belebele/prompt_5/belebele_wol.yaml |multiple_choice | | |
| |belebele_xho_Latn |lm_eval/tasks/belebele/belebele_xho_Latn.yaml |multiple_choice | | |
| |belebele_xho_prompt_1 |lm_eval/tasks/afrobench/belebele/prompt_1/belebele_xho.yaml |multiple_choice | | |
| |belebele_xho_prompt_2 |lm_eval/tasks/afrobench/belebele/prompt_2/belebele_xho.yaml |multiple_choice | | |
| |belebele_xho_prompt_3 |lm_eval/tasks/afrobench/belebele/prompt_3/belebele_xho.yaml |multiple_choice | | |
| |belebele_xho_prompt_4 |lm_eval/tasks/afrobench/belebele/prompt_4/belebele_xho.yaml |multiple_choice | | |
| |belebele_xho_prompt_5 |lm_eval/tasks/afrobench/belebele/prompt_5/belebele_xho.yaml |multiple_choice | | |
| |belebele_yor_Latn |lm_eval/tasks/belebele/belebele_yor_Latn.yaml |multiple_choice | | |
| |belebele_yor_prompt_1 |lm_eval/tasks/afrobench/belebele/prompt_1/belebele_yor.yaml |multiple_choice | | |
| |belebele_yor_prompt_2 |lm_eval/tasks/afrobench/belebele/prompt_2/belebele_yor.yaml |multiple_choice | | |
| |belebele_yor_prompt_3 |lm_eval/tasks/afrobench/belebele/prompt_3/belebele_yor.yaml |multiple_choice | | |
| |belebele_yor_prompt_4 |lm_eval/tasks/afrobench/belebele/prompt_4/belebele_yor.yaml |multiple_choice | | |
| |belebele_yor_prompt_5 |lm_eval/tasks/afrobench/belebele/prompt_5/belebele_yor.yaml |multiple_choice | | |
| |belebele_zho_Hans |lm_eval/tasks/belebele/belebele_zho_Hans.yaml |multiple_choice | | |
| |belebele_zho_Hant |lm_eval/tasks/belebele/belebele_zho_Hant.yaml |multiple_choice | | |
| |belebele_zsm_Latn |lm_eval/tasks/belebele/belebele_zsm_Latn.yaml |multiple_choice | | |
| |belebele_zul_Latn |lm_eval/tasks/belebele/belebele_zul_Latn.yaml |multiple_choice | | |
| |belebele_zul_prompt_1 |lm_eval/tasks/afrobench/belebele/prompt_1/belebele_zul.yaml |multiple_choice | | |
| |belebele_zul_prompt_2 |lm_eval/tasks/afrobench/belebele/prompt_2/belebele_zul.yaml |multiple_choice | | |
| |belebele_zul_prompt_3 |lm_eval/tasks/afrobench/belebele/prompt_3/belebele_zul.yaml |multiple_choice | | |
| |belebele_zul_prompt_4 |lm_eval/tasks/afrobench/belebele/prompt_4/belebele_zul.yaml |multiple_choice | | |
| |belebele_zul_prompt_5 |lm_eval/tasks/afrobench/belebele/prompt_5/belebele_zul.yaml |multiple_choice | | |
| |bertaqa_en |lm_eval/tasks/bertaqa/bertaqa_en.yaml |multiple_choice | | |
| |bertaqa_en_mt_gemma-7b |lm_eval/tasks/bertaqa/bertaqa_en_mt_gemma-7b.yaml |multiple_choice | | |
| |bertaqa_en_mt_hitz |lm_eval/tasks/bertaqa/bertaqa_en_mt_hitz.yaml |multiple_choice | | |
| |bertaqa_en_mt_itzuli |lm_eval/tasks/bertaqa/bertaqa_en_mt_itzuli.yaml |multiple_choice | | |
| |bertaqa_en_mt_latxa-13b-v1 |lm_eval/tasks/bertaqa/bertaqa_en_mt_latxa-13b-v1.yaml |multiple_choice | | |
| |bertaqa_en_mt_latxa-13b-v1.1 |lm_eval/tasks/bertaqa/bertaqa_en_mt_latxa-13b-v1.1.yaml |multiple_choice | | |
| |bertaqa_en_mt_latxa-70b-v1 |lm_eval/tasks/bertaqa/bertaqa_en_mt_latxa-70b-v1.yaml |multiple_choice | | |
| |bertaqa_en_mt_latxa-70b-v1.1 |lm_eval/tasks/bertaqa/bertaqa_en_mt_latxa-70b-v1.1.yaml |multiple_choice | | |
| |bertaqa_en_mt_latxa-7b-v1 |lm_eval/tasks/bertaqa/bertaqa_en_mt_latxa-7b-v1.yaml |multiple_choice | | |
| |bertaqa_en_mt_latxa-7b-v1.1 |lm_eval/tasks/bertaqa/bertaqa_en_mt_latxa-7b-v1.1.yaml |multiple_choice | | |
| |bertaqa_en_mt_llama-2-13b |lm_eval/tasks/bertaqa/bertaqa_en_mt_llama-2-13b.yaml |multiple_choice | | |
| |bertaqa_en_mt_llama-2-70b |lm_eval/tasks/bertaqa/bertaqa_en_mt_llama-2-70b.yaml |multiple_choice | | |
| |bertaqa_en_mt_llama-2-7b |lm_eval/tasks/bertaqa/bertaqa_en_mt_llama-2-7b.yaml |multiple_choice | | |
| |bertaqa_en_mt_madlad |lm_eval/tasks/bertaqa/bertaqa_en_mt_madlad.yaml |multiple_choice | | |
| |bertaqa_en_mt_nllb |lm_eval/tasks/bertaqa/bertaqa_en_mt_nllb.yaml |multiple_choice | | |
| |bertaqa_eu |lm_eval/tasks/bertaqa/bertaqa_eu.yaml |multiple_choice | | |
| |bhtc_v2 |lm_eval/tasks/basqueglue/bhtc.yaml |multiple_choice | | |
| |bigbench_abstract_narrative_understanding_generate_until |lm_eval/tasks/bigbench/generate_until/abstract_narrative_understanding.yaml |generate_until | | |
| |bigbench_abstract_narrative_understanding_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/abstract_narrative_understanding.yaml |multiple_choice | | |
| |bigbench_anachronisms_generate_until |lm_eval/tasks/bigbench/generate_until/anachronisms.yaml |generate_until | | |
| |bigbench_anachronisms_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/anachronisms.yaml |multiple_choice | | |
| |bigbench_analogical_similarity_generate_until |lm_eval/tasks/bigbench/generate_until/analogical_similarity.yaml |generate_until | | |
| |bigbench_analogical_similarity_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/analogical_similarity.yaml |multiple_choice | | |
| |bigbench_analytic_entailment_generate_until |lm_eval/tasks/bigbench/generate_until/analytic_entailment.yaml |generate_until | | |
| |bigbench_analytic_entailment_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/analytic_entailment.yaml |multiple_choice | | |
| |bigbench_arithmetic_generate_until |lm_eval/tasks/bigbench/generate_until/arithmetic.yaml |generate_until | | |
| |bigbench_arithmetic_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/arithmetic.yaml |multiple_choice | | |
| |bigbench_ascii_word_recognition_generate_until |lm_eval/tasks/bigbench/generate_until/ascii_word_recognition.yaml |generate_until | | |
| |bigbench_authorship_verification_generate_until |lm_eval/tasks/bigbench/generate_until/authorship_verification.yaml |generate_until | | |
| |bigbench_authorship_verification_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/authorship_verification.yaml |multiple_choice | | |
| |bigbench_auto_categorization_generate_until |lm_eval/tasks/bigbench/generate_until/auto_categorization.yaml |generate_until | | |
| |bigbench_auto_debugging_generate_until |lm_eval/tasks/bigbench/generate_until/auto_debugging.yaml |generate_until | | |
| |bigbench_bbq_lite_json_generate_until |lm_eval/tasks/bigbench/generate_until/bbq_lite_json.yaml |generate_until | | |
| |bigbench_bbq_lite_json_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/bbq_lite_json.yaml |multiple_choice | | |
| |bigbench_bridging_anaphora_resolution_barqa_generate_until |lm_eval/tasks/bigbench/generate_until/bridging_anaphora_resolution_barqa.yaml |generate_until | | |
| |bigbench_causal_judgment_generate_until |lm_eval/tasks/bigbench/generate_until/causal_judgment.yaml |generate_until | | |
| |bigbench_causal_judgment_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/causal_judgment.yaml |multiple_choice | | |
| |bigbench_cause_and_effect_generate_until |lm_eval/tasks/bigbench/generate_until/cause_and_effect.yaml |generate_until | | |
| |bigbench_cause_and_effect_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/cause_and_effect.yaml |multiple_choice | | |
| |bigbench_checkmate_in_one_generate_until |lm_eval/tasks/bigbench/generate_until/checkmate_in_one.yaml |generate_until | | |
| |bigbench_checkmate_in_one_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/checkmate_in_one.yaml |multiple_choice | | |
| |bigbench_chess_state_tracking_generate_until |lm_eval/tasks/bigbench/generate_until/chess_state_tracking.yaml |generate_until | | |
| |bigbench_chinese_remainder_theorem_generate_until |lm_eval/tasks/bigbench/generate_until/chinese_remainder_theorem.yaml |generate_until | | |
| |bigbench_cifar10_classification_generate_until |lm_eval/tasks/bigbench/generate_until/cifar10_classification.yaml |generate_until | | |
| |bigbench_cifar10_classification_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/cifar10_classification.yaml |multiple_choice | | |
| |bigbench_code_line_description_generate_until |lm_eval/tasks/bigbench/generate_until/code_line_description.yaml |generate_until | | |
| |bigbench_code_line_description_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/code_line_description.yaml |multiple_choice | | |
| |bigbench_codenames_generate_until |lm_eval/tasks/bigbench/generate_until/codenames.yaml |generate_until | | |
| |bigbench_color_generate_until |lm_eval/tasks/bigbench/generate_until/color.yaml |generate_until | | |
| |bigbench_color_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/color.yaml |multiple_choice | | |
| |bigbench_common_morpheme_generate_until |lm_eval/tasks/bigbench/generate_until/common_morpheme.yaml |generate_until | | |
| |bigbench_common_morpheme_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/common_morpheme.yaml |multiple_choice | | |
| |bigbench_conceptual_combinations_generate_until |lm_eval/tasks/bigbench/generate_until/conceptual_combinations.yaml |generate_until | | |
| |bigbench_conceptual_combinations_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/conceptual_combinations.yaml |multiple_choice | | |
| |bigbench_conlang_translation_generate_until |lm_eval/tasks/bigbench/generate_until/conlang_translation.yaml |generate_until | | |
| |bigbench_contextual_parametric_knowledge_conflicts_generate_until |lm_eval/tasks/bigbench/generate_until/contextual_parametric_knowledge_conflicts.yaml |generate_until | | |
| |bigbench_contextual_parametric_knowledge_conflicts_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/contextual_parametric_knowledge_conflicts.yaml |multiple_choice | | |
| |bigbench_crash_blossom_generate_until |lm_eval/tasks/bigbench/generate_until/crash_blossom.yaml |generate_until | | |
| |bigbench_crash_blossom_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/crash_blossom.yaml |multiple_choice | | |
| |bigbench_crass_ai_generate_until |lm_eval/tasks/bigbench/generate_until/crass_ai.yaml |generate_until | | |
| |bigbench_crass_ai_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/crass_ai.yaml |multiple_choice | | |
| |bigbench_cryobiology_spanish_generate_until |lm_eval/tasks/bigbench/generate_until/cryobiology_spanish.yaml |generate_until | | |
| |bigbench_cryobiology_spanish_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/cryobiology_spanish.yaml |multiple_choice | | |
| |bigbench_cryptonite_generate_until |lm_eval/tasks/bigbench/generate_until/cryptonite.yaml |generate_until | | |
| |bigbench_cs_algorithms_generate_until |lm_eval/tasks/bigbench/generate_until/cs_algorithms.yaml |generate_until | | |
| |bigbench_cs_algorithms_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/cs_algorithms.yaml |multiple_choice | | |
| |bigbench_dark_humor_detection_generate_until |lm_eval/tasks/bigbench/generate_until/dark_humor_detection.yaml |generate_until | | |
| |bigbench_dark_humor_detection_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/dark_humor_detection.yaml |multiple_choice | | |
| |bigbench_date_understanding_generate_until |lm_eval/tasks/bigbench/generate_until/date_understanding.yaml |generate_until | | |
| |bigbench_date_understanding_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/date_understanding.yaml |multiple_choice | | |
| |bigbench_disambiguation_qa_generate_until |lm_eval/tasks/bigbench/generate_until/disambiguation_qa.yaml |generate_until | | |
| |bigbench_disambiguation_qa_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/disambiguation_qa.yaml |multiple_choice | | |
| |bigbench_discourse_marker_prediction_generate_until |lm_eval/tasks/bigbench/generate_until/discourse_marker_prediction.yaml |generate_until | | |
| |bigbench_discourse_marker_prediction_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/discourse_marker_prediction.yaml |multiple_choice | | |
| |bigbench_disfl_qa_generate_until |lm_eval/tasks/bigbench/generate_until/disfl_qa.yaml |generate_until | | |
| |bigbench_dyck_languages_generate_until |lm_eval/tasks/bigbench/generate_until/dyck_languages.yaml |generate_until | | |
| |bigbench_dyck_languages_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/dyck_languages.yaml |multiple_choice | | |
| |bigbench_elementary_math_qa_generate_until |lm_eval/tasks/bigbench/generate_until/elementary_math_qa.yaml |generate_until | | |
| |bigbench_elementary_math_qa_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/elementary_math_qa.yaml |multiple_choice | | |
| |bigbench_emoji_movie_generate_until |lm_eval/tasks/bigbench/generate_until/emoji_movie.yaml |generate_until | | |
| |bigbench_emoji_movie_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/emoji_movie.yaml |multiple_choice | | |
| |bigbench_emojis_emotion_prediction_generate_until |lm_eval/tasks/bigbench/generate_until/emojis_emotion_prediction.yaml |generate_until | | |
| |bigbench_emojis_emotion_prediction_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/emojis_emotion_prediction.yaml |multiple_choice | | |
| |bigbench_empirical_judgments_generate_until |lm_eval/tasks/bigbench/generate_until/empirical_judgments.yaml |generate_until | | |
| |bigbench_empirical_judgments_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/empirical_judgments.yaml |multiple_choice | | |
| |bigbench_english_proverbs_generate_until |lm_eval/tasks/bigbench/generate_until/english_proverbs.yaml |generate_until | | |
| |bigbench_english_proverbs_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/english_proverbs.yaml |multiple_choice | | |
| |bigbench_english_russian_proverbs_generate_until |lm_eval/tasks/bigbench/generate_until/english_russian_proverbs.yaml |generate_until | | |
| |bigbench_english_russian_proverbs_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/english_russian_proverbs.yaml |multiple_choice | | |
| |bigbench_entailed_polarity_generate_until |lm_eval/tasks/bigbench/generate_until/entailed_polarity.yaml |generate_until | | |
| |bigbench_entailed_polarity_hindi_generate_until |lm_eval/tasks/bigbench/generate_until/entailed_polarity_hindi.yaml |generate_until | | |
| |bigbench_entailed_polarity_hindi_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/entailed_polarity_hindi.yaml |multiple_choice | | |
| |bigbench_entailed_polarity_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/entailed_polarity.yaml |multiple_choice | | |
| |bigbench_epistemic_reasoning_generate_until |lm_eval/tasks/bigbench/generate_until/epistemic_reasoning.yaml |generate_until | | |
| |bigbench_epistemic_reasoning_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/epistemic_reasoning.yaml |multiple_choice | | |
| |bigbench_evaluating_information_essentiality_generate_until |lm_eval/tasks/bigbench/generate_until/evaluating_information_essentiality.yaml |generate_until | | |
| |bigbench_evaluating_information_essentiality_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/evaluating_information_essentiality.yaml |multiple_choice | | |
| |bigbench_fact_checker_generate_until |lm_eval/tasks/bigbench/generate_until/fact_checker.yaml |generate_until | | |
| |bigbench_fact_checker_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/fact_checker.yaml |multiple_choice | | |
| |bigbench_fantasy_reasoning_generate_until |lm_eval/tasks/bigbench/generate_until/fantasy_reasoning.yaml |generate_until | | |
| |bigbench_fantasy_reasoning_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/fantasy_reasoning.yaml |multiple_choice | | |
| |bigbench_few_shot_nlg_generate_until |lm_eval/tasks/bigbench/generate_until/few_shot_nlg.yaml |generate_until | | |
| |bigbench_figure_of_speech_detection_generate_until |lm_eval/tasks/bigbench/generate_until/figure_of_speech_detection.yaml |generate_until | | |
| |bigbench_figure_of_speech_detection_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/figure_of_speech_detection.yaml |multiple_choice | | |
| |bigbench_formal_fallacies_syllogisms_negation_generate_until |lm_eval/tasks/bigbench/generate_until/formal_fallacies_syllogisms_negation.yaml |generate_until | | |
| |bigbench_formal_fallacies_syllogisms_negation_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/formal_fallacies_syllogisms_negation.yaml |multiple_choice | | |
| |bigbench_gem_generate_until |lm_eval/tasks/bigbench/generate_until/gem.yaml |generate_until | | |
| |bigbench_gender_inclusive_sentences_german_generate_until |lm_eval/tasks/bigbench/generate_until/gender_inclusive_sentences_german.yaml |generate_until | | |
| |bigbench_general_knowledge_generate_until |lm_eval/tasks/bigbench/generate_until/general_knowledge.yaml |generate_until | | |
| |bigbench_general_knowledge_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/general_knowledge.yaml |multiple_choice | | |
| |bigbench_geometric_shapes_generate_until |lm_eval/tasks/bigbench/generate_until/geometric_shapes.yaml |generate_until | | |
| |bigbench_geometric_shapes_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/geometric_shapes.yaml |multiple_choice | | |
| |bigbench_goal_step_wikihow_generate_until |lm_eval/tasks/bigbench/generate_until/goal_step_wikihow.yaml |generate_until | | |
| |bigbench_goal_step_wikihow_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/goal_step_wikihow.yaml |multiple_choice | | |
| |bigbench_gre_reading_comprehension_generate_until |lm_eval/tasks/bigbench/generate_until/gre_reading_comprehension.yaml |generate_until | | |
| |bigbench_gre_reading_comprehension_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/gre_reading_comprehension.yaml |multiple_choice | | |
| |bigbench_hhh_alignment_generate_until |lm_eval/tasks/bigbench/generate_until/hhh_alignment.yaml |generate_until | | |
| |bigbench_hhh_alignment_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/hhh_alignment.yaml |multiple_choice | | |
| |bigbench_hindi_question_answering_generate_until |lm_eval/tasks/bigbench/generate_until/hindi_question_answering.yaml |generate_until | | |
| |bigbench_hindu_knowledge_generate_until |lm_eval/tasks/bigbench/generate_until/hindu_knowledge.yaml |generate_until | | |
| |bigbench_hindu_knowledge_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/hindu_knowledge.yaml |multiple_choice | | |
| |bigbench_hinglish_toxicity_generate_until |lm_eval/tasks/bigbench/generate_until/hinglish_toxicity.yaml |generate_until | | |
| |bigbench_hinglish_toxicity_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/hinglish_toxicity.yaml |multiple_choice | | |
| |bigbench_human_organs_senses_generate_until |lm_eval/tasks/bigbench/generate_until/human_organs_senses.yaml |generate_until | | |
| |bigbench_human_organs_senses_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/human_organs_senses.yaml |multiple_choice | | |
| |bigbench_hyperbaton_generate_until |lm_eval/tasks/bigbench/generate_until/hyperbaton.yaml |generate_until | | |
| |bigbench_hyperbaton_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/hyperbaton.yaml |multiple_choice | | |
| |bigbench_identify_math_theorems_generate_until |lm_eval/tasks/bigbench/generate_until/identify_math_theorems.yaml |generate_until | | |
| |bigbench_identify_math_theorems_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/identify_math_theorems.yaml |multiple_choice | | |
| |bigbench_identify_odd_metaphor_generate_until |lm_eval/tasks/bigbench/generate_until/identify_odd_metaphor.yaml |generate_until | | |
| |bigbench_identify_odd_metaphor_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/identify_odd_metaphor.yaml |multiple_choice | | |
| |bigbench_implicatures_generate_until |lm_eval/tasks/bigbench/generate_until/implicatures.yaml |generate_until | | |
| |bigbench_implicatures_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/implicatures.yaml |multiple_choice | | |
| |bigbench_implicit_relations_generate_until |lm_eval/tasks/bigbench/generate_until/implicit_relations.yaml |generate_until | | |
| |bigbench_implicit_relations_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/implicit_relations.yaml |multiple_choice | | |
| |bigbench_intent_recognition_generate_until |lm_eval/tasks/bigbench/generate_until/intent_recognition.yaml |generate_until | | |
| |bigbench_intent_recognition_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/intent_recognition.yaml |multiple_choice | | |
| |bigbench_international_phonetic_alphabet_nli_generate_until |lm_eval/tasks/bigbench/generate_until/international_phonetic_alphabet_nli.yaml |generate_until | | |
| |bigbench_international_phonetic_alphabet_nli_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/international_phonetic_alphabet_nli.yaml |multiple_choice | | |
| |bigbench_international_phonetic_alphabet_transliterate_generate_until |lm_eval/tasks/bigbench/generate_until/international_phonetic_alphabet_transliterate.yaml |generate_until | | |
| |bigbench_intersect_geometry_generate_until |lm_eval/tasks/bigbench/generate_until/intersect_geometry.yaml |generate_until | | |
| |bigbench_intersect_geometry_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/intersect_geometry.yaml |multiple_choice | | |
| |bigbench_irony_identification_generate_until |lm_eval/tasks/bigbench/generate_until/irony_identification.yaml |generate_until | | |
| |bigbench_irony_identification_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/irony_identification.yaml |multiple_choice | | |
| |bigbench_kanji_ascii_generate_until |lm_eval/tasks/bigbench/generate_until/kanji_ascii.yaml |generate_until | | |
| |bigbench_kanji_ascii_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/kanji_ascii.yaml |multiple_choice | | |
| |bigbench_kannada_generate_until |lm_eval/tasks/bigbench/generate_until/kannada.yaml |generate_until | | |
| |bigbench_kannada_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/kannada.yaml |multiple_choice | | |
| |bigbench_key_value_maps_generate_until |lm_eval/tasks/bigbench/generate_until/key_value_maps.yaml |generate_until | | |
| |bigbench_key_value_maps_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/key_value_maps.yaml |multiple_choice | | |
| |bigbench_known_unknowns_generate_until |lm_eval/tasks/bigbench/generate_until/known_unknowns.yaml |generate_until | | |
| |bigbench_known_unknowns_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/known_unknowns.yaml |multiple_choice | | |
| |bigbench_language_games_generate_until |lm_eval/tasks/bigbench/generate_until/language_games.yaml |generate_until | | |
| |bigbench_language_identification_generate_until |lm_eval/tasks/bigbench/generate_until/language_identification.yaml |generate_until | | |
| |bigbench_language_identification_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/language_identification.yaml |multiple_choice | | |
| |bigbench_linguistic_mappings_generate_until |lm_eval/tasks/bigbench/generate_until/linguistic_mappings.yaml |generate_until | | |
| |bigbench_linguistics_puzzles_generate_until |lm_eval/tasks/bigbench/generate_until/linguistics_puzzles.yaml |generate_until | | |
| |bigbench_list_functions_generate_until |lm_eval/tasks/bigbench/generate_until/list_functions.yaml |generate_until | | |
| |bigbench_logic_grid_puzzle_generate_until |lm_eval/tasks/bigbench/generate_until/logic_grid_puzzle.yaml |generate_until | | |
| |bigbench_logic_grid_puzzle_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/logic_grid_puzzle.yaml |multiple_choice | | |
| |bigbench_logical_args_generate_until |lm_eval/tasks/bigbench/generate_until/logical_args.yaml |generate_until | | |
| |bigbench_logical_args_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/logical_args.yaml |multiple_choice | | |
| |bigbench_logical_deduction_generate_until |lm_eval/tasks/bigbench/generate_until/logical_deduction.yaml |generate_until | | |
| |bigbench_logical_deduction_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/logical_deduction.yaml |multiple_choice | | |
| |bigbench_logical_fallacy_detection_generate_until |lm_eval/tasks/bigbench/generate_until/logical_fallacy_detection.yaml |generate_until | | |
| |bigbench_logical_fallacy_detection_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/logical_fallacy_detection.yaml |multiple_choice | | |
| |bigbench_logical_sequence_generate_until |lm_eval/tasks/bigbench/generate_until/logical_sequence.yaml |generate_until | | |
| |bigbench_logical_sequence_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/logical_sequence.yaml |multiple_choice | | |
| |bigbench_mathematical_induction_generate_until |lm_eval/tasks/bigbench/generate_until/mathematical_induction.yaml |generate_until | | |
| |bigbench_mathematical_induction_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/mathematical_induction.yaml |multiple_choice | | |
| |bigbench_matrixshapes_generate_until |lm_eval/tasks/bigbench/generate_until/matrixshapes.yaml |generate_until | | |
| |bigbench_metaphor_boolean_generate_until |lm_eval/tasks/bigbench/generate_until/metaphor_boolean.yaml |generate_until | | |
| |bigbench_metaphor_boolean_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/metaphor_boolean.yaml |multiple_choice | | |
| |bigbench_metaphor_understanding_generate_until |lm_eval/tasks/bigbench/generate_until/metaphor_understanding.yaml |generate_until | | |
| |bigbench_metaphor_understanding_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/metaphor_understanding.yaml |multiple_choice | | |
| |bigbench_minute_mysteries_qa_generate_until |lm_eval/tasks/bigbench/generate_until/minute_mysteries_qa.yaml |generate_until | | |
| |bigbench_misconceptions_generate_until |lm_eval/tasks/bigbench/generate_until/misconceptions.yaml |generate_until | | |
| |bigbench_misconceptions_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/misconceptions.yaml |multiple_choice | | |
| |bigbench_misconceptions_russian_generate_until |lm_eval/tasks/bigbench/generate_until/misconceptions_russian.yaml |generate_until | | |
| |bigbench_misconceptions_russian_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/misconceptions_russian.yaml |multiple_choice | | |
| |bigbench_mnist_ascii_generate_until |lm_eval/tasks/bigbench/generate_until/mnist_ascii.yaml |generate_until | | |
| |bigbench_mnist_ascii_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/mnist_ascii.yaml |multiple_choice | | |
| |bigbench_modified_arithmetic_generate_until |lm_eval/tasks/bigbench/generate_until/modified_arithmetic.yaml |generate_until | | |
| |bigbench_moral_permissibility_generate_until |lm_eval/tasks/bigbench/generate_until/moral_permissibility.yaml |generate_until | | |
| |bigbench_moral_permissibility_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/moral_permissibility.yaml |multiple_choice | | |
| |bigbench_movie_dialog_same_or_different_generate_until |lm_eval/tasks/bigbench/generate_until/movie_dialog_same_or_different.yaml |generate_until | | |
| |bigbench_movie_dialog_same_or_different_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/movie_dialog_same_or_different.yaml |multiple_choice | | |
| |bigbench_movie_recommendation_generate_until |lm_eval/tasks/bigbench/generate_until/movie_recommendation.yaml |generate_until | | |
| |bigbench_movie_recommendation_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/movie_recommendation.yaml |multiple_choice | | |
| |bigbench_mult_data_wrangling_generate_until |lm_eval/tasks/bigbench/generate_until/mult_data_wrangling.yaml |generate_until | | |
| |bigbench_multiemo_generate_until |lm_eval/tasks/bigbench/generate_until/multiemo.yaml |generate_until | | |
| |bigbench_multiemo_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/multiemo.yaml |multiple_choice | | |
| |bigbench_natural_instructions_generate_until |lm_eval/tasks/bigbench/generate_until/natural_instructions.yaml |generate_until | | |
| |bigbench_navigate_generate_until |lm_eval/tasks/bigbench/generate_until/navigate.yaml |generate_until | | |
| |bigbench_navigate_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/navigate.yaml |multiple_choice | | |
| |bigbench_nonsense_words_grammar_generate_until |lm_eval/tasks/bigbench/generate_until/nonsense_words_grammar.yaml |generate_until | | |
| |bigbench_nonsense_words_grammar_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/nonsense_words_grammar.yaml |multiple_choice | | |
| |bigbench_novel_concepts_generate_until |lm_eval/tasks/bigbench/generate_until/novel_concepts.yaml |generate_until | | |
| |bigbench_novel_concepts_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/novel_concepts.yaml |multiple_choice | | |
| |bigbench_object_counting_generate_until |lm_eval/tasks/bigbench/generate_until/object_counting.yaml |generate_until | | |
| |bigbench_odd_one_out_generate_until |lm_eval/tasks/bigbench/generate_until/odd_one_out.yaml |generate_until | | |
| |bigbench_odd_one_out_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/odd_one_out.yaml |multiple_choice | | |
| |bigbench_operators_generate_until |lm_eval/tasks/bigbench/generate_until/operators.yaml |generate_until | | |
| |bigbench_paragraph_segmentation_generate_until |lm_eval/tasks/bigbench/generate_until/paragraph_segmentation.yaml |generate_until | | |
| |bigbench_parsinlu_qa_generate_until |lm_eval/tasks/bigbench/generate_until/parsinlu_qa.yaml |generate_until | | |
| |bigbench_parsinlu_qa_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/parsinlu_qa.yaml |multiple_choice | | |
| |bigbench_parsinlu_reading_comprehension_generate_until |lm_eval/tasks/bigbench/generate_until/parsinlu_reading_comprehension.yaml |generate_until | | |
| |bigbench_penguins_in_a_table_generate_until |lm_eval/tasks/bigbench/generate_until/penguins_in_a_table.yaml |generate_until | | |
| |bigbench_penguins_in_a_table_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/penguins_in_a_table.yaml |multiple_choice | | |
| |bigbench_periodic_elements_generate_until |lm_eval/tasks/bigbench/generate_until/periodic_elements.yaml |generate_until | | |
| |bigbench_periodic_elements_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/periodic_elements.yaml |multiple_choice | | |
| |bigbench_persian_idioms_generate_until |lm_eval/tasks/bigbench/generate_until/persian_idioms.yaml |generate_until | | |
| |bigbench_persian_idioms_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/persian_idioms.yaml |multiple_choice | | |
| |bigbench_phrase_relatedness_generate_until |lm_eval/tasks/bigbench/generate_until/phrase_relatedness.yaml |generate_until | | |
| |bigbench_phrase_relatedness_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/phrase_relatedness.yaml |multiple_choice | | |
| |bigbench_physical_intuition_generate_until |lm_eval/tasks/bigbench/generate_until/physical_intuition.yaml |generate_until | | |
| |bigbench_physical_intuition_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/physical_intuition.yaml |multiple_choice | | |
| |bigbench_physics_generate_until |lm_eval/tasks/bigbench/generate_until/physics.yaml |generate_until | | |
| |bigbench_physics_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/physics.yaml |multiple_choice | | |
| |bigbench_physics_questions_generate_until |lm_eval/tasks/bigbench/generate_until/physics_questions.yaml |generate_until | | |
| |bigbench_play_dialog_same_or_different_generate_until |lm_eval/tasks/bigbench/generate_until/play_dialog_same_or_different.yaml |generate_until | | |
| |bigbench_play_dialog_same_or_different_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/play_dialog_same_or_different.yaml |multiple_choice | | |
| |bigbench_polish_sequence_labeling_generate_until |lm_eval/tasks/bigbench/generate_until/polish_sequence_labeling.yaml |generate_until | | |
| |bigbench_presuppositions_as_nli_generate_until |lm_eval/tasks/bigbench/generate_until/presuppositions_as_nli.yaml |generate_until | | |
| |bigbench_presuppositions_as_nli_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/presuppositions_as_nli.yaml |multiple_choice | | |
| |bigbench_qa_wikidata_generate_until |lm_eval/tasks/bigbench/generate_until/qa_wikidata.yaml |generate_until | | |
| |bigbench_question_selection_generate_until |lm_eval/tasks/bigbench/generate_until/question_selection.yaml |generate_until | | |
| |bigbench_question_selection_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/question_selection.yaml |multiple_choice | | |
| |bigbench_real_or_fake_text_generate_until |lm_eval/tasks/bigbench/generate_until/real_or_fake_text.yaml |generate_until | | |
| |bigbench_real_or_fake_text_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/real_or_fake_text.yaml |multiple_choice | | |
| |bigbench_reasoning_about_colored_objects_generate_until |lm_eval/tasks/bigbench/generate_until/reasoning_about_colored_objects.yaml |generate_until | | |
| |bigbench_reasoning_about_colored_objects_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/reasoning_about_colored_objects.yaml |multiple_choice | | |
| |bigbench_repeat_copy_logic_generate_until |lm_eval/tasks/bigbench/generate_until/repeat_copy_logic.yaml |generate_until | | |
| |bigbench_rephrase_generate_until |lm_eval/tasks/bigbench/generate_until/rephrase.yaml |generate_until | | |
| |bigbench_riddle_sense_generate_until |lm_eval/tasks/bigbench/generate_until/riddle_sense.yaml |generate_until | | |
| |bigbench_riddle_sense_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/riddle_sense.yaml |multiple_choice | | |
| |bigbench_ruin_names_generate_until |lm_eval/tasks/bigbench/generate_until/ruin_names.yaml |generate_until | | |
| |bigbench_ruin_names_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/ruin_names.yaml |multiple_choice | | |
| |bigbench_salient_translation_error_detection_generate_until |lm_eval/tasks/bigbench/generate_until/salient_translation_error_detection.yaml |generate_until | | |
| |bigbench_salient_translation_error_detection_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/salient_translation_error_detection.yaml |multiple_choice | | |
| |bigbench_scientific_press_release_generate_until |lm_eval/tasks/bigbench/generate_until/scientific_press_release.yaml |generate_until | | |
| |bigbench_semantic_parsing_in_context_sparc_generate_until |lm_eval/tasks/bigbench/generate_until/semantic_parsing_in_context_sparc.yaml |generate_until | | |
| |bigbench_semantic_parsing_spider_generate_until |lm_eval/tasks/bigbench/generate_until/semantic_parsing_spider.yaml |generate_until | | |
| |bigbench_sentence_ambiguity_generate_until |lm_eval/tasks/bigbench/generate_until/sentence_ambiguity.yaml |generate_until | | |
| |bigbench_sentence_ambiguity_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/sentence_ambiguity.yaml |multiple_choice | | |
| |bigbench_similarities_abstraction_generate_until |lm_eval/tasks/bigbench/generate_until/similarities_abstraction.yaml |generate_until | | |
| |bigbench_similarities_abstraction_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/similarities_abstraction.yaml |multiple_choice | | |
| |bigbench_simp_turing_concept_generate_until |lm_eval/tasks/bigbench/generate_until/simp_turing_concept.yaml |generate_until | | |
| |bigbench_simple_arithmetic_json_generate_until |lm_eval/tasks/bigbench/generate_until/simple_arithmetic_json.yaml |generate_until | | |
| |bigbench_simple_arithmetic_json_multiple_choice_generate_until |lm_eval/tasks/bigbench/generate_until/simple_arithmetic_json_multiple_choice.yaml |generate_until | | |
| |bigbench_simple_arithmetic_json_subtasks_generate_until |lm_eval/tasks/bigbench/generate_until/simple_arithmetic_json_subtasks.yaml |generate_until | | |
| |bigbench_simple_arithmetic_multiple_targets_json_generate_until |lm_eval/tasks/bigbench/generate_until/simple_arithmetic_multiple_targets_json.yaml |generate_until | | |
| |bigbench_simple_ethical_questions_generate_until |lm_eval/tasks/bigbench/generate_until/simple_ethical_questions.yaml |generate_until | | |
| |bigbench_simple_ethical_questions_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/simple_ethical_questions.yaml |multiple_choice | | |
| |bigbench_simple_text_editing_generate_until |lm_eval/tasks/bigbench/generate_until/simple_text_editing.yaml |generate_until | | |
| |bigbench_snarks_generate_until |lm_eval/tasks/bigbench/generate_until/snarks.yaml |generate_until | | |
| |bigbench_snarks_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/snarks.yaml |multiple_choice | | |
| |bigbench_social_iqa_generate_until |lm_eval/tasks/bigbench/generate_until/social_iqa.yaml |generate_until | | |
| |bigbench_social_iqa_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/social_iqa.yaml |multiple_choice | | |
| |bigbench_social_support_generate_until |lm_eval/tasks/bigbench/generate_until/social_support.yaml |generate_until | | |
| |bigbench_social_support_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/social_support.yaml |multiple_choice | | |
| |bigbench_sports_understanding_generate_until |lm_eval/tasks/bigbench/generate_until/sports_understanding.yaml |generate_until | | |
| |bigbench_sports_understanding_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/sports_understanding.yaml |multiple_choice | | |
| |bigbench_strange_stories_generate_until |lm_eval/tasks/bigbench/generate_until/strange_stories.yaml |generate_until | | |
| |bigbench_strange_stories_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/strange_stories.yaml |multiple_choice | | |
| |bigbench_strategyqa_generate_until |lm_eval/tasks/bigbench/generate_until/strategyqa.yaml |generate_until | | |
| |bigbench_strategyqa_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/strategyqa.yaml |multiple_choice | | |
| |bigbench_sufficient_information_generate_until |lm_eval/tasks/bigbench/generate_until/sufficient_information.yaml |generate_until | | |
| |bigbench_suicide_risk_generate_until |lm_eval/tasks/bigbench/generate_until/suicide_risk.yaml |generate_until | | |
| |bigbench_suicide_risk_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/suicide_risk.yaml |multiple_choice | | |
| |bigbench_swahili_english_proverbs_generate_until |lm_eval/tasks/bigbench/generate_until/swahili_english_proverbs.yaml |generate_until | | |
| |bigbench_swahili_english_proverbs_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/swahili_english_proverbs.yaml |multiple_choice | | |
| |bigbench_swedish_to_german_proverbs_generate_until |lm_eval/tasks/bigbench/generate_until/swedish_to_german_proverbs.yaml |generate_until | | |
| |bigbench_swedish_to_german_proverbs_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/swedish_to_german_proverbs.yaml |multiple_choice | | |
| |bigbench_symbol_interpretation_generate_until |lm_eval/tasks/bigbench/generate_until/symbol_interpretation.yaml |generate_until | | |
| |bigbench_symbol_interpretation_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/symbol_interpretation.yaml |multiple_choice | | |
| |bigbench_temporal_sequences_generate_until |lm_eval/tasks/bigbench/generate_until/temporal_sequences.yaml |generate_until | | |
| |bigbench_temporal_sequences_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/temporal_sequences.yaml |multiple_choice | | |
| |bigbench_tense_generate_until |lm_eval/tasks/bigbench/generate_until/tense.yaml |generate_until | | |
| |bigbench_timedial_generate_until |lm_eval/tasks/bigbench/generate_until/timedial.yaml |generate_until | | |
| |bigbench_timedial_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/timedial.yaml |multiple_choice | | |
| |bigbench_topical_chat_generate_until |lm_eval/tasks/bigbench/generate_until/topical_chat.yaml |generate_until | | |
| |bigbench_tracking_shuffled_objects_generate_until |lm_eval/tasks/bigbench/generate_until/tracking_shuffled_objects.yaml |generate_until | | |
| |bigbench_tracking_shuffled_objects_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/tracking_shuffled_objects.yaml |multiple_choice | | |
| |bigbench_understanding_fables_generate_until |lm_eval/tasks/bigbench/generate_until/understanding_fables.yaml |generate_until | | |
| |bigbench_understanding_fables_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/understanding_fables.yaml |multiple_choice | | |
| |bigbench_undo_permutation_generate_until |lm_eval/tasks/bigbench/generate_until/undo_permutation.yaml |generate_until | | |
| |bigbench_undo_permutation_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/undo_permutation.yaml |multiple_choice | | |
| |bigbench_unit_conversion_generate_until |lm_eval/tasks/bigbench/generate_until/unit_conversion.yaml |generate_until | | |
| |bigbench_unit_conversion_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/unit_conversion.yaml |multiple_choice | | |
| |bigbench_unit_interpretation_generate_until |lm_eval/tasks/bigbench/generate_until/unit_interpretation.yaml |generate_until | | |
| |bigbench_unit_interpretation_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/unit_interpretation.yaml |multiple_choice | | |
| |bigbench_unnatural_in_context_learning_generate_until |lm_eval/tasks/bigbench/generate_until/unnatural_in_context_learning.yaml |generate_until | | |
| |bigbench_vitaminc_fact_verification_generate_until |lm_eval/tasks/bigbench/generate_until/vitaminc_fact_verification.yaml |generate_until | | |
| |bigbench_vitaminc_fact_verification_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/vitaminc_fact_verification.yaml |multiple_choice | | |
| |bigbench_what_is_the_tao_generate_until |lm_eval/tasks/bigbench/generate_until/what_is_the_tao.yaml |generate_until | | |
| |bigbench_what_is_the_tao_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/what_is_the_tao.yaml |multiple_choice | | |
| |bigbench_which_wiki_edit_generate_until |lm_eval/tasks/bigbench/generate_until/which_wiki_edit.yaml |generate_until | | |
| |bigbench_which_wiki_edit_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/which_wiki_edit.yaml |multiple_choice | | |
| |bigbench_winowhy_generate_until |lm_eval/tasks/bigbench/generate_until/winowhy.yaml |generate_until | | |
| |bigbench_winowhy_multiple_choice |lm_eval/tasks/bigbench/multiple_choice/winowhy.yaml |multiple_choice | | |
| |bigbench_word_sorting_generate_until |lm_eval/tasks/bigbench/generate_until/word_sorting.yaml |generate_until | | |
| |bigbench_word_unscrambling_generate_until |lm_eval/tasks/bigbench/generate_until/word_unscrambling.yaml |generate_until | | |
| |blimp_adjunct_island |lm_eval/tasks/blimp/adjunct_island.yaml |multiple_choice | | |
| |blimp_anaphor_gender_agreement |lm_eval/tasks/blimp/anaphor_gender_agreement.yaml |multiple_choice | | |
| |blimp_anaphor_number_agreement |lm_eval/tasks/blimp/anaphor_number_agreement.yaml |multiple_choice | | |
| |blimp_animate_subject_passive |lm_eval/tasks/blimp/animate_subject_passive.yaml |multiple_choice | | |
| |blimp_animate_subject_trans |lm_eval/tasks/blimp/animate_subject_trans.yaml |multiple_choice | | |
| |blimp_causative |lm_eval/tasks/blimp/causative.yaml |multiple_choice | | |
| |blimp_complex_NP_island |lm_eval/tasks/blimp/complex_NP_island.yaml |multiple_choice | | |
| |blimp_coordinate_structure_constraint_complex_left_branch |lm_eval/tasks/blimp/coordinate_structure_constraint_complex_left_branch.yaml |multiple_choice | | |
| |blimp_coordinate_structure_constraint_object_extraction |lm_eval/tasks/blimp/coordinate_structure_constraint_object_extraction.yaml |multiple_choice | | |
| |blimp_determiner_noun_agreement_1 |lm_eval/tasks/blimp/determiner_noun_agreement_1.yaml |multiple_choice | | |
| |blimp_determiner_noun_agreement_2 |lm_eval/tasks/blimp/determiner_noun_agreement_2.yaml |multiple_choice | | |
| |blimp_determiner_noun_agreement_irregular_1 |lm_eval/tasks/blimp/determiner_noun_agreement_irregular_1.yaml |multiple_choice | | |
| |blimp_determiner_noun_agreement_irregular_2 |lm_eval/tasks/blimp/determiner_noun_agreement_irregular_2.yaml |multiple_choice | | |
| |blimp_determiner_noun_agreement_with_adj_2 |lm_eval/tasks/blimp/determiner_noun_agreement_with_adj_2.yaml |multiple_choice | | |
| |blimp_determiner_noun_agreement_with_adj_irregular_1 |lm_eval/tasks/blimp/determiner_noun_agreement_with_adj_irregular_1.yaml |multiple_choice | | |
| |blimp_determiner_noun_agreement_with_adj_irregular_2 |lm_eval/tasks/blimp/determiner_noun_agreement_with_adj_irregular_2.yaml |multiple_choice | | |
| |blimp_determiner_noun_agreement_with_adjective_1 |lm_eval/tasks/blimp/determiner_noun_agreement_with_adjective_1.yaml |multiple_choice | | |
| |blimp_distractor_agreement_relational_noun |lm_eval/tasks/blimp/distractor_agreement_relational_noun.yaml |multiple_choice | | |
| |blimp_distractor_agreement_relative_clause |lm_eval/tasks/blimp/distractor_agreement_relative_clause.yaml |multiple_choice | | |
| |blimp_drop_argument |lm_eval/tasks/blimp/drop_argument.yaml |multiple_choice | | |
| |blimp_ellipsis_n_bar_1 |lm_eval/tasks/blimp/ellipsis_n_bar_1.yaml |multiple_choice | | |
| |blimp_ellipsis_n_bar_2 |lm_eval/tasks/blimp/ellipsis_n_bar_2.yaml |multiple_choice | | |
| |blimp_existential_there_object_raising |lm_eval/tasks/blimp/existential_there_object_raising.yaml |multiple_choice | | |
| |blimp_existential_there_quantifiers_1 |lm_eval/tasks/blimp/existential_there_quantifiers_1.yaml |multiple_choice | | |
| |blimp_existential_there_quantifiers_2 |lm_eval/tasks/blimp/existential_there_quantifiers_2.yaml |multiple_choice | | |
| |blimp_existential_there_subject_raising |lm_eval/tasks/blimp/existential_there_subject_raising.yaml |multiple_choice | | |
| |blimp_expletive_it_object_raising |lm_eval/tasks/blimp/expletive_it_object_raising.yaml |multiple_choice | | |
| |blimp_inchoative |lm_eval/tasks/blimp/inchoative.yaml |multiple_choice | | |
| |blimp_intransitive |lm_eval/tasks/blimp/intransitive.yaml |multiple_choice | | |
| |blimp_irregular_past_participle_adjectives |lm_eval/tasks/blimp/irregular_past_participle_adjectives.yaml |multiple_choice | | |
| |blimp_irregular_past_participle_verbs |lm_eval/tasks/blimp/irregular_past_participle_verbs.yaml |multiple_choice | | |
| |blimp_irregular_plural_subject_verb_agreement_1 |lm_eval/tasks/blimp/irregular_plural_subject_verb_agreement_1.yaml |multiple_choice | | |
| |blimp_irregular_plural_subject_verb_agreement_2 |lm_eval/tasks/blimp/irregular_plural_subject_verb_agreement_2.yaml |multiple_choice | | |
| |blimp_left_branch_island_echo_question |lm_eval/tasks/blimp/left_branch_island_echo_question.yaml |multiple_choice | | |
| |blimp_left_branch_island_simple_question |lm_eval/tasks/blimp/left_branch_island_simple_question.yaml |multiple_choice | | |
| |blimp_matrix_question_npi_licensor_present |lm_eval/tasks/blimp/matrix_question_npi_licensor_present.yaml |multiple_choice | | |
| |blimp_npi_present_1 |lm_eval/tasks/blimp/npi_present_1.yaml |multiple_choice | | |
| |blimp_npi_present_2 |lm_eval/tasks/blimp/npi_present_2.yaml |multiple_choice | | |
| |blimp_only_npi_licensor_present |lm_eval/tasks/blimp/only_npi_licensor_present.yaml |multiple_choice | | |
| |blimp_only_npi_scope |lm_eval/tasks/blimp/only_npi_scope.yaml |multiple_choice | | |
| |blimp_passive_1 |lm_eval/tasks/blimp/passive_1.yaml |multiple_choice | | |
| |blimp_passive_2 |lm_eval/tasks/blimp/passive_2.yaml |multiple_choice | | |
| |blimp_principle_A_c_command |lm_eval/tasks/blimp/principle_A_c_command.yaml |multiple_choice | | |
| |blimp_principle_A_case_1 |lm_eval/tasks/blimp/principle_A_case_1.yaml |multiple_choice | | |
| |blimp_principle_A_case_2 |lm_eval/tasks/blimp/principle_A_case_2.yaml |multiple_choice | | |
| |blimp_principle_A_domain_1 |lm_eval/tasks/blimp/principle_A_domain_1.yaml |multiple_choice | | |
| |blimp_principle_A_domain_2 |lm_eval/tasks/blimp/principle_A_domain_2.yaml |multiple_choice | | |
| |blimp_principle_A_domain_3 |lm_eval/tasks/blimp/principle_A_domain_3.yaml |multiple_choice | | |
| |blimp_principle_A_reconstruction |lm_eval/tasks/blimp/principle_A_reconstruction.yaml |multiple_choice | | |
| |blimp_regular_plural_subject_verb_agreement_1 |lm_eval/tasks/blimp/regular_plural_subject_verb_agreement_1.yaml |multiple_choice | | |
| |blimp_regular_plural_subject_verb_agreement_2 |lm_eval/tasks/blimp/regular_plural_subject_verb_agreement_2.yaml |multiple_choice | | |
| |blimp_sentential_negation_npi_licensor_present |lm_eval/tasks/blimp/sentential_negation_npi_licensor_present.yaml |multiple_choice | | |
| |blimp_sentential_negation_npi_scope |lm_eval/tasks/blimp/sentential_negation_npi_scope.yaml |multiple_choice | | |
| |blimp_sentential_subject_island |lm_eval/tasks/blimp/sentential_subject_island.yaml |multiple_choice | | |
| |blimp_superlative_quantifiers_1 |lm_eval/tasks/blimp/superlative_quantifiers_1.yaml |multiple_choice | | |
| |blimp_superlative_quantifiers_2 |lm_eval/tasks/blimp/superlative_quantifiers_2.yaml |multiple_choice | | |
| |blimp_tough_vs_raising_1 |lm_eval/tasks/blimp/tough_vs_raising_1.yaml |multiple_choice | | |
| |blimp_tough_vs_raising_2 |lm_eval/tasks/blimp/tough_vs_raising_2.yaml |multiple_choice | | |
| |blimp_transitive |lm_eval/tasks/blimp/transitive.yaml |multiple_choice | | |
| |blimp_wh_island |lm_eval/tasks/blimp/wh_island.yaml |multiple_choice | | |
| |blimp_wh_questions_object_gap |lm_eval/tasks/blimp/wh_questions_object_gap.yaml |multiple_choice | | |
| |blimp_wh_questions_subject_gap |lm_eval/tasks/blimp/wh_questions_subject_gap.yaml |multiple_choice | | |
| |blimp_wh_questions_subject_gap_long_distance |lm_eval/tasks/blimp/wh_questions_subject_gap_long_distance.yaml |multiple_choice | | |
| |blimp_wh_vs_that_no_gap |lm_eval/tasks/blimp/wh_vs_that_no_gap.yaml |multiple_choice | | |
| |blimp_wh_vs_that_no_gap_long_distance |lm_eval/tasks/blimp/wh_vs_that_no_gap_long_distance.yaml |multiple_choice | | |
| |blimp_wh_vs_that_with_gap |lm_eval/tasks/blimp/wh_vs_that_with_gap.yaml |multiple_choice | | |
| |blimp_wh_vs_that_with_gap_long_distance |lm_eval/tasks/blimp/wh_vs_that_with_gap_long_distance.yaml |multiple_choice | | |
| |boolq |lm_eval/tasks/super_glue/boolq/default.yaml |multiple_choice | | |
| |boolq-seq2seq |lm_eval/tasks/super_glue/boolq/seq2seq.yaml |generate_until | | |
| |c4 |lm_eval/tasks/c4/c4.yaml |loglikelihood_rolling| | |
| |cabreu_abstractive |lm_eval/tasks/catalan_bench/cabreu_abstractive.yaml |generate_until | | |
| |cabreu_extractive |lm_eval/tasks/catalan_bench/cabreu_extractive.yaml |generate_until | | |
| |cabreu_extreme |lm_eval/tasks/catalan_bench/cabreu_extreme.yaml |generate_until | | |
| |careqa_en |lm_eval/tasks/careqa/careqa_en.yaml |multiple_choice | | |
| |careqa_es |lm_eval/tasks/careqa/careqa_es.yaml |multiple_choice | | |
| |careqa_open |lm_eval/tasks/careqa/careqa_open.yaml |generate_until | | |
| |careqa_open_perplexity |lm_eval/tasks/careqa/careqa_open_perplexity.yaml |loglikelihood_rolling| | |
| |catalanqa |lm_eval/tasks/catalan_bench/catalanqa.yaml |generate_until | | |
| |catcola |lm_eval/tasks/catalan_bench/catcola.yaml |multiple_choice | | |
| |cb |lm_eval/tasks/super_glue/cb/default.yaml |multiple_choice | | |
| |ceval-valid_accountant |lm_eval/tasks/ceval/ceval-valid_accountant.yaml |multiple_choice | | |
| |ceval-valid_advanced_mathematics |lm_eval/tasks/ceval/ceval-valid_advanced_mathematics.yaml |multiple_choice | | |
| |ceval-valid_art_studies |lm_eval/tasks/ceval/ceval-valid_art_studies.yaml |multiple_choice | | |
| |ceval-valid_basic_medicine |lm_eval/tasks/ceval/ceval-valid_basic_medicine.yaml |multiple_choice | | |
| |ceval-valid_business_administration |lm_eval/tasks/ceval/ceval-valid_business_administration.yaml |multiple_choice | | |
| |ceval-valid_chinese_language_and_literature |lm_eval/tasks/ceval/ceval-valid_chinese_language_and_literature.yaml |multiple_choice | | |
| |ceval-valid_civil_servant |lm_eval/tasks/ceval/ceval-valid_civil_servant.yaml |multiple_choice | | |
| |ceval-valid_clinical_medicine |lm_eval/tasks/ceval/ceval-valid_clinical_medicine.yaml |multiple_choice | | |
| |ceval-valid_college_chemistry |lm_eval/tasks/ceval/ceval-valid_college_chemistry.yaml |multiple_choice | | |
| |ceval-valid_college_economics |lm_eval/tasks/ceval/ceval-valid_college_economics.yaml |multiple_choice | | |
| |ceval-valid_college_physics |lm_eval/tasks/ceval/ceval-valid_college_physics.yaml |multiple_choice | | |
| |ceval-valid_college_programming |lm_eval/tasks/ceval/ceval-valid_college_programming.yaml |multiple_choice | | |
| |ceval-valid_computer_architecture |lm_eval/tasks/ceval/ceval-valid_computer_architecture.yaml |multiple_choice | | |
| |ceval-valid_computer_network |lm_eval/tasks/ceval/ceval-valid_computer_network.yaml |multiple_choice | | |
| |ceval-valid_discrete_mathematics |lm_eval/tasks/ceval/ceval-valid_discrete_mathematics.yaml |multiple_choice | | |
| |ceval-valid_education_science |lm_eval/tasks/ceval/ceval-valid_education_science.yaml |multiple_choice | | |
| |ceval-valid_electrical_engineer |lm_eval/tasks/ceval/ceval-valid_electrical_engineer.yaml |multiple_choice | | |
| |ceval-valid_environmental_impact_assessment_engineer |lm_eval/tasks/ceval/ceval-valid_environmental_impact_assessment_engineer.yaml |multiple_choice | | |
| |ceval-valid_fire_engineer |lm_eval/tasks/ceval/ceval-valid_fire_engineer.yaml |multiple_choice | | |
| |ceval-valid_high_school_biology |lm_eval/tasks/ceval/ceval-valid_high_school_biology.yaml |multiple_choice | | |
| |ceval-valid_high_school_chemistry |lm_eval/tasks/ceval/ceval-valid_high_school_chemistry.yaml |multiple_choice | | |
| |ceval-valid_high_school_chinese |lm_eval/tasks/ceval/ceval-valid_high_school_chinese.yaml |multiple_choice | | |
| |ceval-valid_high_school_geography |lm_eval/tasks/ceval/ceval-valid_high_school_geography.yaml |multiple_choice | | |
| |ceval-valid_high_school_history |lm_eval/tasks/ceval/ceval-valid_high_school_history.yaml |multiple_choice | | |
| |ceval-valid_high_school_mathematics |lm_eval/tasks/ceval/ceval-valid_high_school_mathematics.yaml |multiple_choice | | |
| |ceval-valid_high_school_physics |lm_eval/tasks/ceval/ceval-valid_high_school_physics.yaml |multiple_choice | | |
| |ceval-valid_high_school_politics |lm_eval/tasks/ceval/ceval-valid_high_school_politics.yaml |multiple_choice | | |
| |ceval-valid_ideological_and_moral_cultivation |lm_eval/tasks/ceval/ceval-valid_ideological_and_moral_cultivation.yaml |multiple_choice | | |
| |ceval-valid_law |lm_eval/tasks/ceval/ceval-valid_law.yaml |multiple_choice | | |
| |ceval-valid_legal_professional |lm_eval/tasks/ceval/ceval-valid_legal_professional.yaml |multiple_choice | | |
| |ceval-valid_logic |lm_eval/tasks/ceval/ceval-valid_logic.yaml |multiple_choice | | |
| |ceval-valid_mao_zedong_thought |lm_eval/tasks/ceval/ceval-valid_mao_zedong_thought.yaml |multiple_choice | | |
| |ceval-valid_marxism |lm_eval/tasks/ceval/ceval-valid_marxism.yaml |multiple_choice | | |
| |ceval-valid_metrology_engineer |lm_eval/tasks/ceval/ceval-valid_metrology_engineer.yaml |multiple_choice | | |
| |ceval-valid_middle_school_biology |lm_eval/tasks/ceval/ceval-valid_middle_school_biology.yaml |multiple_choice | | |
| |ceval-valid_middle_school_chemistry |lm_eval/tasks/ceval/ceval-valid_middle_school_chemistry.yaml |multiple_choice | | |
| |ceval-valid_middle_school_geography |lm_eval/tasks/ceval/ceval-valid_middle_school_geography.yaml |multiple_choice | | |
| |ceval-valid_middle_school_history |lm_eval/tasks/ceval/ceval-valid_middle_school_history.yaml |multiple_choice | | |
| |ceval-valid_middle_school_mathematics |lm_eval/tasks/ceval/ceval-valid_middle_school_mathematics.yaml |multiple_choice | | |
| |ceval-valid_middle_school_physics |lm_eval/tasks/ceval/ceval-valid_middle_school_physics.yaml |multiple_choice | | |
| |ceval-valid_middle_school_politics |lm_eval/tasks/ceval/ceval-valid_middle_school_politics.yaml |multiple_choice | | |
| |ceval-valid_modern_chinese_history |lm_eval/tasks/ceval/ceval-valid_modern_chinese_history.yaml |multiple_choice | | |
| |ceval-valid_operating_system |lm_eval/tasks/ceval/ceval-valid_operating_system.yaml |multiple_choice | | |
| |ceval-valid_physician |lm_eval/tasks/ceval/ceval-valid_physician.yaml |multiple_choice | | |
| |ceval-valid_plant_protection |lm_eval/tasks/ceval/ceval-valid_plant_protection.yaml |multiple_choice | | |
| |ceval-valid_probability_and_statistics |lm_eval/tasks/ceval/ceval-valid_probability_and_statistics.yaml |multiple_choice | | |
| |ceval-valid_professional_tour_guide |lm_eval/tasks/ceval/ceval-valid_professional_tour_guide.yaml |multiple_choice | | |
| |ceval-valid_sports_science |lm_eval/tasks/ceval/ceval-valid_sports_science.yaml |multiple_choice | | |
| |ceval-valid_tax_accountant |lm_eval/tasks/ceval/ceval-valid_tax_accountant.yaml |multiple_choice | | |
| |ceval-valid_teacher_qualification |lm_eval/tasks/ceval/ceval-valid_teacher_qualification.yaml |multiple_choice | | |
| |ceval-valid_urban_and_rural_planner |lm_eval/tasks/ceval/ceval-valid_urban_and_rural_planner.yaml |multiple_choice | | |
| |ceval-valid_veterinary_medicine |lm_eval/tasks/ceval/ceval-valid_veterinary_medicine.yaml |multiple_choice | | |
| |chartqa |lm_eval/tasks/chartqa/chartqa.yaml |generate_until | | |
| |chartqa_llama |lm_eval/tasks/chartqa/chartqa_llama.yaml |generate_until | | |
| |chartqa_llama_90 |lm_eval/tasks/chartqa/chartqa_llama_90.yaml |generate_until | | |
| |claim_stance_topic |lm_eval/tasks/unitxt/claim_stance_topic.yaml | | | |
| |cmmlu_agronomy |lm_eval/tasks/cmmlu/cmmlu_agronomy.yaml |multiple_choice | | |
| |cmmlu_anatomy |lm_eval/tasks/cmmlu/cmmlu_default_anatomy.yaml |multiple_choice | | |
| |cmmlu_ancient_chinese |lm_eval/tasks/cmmlu/cmmlu_default_ancient_chinese.yaml |multiple_choice | | |
| |cmmlu_arts |lm_eval/tasks/cmmlu/cmmlu_default_arts.yaml |multiple_choice | | |
| |cmmlu_astronomy |lm_eval/tasks/cmmlu/cmmlu_default_astronomy.yaml |multiple_choice | | |
| |cmmlu_business_ethics |lm_eval/tasks/cmmlu/cmmlu_default_business_ethics.yaml |multiple_choice | | |
| |cmmlu_chinese_civil_service_exam |lm_eval/tasks/cmmlu/cmmlu_default_chinese_civil_service_exam.yaml |multiple_choice | | |
| |cmmlu_chinese_driving_rule |lm_eval/tasks/cmmlu/cmmlu_default_chinese_driving_rule.yaml |multiple_choice | | |
| |cmmlu_chinese_food_culture |lm_eval/tasks/cmmlu/cmmlu_chinese_food_culture.yaml |multiple_choice | | |
| |cmmlu_chinese_foreign_policy |lm_eval/tasks/cmmlu/cmmlu_chinese_foreign_policy.yaml |multiple_choice | | |
| |cmmlu_chinese_history |lm_eval/tasks/cmmlu/cmmlu_chinese_history.yaml |multiple_choice | | |
| |cmmlu_chinese_literature |lm_eval/tasks/cmmlu/cmmlu_chinese_literature.yaml |multiple_choice | | |
| |cmmlu_chinese_teacher_qualification |lm_eval/tasks/cmmlu/cmmlu_default_chinese_teacher_qualification.yaml |multiple_choice | | |
| |cmmlu_clinical_knowledge |lm_eval/tasks/cmmlu/cmmlu_default_clinical_knowledge.yaml |multiple_choice | | |
| |cmmlu_college_actuarial_science |lm_eval/tasks/cmmlu/cmmlu_default_college_actuarial_science.yaml |multiple_choice | | |
| |cmmlu_college_education |lm_eval/tasks/cmmlu/cmmlu_default_college_education.yaml |multiple_choice | | |
| |cmmlu_college_engineering_hydrology |lm_eval/tasks/cmmlu/cmmlu_default_college_engineering_hydrology.yaml |multiple_choice | | |
| |cmmlu_college_law |lm_eval/tasks/cmmlu/cmmlu_college_law.yaml |multiple_choice | | |
| |cmmlu_college_mathematics |lm_eval/tasks/cmmlu/cmmlu_college_mathematics.yaml |multiple_choice | | |
| |cmmlu_college_medical_statistics |lm_eval/tasks/cmmlu/cmmlu_college_medical_statistics.yaml |multiple_choice | | |
| |cmmlu_college_medicine |lm_eval/tasks/cmmlu/cmmlu_default_college_medicine.yaml |multiple_choice | | |
| |cmmlu_computer_science |lm_eval/tasks/cmmlu/cmmlu_default_computer_science.yaml |multiple_choice | | |
| |cmmlu_computer_security |lm_eval/tasks/cmmlu/cmmlu_default_computer_security.yaml |multiple_choice | | |
| |cmmlu_conceptual_physics |lm_eval/tasks/cmmlu/cmmlu_default_conceptual_physics.yaml |multiple_choice | | |
| |cmmlu_construction_project_management |lm_eval/tasks/cmmlu/cmmlu_construction_project_management.yaml |multiple_choice | | |
| |cmmlu_economics |lm_eval/tasks/cmmlu/cmmlu_economics.yaml |multiple_choice | | |
| |cmmlu_education |lm_eval/tasks/cmmlu/cmmlu_education.yaml |multiple_choice | | |
| |cmmlu_electrical_engineering |lm_eval/tasks/cmmlu/cmmlu_electrical_engineering.yaml |multiple_choice | | |
| |cmmlu_elementary_chinese |lm_eval/tasks/cmmlu/cmmlu_default_elementary_chinese.yaml |multiple_choice | | |
| |cmmlu_elementary_commonsense |lm_eval/tasks/cmmlu/cmmlu_default_elementary_commonsense.yaml |multiple_choice | | |
| |cmmlu_elementary_information_and_technology |lm_eval/tasks/cmmlu/cmmlu_elementary_information_and_technology.yaml |multiple_choice | | |
| |cmmlu_elementary_mathematics |lm_eval/tasks/cmmlu/cmmlu_elementary_mathematics.yaml |multiple_choice | | |
| |cmmlu_ethnology |lm_eval/tasks/cmmlu/cmmlu_ethnology.yaml |multiple_choice | | |
| |cmmlu_food_science |lm_eval/tasks/cmmlu/cmmlu_default_food_science.yaml |multiple_choice | | |
| |cmmlu_genetics |lm_eval/tasks/cmmlu/cmmlu_default_genetics.yaml |multiple_choice | | |
| |cmmlu_global_facts |lm_eval/tasks/cmmlu/cmmlu_default_global_facts.yaml |multiple_choice | | |
| |cmmlu_high_school_biology |lm_eval/tasks/cmmlu/cmmlu_default_high_school_biology.yaml |multiple_choice | | |
| |cmmlu_high_school_chemistry |lm_eval/tasks/cmmlu/cmmlu_high_school_chemistry.yaml |multiple_choice | | |
| |cmmlu_high_school_geography |lm_eval/tasks/cmmlu/cmmlu_default_high_school_geography.yaml |multiple_choice | | |
| |cmmlu_high_school_mathematics |lm_eval/tasks/cmmlu/cmmlu_default_high_school_mathematics.yaml |multiple_choice | | |
| |cmmlu_high_school_physics |lm_eval/tasks/cmmlu/cmmlu_default_high_school_physics.yaml |multiple_choice | | |
| |cmmlu_high_school_politics |lm_eval/tasks/cmmlu/cmmlu_default_high_school_politics.yaml |multiple_choice | | |
| |cmmlu_human_sexuality |lm_eval/tasks/cmmlu/cmmlu_default_human_sexuality.yaml |multiple_choice | | |
| |cmmlu_international_law |lm_eval/tasks/cmmlu/cmmlu_default_international_law.yaml |multiple_choice | | |
| |cmmlu_journalism |lm_eval/tasks/cmmlu/cmmlu_journalism.yaml |multiple_choice | | |
| |cmmlu_jurisprudence |lm_eval/tasks/cmmlu/cmmlu_jurisprudence.yaml |multiple_choice | | |
| |cmmlu_legal_and_moral_basis |lm_eval/tasks/cmmlu/cmmlu_legal_and_moral_basis.yaml |multiple_choice | | |
| |cmmlu_logical |lm_eval/tasks/cmmlu/cmmlu_logical.yaml |multiple_choice | | |
| |cmmlu_machine_learning |lm_eval/tasks/cmmlu/cmmlu_machine_learning.yaml |multiple_choice | | |
| |cmmlu_management |lm_eval/tasks/cmmlu/cmmlu_management.yaml |multiple_choice | | |
| |cmmlu_marketing |lm_eval/tasks/cmmlu/cmmlu_default_marketing.yaml |multiple_choice | | |
| |cmmlu_marxist_theory |lm_eval/tasks/cmmlu/cmmlu_marxist_theory.yaml |multiple_choice | | |
| |cmmlu_modern_chinese |lm_eval/tasks/cmmlu/cmmlu_default_modern_chinese.yaml |multiple_choice | | |
| |cmmlu_nutrition |lm_eval/tasks/cmmlu/cmmlu_default_nutrition.yaml |multiple_choice | | |
| |cmmlu_philosophy |lm_eval/tasks/cmmlu/cmmlu_philosophy.yaml |multiple_choice | | |
| |cmmlu_professional_accounting |lm_eval/tasks/cmmlu/cmmlu_default_professional_accounting.yaml |multiple_choice | | |
| |cmmlu_professional_law |lm_eval/tasks/cmmlu/cmmlu_default_professional_law.yaml |multiple_choice | | |
| |cmmlu_professional_medicine |lm_eval/tasks/cmmlu/cmmlu_professional_medicine.yaml |multiple_choice | | |
| |cmmlu_professional_psychology |lm_eval/tasks/cmmlu/cmmlu_professional_psychology.yaml |multiple_choice | | |
| |cmmlu_public_relations |lm_eval/tasks/cmmlu/cmmlu_public_relations.yaml |multiple_choice | | |
| |cmmlu_security_study |lm_eval/tasks/cmmlu/cmmlu_default_security_study.yaml |multiple_choice | | |
| |cmmlu_sociology |lm_eval/tasks/cmmlu/cmmlu_sociology.yaml |multiple_choice | | |
| |cmmlu_sports_science |lm_eval/tasks/cmmlu/cmmlu_sports_science.yaml |multiple_choice | | |
| |cmmlu_traditional_chinese_medicine |lm_eval/tasks/cmmlu/cmmlu_traditional_chinese_medicine.yaml |multiple_choice | | |
| |cmmlu_virology |lm_eval/tasks/cmmlu/cmmlu_default_virology.yaml |multiple_choice | | |
| |cmmlu_world_history |lm_eval/tasks/cmmlu/cmmlu_world_history.yaml |multiple_choice | | |
| |cmmlu_world_religions |lm_eval/tasks/cmmlu/cmmlu_world_religions.yaml |multiple_choice | | |
| |cnn_dailymail |lm_eval/tasks/unitxt/cnn_dailymail.yaml | | | |
| |cocoteros_es |lm_eval/tasks/spanish_bench/cocoteros_es.yaml |generate_until | | |
| |cocoteros_va |lm_eval/tasks/catalan_bench/cocoteros_va.yaml |generate_until | | |
| |code2text_go |lm_eval/tasks/code_x_glue/code-text/go.yaml |generate_until | | |
| |code2text_java |lm_eval/tasks/code_x_glue/code-text/java.yaml |generate_until | | |
| |code2text_javascript |lm_eval/tasks/code_x_glue/code-text/javascript.yaml |generate_until | | |
| |code2text_php |lm_eval/tasks/code_x_glue/code-text/php.yaml |generate_until | | |
| |code2text_python |lm_eval/tasks/code_x_glue/code-text/python.yaml |generate_until | | |
| |code2text_ruby |lm_eval/tasks/code_x_glue/code-text/ruby.yaml |generate_until | | |
| |coedit_gec |lm_eval/tasks/unitxt/coedit_gec.yaml | | | |
| |cola |lm_eval/tasks/glue/cola/default.yaml |multiple_choice | | |
| |common_voice_en |lm_eval/tasks/common_voice/common_voice_en.yaml |generate_until | | |
| |commonsense_qa |lm_eval/tasks/commonsense_qa/default.yaml |multiple_choice | | |
| |copa |lm_eval/tasks/super_glue/copa/default.yaml |multiple_choice | | |
| |copa_ar |lm_eval/tasks/alghafa/copa_ar/copa_ar.yaml |multiple_choice | | |
| |copa_ca |lm_eval/tasks/catalan_bench/copa_ca.yaml |multiple_choice | | |
| |copa_es |lm_eval/tasks/spanish_bench/copa_es.yaml |multiple_choice | | |
| |copal_id_colloquial |lm_eval/tasks/copal_id/colloquial.yaml |multiple_choice | | |
| |copal_id_standard |lm_eval/tasks/copal_id/standard.yaml |multiple_choice | | |
| |coqa |lm_eval/tasks/coqa/default.yaml |generate_until | | |
| |coqcat |lm_eval/tasks/catalan_bench/coqcat.yaml |generate_until | | |
| |crows_pairs_english |lm_eval/tasks/crows_pairs/crows_pairs_english.yaml |multiple_choice | | |
| |crows_pairs_english_age |lm_eval/tasks/crows_pairs/crows_pairs_english_age.yaml |multiple_choice | | |
| |crows_pairs_english_autre |lm_eval/tasks/crows_pairs/crows_pairs_english_autre.yaml |multiple_choice | | |
| |crows_pairs_english_disability |lm_eval/tasks/crows_pairs/crows_pairs_english_disability.yaml |multiple_choice | | |
| |crows_pairs_english_gender |lm_eval/tasks/crows_pairs/crows_pairs_english_gender.yaml |multiple_choice | | |
| |crows_pairs_english_nationality |lm_eval/tasks/crows_pairs/crows_pairs_english_nationality.yaml |multiple_choice | | |
| |crows_pairs_english_physical_appearance |lm_eval/tasks/crows_pairs/crows_pairs_english_physical_appearance.yaml |multiple_choice | | |
| |crows_pairs_english_race_color |lm_eval/tasks/crows_pairs/crows_pairs_english_race_color.yaml |multiple_choice | | |
| |crows_pairs_english_religion |lm_eval/tasks/crows_pairs/crows_pairs_english_religion.yaml |multiple_choice | | |
| |crows_pairs_english_sexual_orientation |lm_eval/tasks/crows_pairs/crows_pairs_english_sexual_orientation.yaml |multiple_choice | | |
| |crows_pairs_english_socioeconomic |lm_eval/tasks/crows_pairs/crows_pairs_english_socioeconomic.yaml |multiple_choice | | |
| |crows_pairs_french |lm_eval/tasks/crows_pairs/crows_pairs_french.yaml |multiple_choice | | |
| |crows_pairs_french_age |lm_eval/tasks/crows_pairs/crows_pairs_french_age.yaml |multiple_choice | | |
| |crows_pairs_french_autre |lm_eval/tasks/crows_pairs/crows_pairs_french_autre.yaml |multiple_choice | | |
| |crows_pairs_french_disability |lm_eval/tasks/crows_pairs/crows_pairs_french_disability.yaml |multiple_choice | | |
| |crows_pairs_french_gender |lm_eval/tasks/crows_pairs/crows_pairs_french_gender.yaml |multiple_choice | | |
| |crows_pairs_french_nationality |lm_eval/tasks/crows_pairs/crows_pairs_french_nationality.yaml |multiple_choice | | |
| |crows_pairs_french_physical_appearance |lm_eval/tasks/crows_pairs/crows_pairs_french_physical_appearance.yaml |multiple_choice | | |
| |crows_pairs_french_race_color |lm_eval/tasks/crows_pairs/crows_pairs_french_race_color.yaml |multiple_choice | | |
| |crows_pairs_french_religion |lm_eval/tasks/crows_pairs/crows_pairs_french_religion.yaml |multiple_choice | | |
| |crows_pairs_french_sexual_orientation |lm_eval/tasks/crows_pairs/crows_pairs_french_sexual_orientation.yaml |multiple_choice | | |
| |crows_pairs_french_socioeconomic |lm_eval/tasks/crows_pairs/crows_pairs_french_socioeconomic.yaml |multiple_choice | | |
| |csatqa_gr |lm_eval/tasks/csatqa/csatqa_gr.yaml |multiple_choice | | |
| |csatqa_li |lm_eval/tasks/csatqa/csatqa_li.yaml |multiple_choice | | |
| |csatqa_rch |lm_eval/tasks/csatqa/csatqa_rch.yaml |multiple_choice | | |
| |csatqa_rcs |lm_eval/tasks/csatqa/csatqa_rcs.yaml |multiple_choice | | |
| |csatqa_rcss |lm_eval/tasks/csatqa/csatqa_rcss.yaml |multiple_choice | | |
| |csatqa_wr |lm_eval/tasks/csatqa/csatqa_wr.yaml |multiple_choice | | |
| |cycle_letters |lm_eval/tasks/unscramble/cycle_letters.yaml |generate_until | | |
| |darija_sentiment_electrom |lm_eval/tasks/darija_bench/darija_sentiment/darija_sentiment_electrom.yaml |multiple_choice | | |
| |darija_sentiment_mac |lm_eval/tasks/darija_bench/darija_sentiment/darija_sentiment_mac.yaml |multiple_choice | | |
| |darija_sentiment_msac |lm_eval/tasks/darija_bench/darija_sentiment/darija_sentiment_msac.yaml |multiple_choice | | |
| |darija_sentiment_msda |lm_eval/tasks/darija_bench/darija_sentiment/darija_sentiment_msda.yaml |multiple_choice | | |
| |darija_sentiment_myc |lm_eval/tasks/darija_bench/darija_sentiment/darija_sentiment_myc.yaml |multiple_choice | | |
| |darija_summarization_task |lm_eval/tasks/darija_bench/darija_summarization/summarization.yaml |generate_until | | |
| |darijahellaswag |lm_eval/tasks/darijahellaswag/darijahellaswag.yaml |multiple_choice | | |
| |darijammlu_accounting |lm_eval/tasks/darijammlu/darijammlu_accounting.yaml |multiple_choice | | |
| |darijammlu_arabic_language |lm_eval/tasks/darijammlu/darijammlu_arabic_language.yaml |multiple_choice | | |
| |darijammlu_arabic_language_(general) |lm_eval/tasks/darijammlu/darijammlu_arabic_language_(general).yaml |multiple_choice | | |
| |darijammlu_arabic_language_(grammar) |lm_eval/tasks/darijammlu/darijammlu_arabic_language_(grammar).yaml |multiple_choice | | |
| |darijammlu_biology |lm_eval/tasks/darijammlu/darijammlu_biology.yaml |multiple_choice | | |
| |darijammlu_civics |lm_eval/tasks/darijammlu/darijammlu_civics.yaml |multiple_choice | | |
| |darijammlu_computer_science |lm_eval/tasks/darijammlu/darijammlu_computer_science.yaml |multiple_choice | | |
| |darijammlu_driving_test |lm_eval/tasks/darijammlu/darijammlu_driving_test.yaml |multiple_choice | | |
| |darijammlu_economics |lm_eval/tasks/darijammlu/darijammlu_economics.yaml |multiple_choice | | |
| |darijammlu_general_knowledge |lm_eval/tasks/darijammlu/darijammlu_general_knowledge.yaml |multiple_choice | | |
| |darijammlu_geography |lm_eval/tasks/darijammlu/darijammlu_geography.yaml |multiple_choice | | |
| |darijammlu_global_facts |lm_eval/tasks/darijammlu/darijammlu_global_facts.yaml |multiple_choice | | |
| |darijammlu_high_school_european_history |lm_eval/tasks/darijammlu/darijammlu_high_school_european_history.yaml |multiple_choice | | |
| |darijammlu_high_school_geography |lm_eval/tasks/darijammlu/darijammlu_high_school_geography.yaml |multiple_choice | | |
| |darijammlu_high_school_government_and_politics |lm_eval/tasks/darijammlu/darijammlu_high_school_government_and_politics.yaml |multiple_choice | | |
| |darijammlu_high_school_psychology |lm_eval/tasks/darijammlu/darijammlu_high_school_psychology.yaml |multiple_choice | | |
| |darijammlu_high_school_statistics |lm_eval/tasks/darijammlu/darijammlu_high_school_statistics.yaml |multiple_choice | | |
| |darijammlu_high_school_world_history |lm_eval/tasks/darijammlu/darijammlu_high_school_world_history.yaml |multiple_choice | | |
| |darijammlu_history |lm_eval/tasks/darijammlu/darijammlu_history.yaml |multiple_choice | | |
| |darijammlu_human_aging |lm_eval/tasks/darijammlu/darijammlu_human_aging.yaml |multiple_choice | | |
| |darijammlu_international_law |lm_eval/tasks/darijammlu/darijammlu_international_law.yaml |multiple_choice | | |
| |darijammlu_islamic_studies |lm_eval/tasks/darijammlu/darijammlu_islamic_studies.yaml |multiple_choice | | |
| |darijammlu_jurisprudence |lm_eval/tasks/darijammlu/darijammlu_jurisprudence.yaml |multiple_choice | | |
| |darijammlu_law |lm_eval/tasks/darijammlu/darijammlu_law.yaml |multiple_choice | | |
| |darijammlu_logical_fallacies |lm_eval/tasks/darijammlu/darijammlu_logical_fallacies.yaml |multiple_choice | | |
| |darijammlu_management |lm_eval/tasks/darijammlu/darijammlu_management.yaml |multiple_choice | | |
| |darijammlu_management_ar |lm_eval/tasks/darijammlu/darijammlu_management_ar.yaml |multiple_choice | | |
| |darijammlu_marketing |lm_eval/tasks/darijammlu/darijammlu_marketing.yaml |multiple_choice | | |
| |darijammlu_math |lm_eval/tasks/darijammlu/darijammlu_math.yaml |multiple_choice | | |
| |darijammlu_moral_disputes |lm_eval/tasks/darijammlu/darijammlu_moral_disputes.yaml |multiple_choice | | |
| |darijammlu_moral_scenarios |lm_eval/tasks/darijammlu/darijammlu_moral_scenarios.yaml |multiple_choice | | |
| |darijammlu_natural_science |lm_eval/tasks/darijammlu/darijammlu_natural_science.yaml |multiple_choice | | |
| |darijammlu_nutrition |lm_eval/tasks/darijammlu/darijammlu_nutrition.yaml |multiple_choice | | |
| |darijammlu_philosophy |lm_eval/tasks/darijammlu/darijammlu_philosophy.yaml |multiple_choice | | |
| |darijammlu_philosophy_ar |lm_eval/tasks/darijammlu/darijammlu_philosophy_ar.yaml |multiple_choice | | |
| |darijammlu_physics |lm_eval/tasks/darijammlu/darijammlu_physics.yaml |multiple_choice | | |
| |darijammlu_political_science |lm_eval/tasks/darijammlu/darijammlu_political_science.yaml |multiple_choice | | |
| |darijammlu_professional_law |lm_eval/tasks/darijammlu/darijammlu_professional_law.yaml |multiple_choice | | |
| |darijammlu_professional_psychology |lm_eval/tasks/darijammlu/darijammlu_professional_psychology.yaml |multiple_choice | | |
| |darijammlu_public_relations |lm_eval/tasks/darijammlu/darijammlu_public_relations.yaml |multiple_choice | | |
| |darijammlu_security_studies |lm_eval/tasks/darijammlu/darijammlu_security_studies.yaml |multiple_choice | | |
| |darijammlu_social_science |lm_eval/tasks/darijammlu/darijammlu_social_science.yaml |multiple_choice | | |
| |darijammlu_sociology |lm_eval/tasks/darijammlu/darijammlu_sociology.yaml |multiple_choice | | |
| |darijammlu_world_religions |lm_eval/tasks/darijammlu/darijammlu_world_religions.yaml |multiple_choice | | |
| |dbpedia_14 |lm_eval/tasks/unitxt/dbpedia_14.yaml | | | |
| |doc_vqa |lm_eval/tasks/unitxt/doc_vqa.yaml | | | |
| |drop |lm_eval/tasks/drop/default.yaml |generate_until | | |
| |epec_koref_bin |lm_eval/tasks/basqueglue/coref.yaml |multiple_choice | | |
| |eq_bench |lm_eval/tasks/eq_bench/default.yaml |generate_until | | |
| |escola |lm_eval/tasks/spanish_bench/escola.yaml |multiple_choice | | |
| |ethics_cm |lm_eval/tasks/hendrycks_ethics/commonsense.yaml |multiple_choice | | |
| |ethics_deontology |lm_eval/tasks/hendrycks_ethics/deontology.yaml |multiple_choice | | |
| |ethics_justice |lm_eval/tasks/hendrycks_ethics/justice.yaml |multiple_choice | | |
| |ethics_utilitarianism |lm_eval/tasks/hendrycks_ethics/utilitarianism.yaml |multiple_choice | | |
| |ethics_virtue |lm_eval/tasks/hendrycks_ethics/virtue.yaml |multiple_choice | | |
| |ethos_binary |lm_eval/tasks/unitxt/ethos_binary.yaml | | | |
| |eus_exams_es_ejadministrativo |lm_eval/tasks/eus_exams/eus_exams_es_ejadministrativo.yaml |multiple_choice | | |
| |eus_exams_es_ejauxiliar |lm_eval/tasks/eus_exams/eus_exams_es_ejauxiliar.yaml |multiple_choice | | |
| |eus_exams_es_ejsubalterno |lm_eval/tasks/eus_exams/eus_exams_es_ejsubalterno.yaml |multiple_choice | | |
| |eus_exams_es_ejtecnico |lm_eval/tasks/eus_exams/eus_exams_es_ejtecnico.yaml |multiple_choice | | |
| |eus_exams_es_opeayuntamientovitoria |lm_eval/tasks/eus_exams/eus_exams_es_opeayuntamientovitoria.yaml |multiple_choice | | |
| |eus_exams_es_opebilbao |lm_eval/tasks/eus_exams/eus_exams_es_opebilbao.yaml |multiple_choice | | |
| |eus_exams_es_opeehuadmin |lm_eval/tasks/eus_exams/eus_exams_es_opeehuadmin.yaml |multiple_choice | | |
| |eus_exams_es_opeehuaux |lm_eval/tasks/eus_exams/eus_exams_es_opeehuaux.yaml |multiple_choice | | |
| |eus_exams_es_opeehubiblio |lm_eval/tasks/eus_exams/eus_exams_es_opeehubiblio.yaml |multiple_choice | | |
| |eus_exams_es_opeehuderecho |lm_eval/tasks/eus_exams/eus_exams_es_opeehuderecho.yaml |multiple_choice | | |
| |eus_exams_es_opeehueconomicas |lm_eval/tasks/eus_exams/eus_exams_es_opeehueconomicas.yaml |multiple_choice | | |
| |eus_exams_es_opeehuempresariales |lm_eval/tasks/eus_exams/eus_exams_es_opeehuempresariales.yaml |multiple_choice | | |
| |eus_exams_es_opeehusubalterno |lm_eval/tasks/eus_exams/eus_exams_es_opeehusubalterno.yaml |multiple_choice | | |
| |eus_exams_es_opeehutecnico |lm_eval/tasks/eus_exams/eus_exams_es_opeehutecnico.yaml |multiple_choice | | |
| |eus_exams_es_opeehutecnicob |lm_eval/tasks/eus_exams/eus_exams_es_opeehutecnicob.yaml |multiple_choice | | |
| |eus_exams_es_opeosakiadmin |lm_eval/tasks/eus_exams/eus_exams_es_opeosakiadmin.yaml |multiple_choice | | |
| |eus_exams_es_opeosakiaux |lm_eval/tasks/eus_exams/eus_exams_es_opeosakiaux.yaml |multiple_choice | | |
| |eus_exams_es_opeosakiauxenf |lm_eval/tasks/eus_exams/eus_exams_es_opeosakiauxenf.yaml |multiple_choice | | |
| |eus_exams_es_opeosakicelador |lm_eval/tasks/eus_exams/eus_exams_es_opeosakicelador.yaml |multiple_choice | | |
| |eus_exams_es_opeosakienf |lm_eval/tasks/eus_exams/eus_exams_es_opeosakienf.yaml |multiple_choice | | |
| |eus_exams_es_opeosakijuridico |lm_eval/tasks/eus_exams/eus_exams_es_opeosakijuridico.yaml |multiple_choice | | |
| |eus_exams_es_opeosakioperario |lm_eval/tasks/eus_exams/eus_exams_es_opeosakioperario.yaml |multiple_choice | | |
| |eus_exams_es_opeosakitecnico |lm_eval/tasks/eus_exams/eus_exams_es_opeosakitecnico.yaml |multiple_choice | | |
| |eus_exams_es_opeosakivarios |lm_eval/tasks/eus_exams/eus_exams_es_opeosakivarios.yaml |multiple_choice | | |
| |eus_exams_es_osakidetza1c |lm_eval/tasks/eus_exams/eus_exams_es_osakidetza1c.yaml |multiple_choice | | |
| |eus_exams_es_osakidetza2c |lm_eval/tasks/eus_exams/eus_exams_es_osakidetza2c.yaml |multiple_choice | | |
| |eus_exams_es_osakidetza3c |lm_eval/tasks/eus_exams/eus_exams_es_osakidetza3c.yaml |multiple_choice | | |
| |eus_exams_es_osakidetza4c |lm_eval/tasks/eus_exams/eus_exams_es_osakidetza4c.yaml |multiple_choice | | |
| |eus_exams_es_osakidetza5c |lm_eval/tasks/eus_exams/eus_exams_es_osakidetza5c.yaml |multiple_choice | | |
| |eus_exams_es_osakidetza6c |lm_eval/tasks/eus_exams/eus_exams_es_osakidetza6c.yaml |multiple_choice | | |
| |eus_exams_es_osakidetza7c |lm_eval/tasks/eus_exams/eus_exams_es_osakidetza7c.yaml |multiple_choice | | |
| |eus_exams_es_osakidetza8c |lm_eval/tasks/eus_exams/eus_exams_es_osakidetza8c.yaml |multiple_choice | | |
| |eus_exams_es_osakidetza9c |lm_eval/tasks/eus_exams/eus_exams_es_osakidetza9c.yaml |multiple_choice | | |
| |eus_exams_eu_ejadministrari |lm_eval/tasks/eus_exams/eus_exams_eu_ejadministrari.yaml |multiple_choice | | |
| |eus_exams_eu_ejlaguntza |lm_eval/tasks/eus_exams/eus_exams_eu_ejlaguntza.yaml |multiple_choice | | |
| |eus_exams_eu_ejlaguntzaile |lm_eval/tasks/eus_exams/eus_exams_eu_ejlaguntzaile.yaml |multiple_choice | | |
| |eus_exams_eu_ejteknikari |lm_eval/tasks/eus_exams/eus_exams_eu_ejteknikari.yaml |multiple_choice | | |
| |eus_exams_eu_opebilbaoeu |lm_eval/tasks/eus_exams/eus_exams_eu_opebilbaoeu.yaml |multiple_choice | | |
| |eus_exams_eu_opeehuadmineu |lm_eval/tasks/eus_exams/eus_exams_eu_opeehuadmineu.yaml |multiple_choice | | |
| |eus_exams_eu_opeehuauxeu |lm_eval/tasks/eus_exams/eus_exams_eu_opeehuauxeu.yaml |multiple_choice | | |
| |eus_exams_eu_opeehubiblioeu |lm_eval/tasks/eus_exams/eus_exams_eu_opeehubiblioeu.yaml |multiple_choice | | |
| |eus_exams_eu_opeehuderechoeu |lm_eval/tasks/eus_exams/eus_exams_eu_opeehuderechoeu.yaml |multiple_choice | | |
| |eus_exams_eu_opeehueconomicaseu |lm_eval/tasks/eus_exams/eus_exams_eu_opeehueconomicaseu.yaml |multiple_choice | | |
| |eus_exams_eu_opeehuempresarialeseu |lm_eval/tasks/eus_exams/eus_exams_eu_opeehuempresarialeseu.yaml |multiple_choice | | |
| |eus_exams_eu_opeehusubalternoeu |lm_eval/tasks/eus_exams/eus_exams_eu_opeehusubalternoeu.yaml |multiple_choice | | |
| |eus_exams_eu_opeehutecnicoeu |lm_eval/tasks/eus_exams/eus_exams_eu_opeehutecnicoeu.yaml |multiple_choice | | |
| |eus_exams_eu_opeehuteknikarib |lm_eval/tasks/eus_exams/eus_exams_eu_opeehuteknikarib.yaml |multiple_choice | | |
| |eus_exams_eu_opegasteizkoudala |lm_eval/tasks/eus_exams/eus_exams_eu_opegasteizkoudala.yaml |multiple_choice | | |
| |eus_exams_eu_opeosakiadmineu |lm_eval/tasks/eus_exams/eus_exams_eu_opeosakiadmineu.yaml |multiple_choice | | |
| |eus_exams_eu_opeosakiauxenfeu |lm_eval/tasks/eus_exams/eus_exams_eu_opeosakiauxenfeu.yaml |multiple_choice | | |
| |eus_exams_eu_opeosakiauxeu |lm_eval/tasks/eus_exams/eus_exams_eu_opeosakiauxeu.yaml |multiple_choice | | |
| |eus_exams_eu_opeosakiceladoreu |lm_eval/tasks/eus_exams/eus_exams_eu_opeosakiceladoreu.yaml |multiple_choice | | |
| |eus_exams_eu_opeosakienfeu |lm_eval/tasks/eus_exams/eus_exams_eu_opeosakienfeu.yaml |multiple_choice | | |
| |eus_exams_eu_opeosakioperarioeu |lm_eval/tasks/eus_exams/eus_exams_eu_opeosakioperarioeu.yaml |multiple_choice | | |
| |eus_exams_eu_opeosakitecnicoeu |lm_eval/tasks/eus_exams/eus_exams_eu_opeosakitecnicoeu.yaml |multiple_choice | | |
| |eus_exams_eu_opeosakivarioseu |lm_eval/tasks/eus_exams/eus_exams_eu_opeosakivarioseu.yaml |multiple_choice | | |
| |eus_exams_eu_osakidetza1e |lm_eval/tasks/eus_exams/eus_exams_eu_osakidetza1e.yaml |multiple_choice | | |
| |eus_exams_eu_osakidetza2e |lm_eval/tasks/eus_exams/eus_exams_eu_osakidetza2e.yaml |multiple_choice | | |
| |eus_exams_eu_osakidetza3e |lm_eval/tasks/eus_exams/eus_exams_eu_osakidetza3e.yaml |multiple_choice | | |
| |eus_exams_eu_osakidetza5e |lm_eval/tasks/eus_exams/eus_exams_eu_osakidetza5e.yaml |multiple_choice | | |
| |eus_exams_eu_osakidetza6e |lm_eval/tasks/eus_exams/eus_exams_eu_osakidetza6e.yaml |multiple_choice | | |
| |eus_exams_eu_osakidetza7e |lm_eval/tasks/eus_exams/eus_exams_eu_osakidetza7e.yaml |multiple_choice | | |
| |eus_proficiency |lm_eval/tasks/eus_proficiency/eus_proficiency.yaml |multiple_choice | | |
| |eus_reading |lm_eval/tasks/eus_reading/eus_reading.yaml |multiple_choice | | |
| |eus_trivia |lm_eval/tasks/eus_trivia/eus_trivia.yaml |multiple_choice | | |
| |evalita-mp_at_prompt-1 |lm_eval/tasks/evalita_llm/_evalita-mp_at_task_p1.yaml |multiple_choice | | |
| |evalita-mp_at_prompt-2 |lm_eval/tasks/evalita_llm/_evalita-mp_at_task_p2.yaml |multiple_choice | | |
| |evalita-mp_at_prompt-3 |lm_eval/tasks/evalita_llm/_evalita-mp_at_task_p3.yaml |multiple_choice | | |
| |evalita-mp_at_prompt-4 |lm_eval/tasks/evalita_llm/_evalita-mp_at_task_p4.yaml |multiple_choice | | |
| |evalita-mp_at_prompt-5 |lm_eval/tasks/evalita_llm/_evalita-mp_at_task_p5.yaml |multiple_choice | | |
| |evalita-mp_at_prompt-6 |lm_eval/tasks/evalita_llm/_evalita-mp_at_task_p6.yaml |multiple_choice | | |
| |evalita-mp_faq_prompt-1 |lm_eval/tasks/evalita_llm/_evalita-mp_faq_p1.yaml |multiple_choice | | |
| |evalita-mp_faq_prompt-2 |lm_eval/tasks/evalita_llm/_evalita-mp_faq_p2.yaml |multiple_choice | | |
| |evalita-mp_faq_prompt-3 |lm_eval/tasks/evalita_llm/_evalita-mp_faq_p3.yaml |multiple_choice | | |
| |evalita-mp_faq_prompt-4 |lm_eval/tasks/evalita_llm/_evalita-mp_faq_p4.yaml |multiple_choice | | |
| |evalita-mp_faq_prompt-5 |lm_eval/tasks/evalita_llm/_evalita-mp_faq_p5.yaml |multiple_choice | | |
| |evalita-mp_faq_prompt-6 |lm_eval/tasks/evalita_llm/_evalita-mp_faq_p6.yaml |multiple_choice | | |
| |evalita-mp_hs_prompt-1 |lm_eval/tasks/evalita_llm/_evalita-mp_hs_p1.yaml |multiple_choice | | |
| |evalita-mp_hs_prompt-2 |lm_eval/tasks/evalita_llm/_evalita-mp_hs_p2.yaml |multiple_choice | | |
| |evalita-mp_hs_prompt-3 |lm_eval/tasks/evalita_llm/_evalita-mp_hs_p3.yaml |multiple_choice | | |
| |evalita-mp_hs_prompt-4 |lm_eval/tasks/evalita_llm/_evalita-mp_hs_p4.yaml |multiple_choice | | |
| |evalita-mp_hs_prompt-5 |lm_eval/tasks/evalita_llm/_evalita-mp_hs_p5.yaml |multiple_choice | | |
| |evalita-mp_hs_prompt-6 |lm_eval/tasks/evalita_llm/_evalita-mp_hs_p6.yaml |multiple_choice | | |
| |evalita-mp_ls_prompt-1 |lm_eval/tasks/evalita_llm/_evalita-mp_ls_p1.yaml |generate_until | | |
| |evalita-mp_ls_prompt-2 |lm_eval/tasks/evalita_llm/_evalita-mp_ls_p2.yaml |generate_until | | |
| |evalita-mp_ner-v2_adg_p1 |lm_eval/tasks/evalita_llm/_evalita-mp_ner-adg_group_p1.yaml |generate_until | | |
| |evalita-mp_ner-v2_adg_p2 |lm_eval/tasks/evalita_llm/_evalita-mp_ner-adg_group_p2.yaml |generate_until | | |
| |evalita-mp_ner-v2_fic_p1 |lm_eval/tasks/evalita_llm/_evalita-mp_ner-fic_group_p1.yaml |generate_until | | |
| |evalita-mp_ner-v2_fic_p2 |lm_eval/tasks/evalita_llm/_evalita-mp_ner-fic_group_p2.yaml |generate_until | | |
| |evalita-mp_ner-v2_wn_p1 |lm_eval/tasks/evalita_llm/_evalita-mp_ner-wn_group_p1.yaml |generate_until | | |
| |evalita-mp_ner-v2_wn_p2 |lm_eval/tasks/evalita_llm/_evalita-mp_ner-wn_group_p2.yaml |generate_until | | |
| |evalita-mp_ner_adg_p1 |lm_eval/tasks/evalita_llm/_evalita-mp_ner_adg_p1.yaml |generate_until | | |
| |evalita-mp_ner_adg_p2 |lm_eval/tasks/evalita_llm/_evalita-mp_ner_adg_p2.yaml |generate_until | | |
| |evalita-mp_ner_fic_p1 |lm_eval/tasks/evalita_llm/_evalita-mp_ner_fic_p1.yaml |generate_until | | |
| |evalita-mp_ner_fic_p2 |lm_eval/tasks/evalita_llm/_evalita-mp_ner_fic_p2.yaml |generate_until | | |
| |evalita-mp_ner_wn_p1 |lm_eval/tasks/evalita_llm/_evalita-mp_ner_wn_p1.yaml |generate_until | | |
| |evalita-mp_ner_wn_p2 |lm_eval/tasks/evalita_llm/_evalita-mp_ner_wn_p2.yaml |generate_until | | |
| |evalita-mp_re_prompt-1 |lm_eval/tasks/evalita_llm/_evalita-mp_re_p1.yaml |generate_until | | |
| |evalita-mp_re_prompt-2 |lm_eval/tasks/evalita_llm/_evalita-mp_re_p2.yaml |generate_until | | |
| |evalita-mp_sa_prompt-1 |lm_eval/tasks/evalita_llm/_evalita-mp_sa_p1.yaml |multiple_choice | | |
| |evalita-mp_sa_prompt-2 |lm_eval/tasks/evalita_llm/_evalita-mp_sa_p2.yaml |multiple_choice | | |
| |evalita-mp_sa_prompt-3 |lm_eval/tasks/evalita_llm/_evalita-mp_sa_p3.yaml |multiple_choice | | |
| |evalita-mp_sa_prompt-4 |lm_eval/tasks/evalita_llm/_evalita-mp_sa_p4.yaml |multiple_choice | | |
| |evalita-mp_sa_prompt-5 |lm_eval/tasks/evalita_llm/_evalita-mp_sa_p5.yaml |multiple_choice | | |
| |evalita-mp_sa_prompt-6 |lm_eval/tasks/evalita_llm/_evalita-mp_sa_p6.yaml |multiple_choice | | |
| |evalita-mp_te_prompt-1 |lm_eval/tasks/evalita_llm/_evalita-mp_te_p1.yaml |multiple_choice | | |
| |evalita-mp_te_prompt-2 |lm_eval/tasks/evalita_llm/_evalita-mp_te_p2.yaml |multiple_choice | | |
| |evalita-mp_te_prompt-3 |lm_eval/tasks/evalita_llm/_evalita-mp_te_p3.yaml |multiple_choice | | |
| |evalita-mp_te_prompt-4 |lm_eval/tasks/evalita_llm/_evalita-mp_te_p4.yaml |multiple_choice | | |
| |evalita-mp_te_prompt-5 |lm_eval/tasks/evalita_llm/_evalita-mp_te_p5.yaml |multiple_choice | | |
| |evalita-mp_te_prompt-6 |lm_eval/tasks/evalita_llm/_evalita-mp_te_p6.yaml |multiple_choice | | |
| |evalita-mp_wic_prompt-1 |lm_eval/tasks/evalita_llm/_evalita-mp_wic_p1.yaml |multiple_choice | | |
| |evalita-mp_wic_prompt-2 |lm_eval/tasks/evalita_llm/_evalita-mp_wic_p2.yaml |multiple_choice | | |
| |evalita-mp_wic_prompt-3 |lm_eval/tasks/evalita_llm/_evalita-mp_wic_p3.yaml |multiple_choice | | |
| |evalita-mp_wic_prompt-4 |lm_eval/tasks/evalita_llm/_evalita-mp_wic_p4.yaml |multiple_choice | | |
| |evalita-mp_wic_prompt-5 |lm_eval/tasks/evalita_llm/_evalita-mp_wic_p5.yaml |multiple_choice | | |
| |evalita-mp_wic_prompt-6 |lm_eval/tasks/evalita_llm/_evalita-mp_wic_p6.yaml |multiple_choice | | |
| |evalita-sp_sum_task_fp-small_p1 |lm_eval/tasks/evalita_llm/_evalita-mp_sum_fp-small_p1.yaml |generate_until | | |
| |evalita-sp_sum_task_fp-small_p2 |lm_eval/tasks/evalita_llm/_evalita-mp_sum_fp-small_p2.yaml |generate_until | | |
| |evalita-sp_sum_task_fp_p1 |lm_eval/tasks/evalita_llm/_evalita-mp_sum_fp_p1.yaml |generate_until | | |
| |evalita-sp_sum_task_fp_p2 |lm_eval/tasks/evalita_llm/_evalita-mp_sum_fp_p2.yaml |generate_until | | |
| |fda |lm_eval/tasks/fda/fda.yaml | | | |
| |financial_tweets |lm_eval/tasks/unitxt/financial_tweets.yaml | | | |
| |fld_default |lm_eval/tasks/fld/fld_default.yaml | | | |
| |fld_logical_formula_default |lm_eval/tasks/fld/fld_logical_formula_default.yaml | | | |
| |fld_logical_formula_star |lm_eval/tasks/fld/fld_logical_formula_star.yaml | | | |
| |fld_star |lm_eval/tasks/fld/fld_star.yaml | | | |
| |flores_ace_Arab-eng_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/african-english/flores_ace_Arab-eng_Latn.yaml |generate_until | | |
| |flores_ace_Arab-eng_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/african-english/flores_ace_Arab-eng_Latn.yaml |generate_until | | |
| |flores_ace_Arab-eng_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/african-english/flores_ace_Arab-eng_Latn.yaml |generate_until | | |
| |flores_ace_Latn-eng_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/african-english/flores_ace_Latn-eng_Latn.yaml |generate_until | | |
| |flores_ace_Latn-eng_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/african-english/flores_ace_Latn-eng_Latn.yaml |generate_until | | |
| |flores_ace_Latn-eng_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/african-english/flores_ace_Latn-eng_Latn.yaml |generate_until | | |
| |flores_acq_Arab-eng_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/african-english/flores_acq_Arab-eng_Latn.yaml |generate_until | | |
| |flores_acq_Arab-eng_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/african-english/flores_acq_Arab-eng_Latn.yaml |generate_until | | |
| |flores_acq_Arab-eng_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/african-english/flores_acq_Arab-eng_Latn.yaml |generate_until | | |
| |flores_aeb_Arab-eng_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/african-english/flores_aeb_Arab-eng_Latn.yaml |generate_until | | |
| |flores_aeb_Arab-eng_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/african-english/flores_aeb_Arab-eng_Latn.yaml |generate_until | | |
| |flores_aeb_Arab-eng_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/african-english/flores_aeb_Arab-eng_Latn.yaml |generate_until | | |
| |flores_afr_Latn-eng_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/african-english/flores_afr_Latn-eng_Latn.yaml |generate_until | | |
| |flores_afr_Latn-eng_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/african-english/flores_afr_Latn-eng_Latn.yaml |generate_until | | |
| |flores_afr_Latn-eng_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/african-english/flores_afr_Latn-eng_Latn.yaml |generate_until | | |
| |flores_aka_Latn-eng_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/african-english/flores_aka_Latn-eng_Latn.yaml |generate_until | | |
| |flores_aka_Latn-eng_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/african-english/flores_aka_Latn-eng_Latn.yaml |generate_until | | |
| |flores_aka_Latn-eng_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/african-english/flores_aka_Latn-eng_Latn.yaml |generate_until | | |
| |flores_amh_Ethi-eng_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/african-english/flores_amh_Ethi-eng_Latn.yaml |generate_until | | |
| |flores_amh_Ethi-eng_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/african-english/flores_amh_Ethi-eng_Latn.yaml |generate_until | | |
| |flores_amh_Ethi-eng_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/african-english/flores_amh_Ethi-eng_Latn.yaml |generate_until | | |
| |flores_ary_Arab-eng_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/african-english/flores_ary_Arab-eng_Latn.yaml |generate_until | | |
| |flores_ary_Arab-eng_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/african-english/flores_ary_Arab-eng_Latn.yaml |generate_until | | |
| |flores_ary_Arab-eng_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/african-english/flores_ary_Arab-eng_Latn.yaml |generate_until | | |
| |flores_arz_Arab-eng_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/african-english/flores_arz_Arab-eng_Latn.yaml |generate_until | | |
| |flores_arz_Arab-eng_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/african-english/flores_arz_Arab-eng_Latn.yaml |generate_until | | |
| |flores_arz_Arab-eng_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/african-english/flores_arz_Arab-eng_Latn.yaml |generate_until | | |
| |flores_bam_Latn-eng_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/african-english/flores_bam_Latn-eng_Latn.yaml |generate_until | | |
| |flores_bam_Latn-eng_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/african-english/flores_bam_Latn-eng_Latn.yaml |generate_until | | |
| |flores_bam_Latn-eng_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/african-english/flores_bam_Latn-eng_Latn.yaml |generate_until | | |
| |flores_ban_Latn-eng_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/african-english/flores_ban_Latn-eng_Latn.yaml |generate_until | | |
| |flores_ban_Latn-eng_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/african-english/flores_ban_Latn-eng_Latn.yaml |generate_until | | |
| |flores_ban_Latn-eng_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/african-english/flores_ban_Latn-eng_Latn.yaml |generate_until | | |
| |flores_bem_Latn-eng_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/african-english/flores_bem_Latn-eng_Latn.yaml |generate_until | | |
| |flores_bem_Latn-eng_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/african-english/flores_bem_Latn-eng_Latn.yaml |generate_until | | |
| |flores_bem_Latn-eng_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/african-english/flores_bem_Latn-eng_Latn.yaml |generate_until | | |
| |flores_ca-de |lm_eval/tasks/catalan_bench/flores_ca/flores_ca-de.yaml |generate_until | | |
| |flores_ca-en |lm_eval/tasks/catalan_bench/flores_ca/flores_ca-en.yaml |generate_until | | |
| |flores_ca-es |lm_eval/tasks/spanish_bench/flores_es/flores_ca-es.yaml |generate_until | | |
| |flores_ca-eu |lm_eval/tasks/basque_bench/flores_eu/flores_ca-eu.yaml |generate_until | | |
| |flores_ca-fr |lm_eval/tasks/catalan_bench/flores_ca/flores_ca-fr.yaml |generate_until | | |
| |flores_ca-gl |lm_eval/tasks/galician_bench/flores_gl/flores_ca-gl.yaml |generate_until | | |
| |flores_ca-it |lm_eval/tasks/catalan_bench/flores_ca/flores_ca-it.yaml |generate_until | | |
| |flores_ca-pt |lm_eval/tasks/portuguese_bench/flores_pt/flores_ca-pt.yaml |generate_until | | |
| |flores_cjk_Latn-eng_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/african-english/flores_cjk_Latn-eng_Latn.yaml |generate_until | | |
| |flores_cjk_Latn-eng_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/african-english/flores_cjk_Latn-eng_Latn.yaml |generate_until | | |
| |flores_cjk_Latn-eng_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/african-english/flores_cjk_Latn-eng_Latn.yaml |generate_until | | |
| |flores_de-ca |lm_eval/tasks/catalan_bench/flores_ca/flores_de-ca.yaml |generate_until | | |
| |flores_de-es |lm_eval/tasks/spanish_bench/flores_es/flores_de-es.yaml |generate_until | | |
| |flores_de-eu |lm_eval/tasks/basque_bench/flores_eu/flores_de-eu.yaml |generate_until | | |
| |flores_de-gl |lm_eval/tasks/galician_bench/flores_gl/flores_de-gl.yaml |generate_until | | |
| |flores_de-pt |lm_eval/tasks/portuguese_bench/flores_pt/flores_de-pt.yaml |generate_until | | |
| |flores_dik_Latn-eng_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/african-english/flores_dik_Latn-eng_Latn.yaml |generate_until | | |
| |flores_dik_Latn-eng_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/african-english/flores_dik_Latn-eng_Latn.yaml |generate_until | | |
| |flores_dik_Latn-eng_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/african-english/flores_dik_Latn-eng_Latn.yaml |generate_until | | |
| |flores_dyu_Latn-eng_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/african-english/flores_dyu_Latn-eng_Latn.yaml |generate_until | | |
| |flores_dyu_Latn-eng_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/african-english/flores_dyu_Latn-eng_Latn.yaml |generate_until | | |
| |flores_dyu_Latn-eng_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/african-english/flores_dyu_Latn-eng_Latn.yaml |generate_until | | |
| |flores_en-ca |lm_eval/tasks/catalan_bench/flores_ca/flores_en-ca.yaml |generate_until | | |
| |flores_en-es |lm_eval/tasks/spanish_bench/flores_es/flores_en-es.yaml |generate_until | | |
| |flores_en-eu |lm_eval/tasks/basque_bench/flores_eu/flores_en-eu.yaml |generate_until | | |
| |flores_en-gl |lm_eval/tasks/galician_bench/flores_gl/flores_en-gl.yaml |generate_until | | |
| |flores_en-pt |lm_eval/tasks/portuguese_bench/flores_pt/flores_en-pt.yaml |generate_until | | |
| |flores_eng_Latn-ace_Arab_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/english-african/flores_eng_Latn-ace_Arab.yaml |generate_until | | |
| |flores_eng_Latn-ace_Arab_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/english-african/flores_eng_Latn-ace_Arab.yaml |generate_until | | |
| |flores_eng_Latn-ace_Arab_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/english-african/flores_eng_Latn-ace_Arab.yaml |generate_until | | |
| |flores_eng_Latn-ace_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/english-african/flores_eng_Latn-ace_Latn.yaml |generate_until | | |
| |flores_eng_Latn-ace_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/english-african/flores_eng_Latn-ace_Latn.yaml |generate_until | | |
| |flores_eng_Latn-ace_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/english-african/flores_eng_Latn-ace_Latn.yaml |generate_until | | |
| |flores_eng_Latn-acq_Arab_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/english-african/flores_eng_Latn-acq_Arab.yaml |generate_until | | |
| |flores_eng_Latn-acq_Arab_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/english-african/flores_eng_Latn-acq_Arab.yaml |generate_until | | |
| |flores_eng_Latn-acq_Arab_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/english-african/flores_eng_Latn-acq_Arab.yaml |generate_until | | |
| |flores_eng_Latn-aeb_Arab_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/english-african/flores_eng_Latn-aeb_Arab.yaml |generate_until | | |
| |flores_eng_Latn-aeb_Arab_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/english-african/flores_eng_Latn-aeb_Arab.yaml |generate_until | | |
| |flores_eng_Latn-aeb_Arab_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/english-african/flores_eng_Latn-aeb_Arab.yaml |generate_until | | |
| |flores_eng_Latn-afr_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/english-african/flores_eng_Latn-afr_Latn.yaml |generate_until | | |
| |flores_eng_Latn-afr_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/english-african/flores_eng_Latn-afr_Latn.yaml |generate_until | | |
| |flores_eng_Latn-afr_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/english-african/flores_eng_Latn-afr_Latn.yaml |generate_until | | |
| |flores_eng_Latn-aka_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/english-african/flores_eng_Latn-aka_Latn.yaml |generate_until | | |
| |flores_eng_Latn-aka_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/english-african/flores_eng_Latn-aka_Latn.yaml |generate_until | | |
| |flores_eng_Latn-aka_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/english-african/flores_eng_Latn-aka_Latn.yaml |generate_until | | |
| |flores_eng_Latn-amh_Ethi_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/english-african/flores_eng_Latn-amh_Ethi.yaml |generate_until | | |
| |flores_eng_Latn-amh_Ethi_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/english-african/flores_eng_Latn-amh_Ethi.yaml |generate_until | | |
| |flores_eng_Latn-amh_Ethi_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/english-african/flores_eng_Latn-amh_Ethi.yaml |generate_until | | |
| |flores_eng_Latn-ary_Arab_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/english-african/flores_eng_Latn-ary_Arab.yaml |generate_until | | |
| |flores_eng_Latn-ary_Arab_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/english-african/flores_eng_Latn-ary_Arab.yaml |generate_until | | |
| |flores_eng_Latn-ary_Arab_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/english-african/flores_eng_Latn-ary_Arab.yaml |generate_until | | |
| |flores_eng_Latn-arz_Arab_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/english-african/flores_eng_Latn-arz_Arab.yaml |generate_until | | |
| |flores_eng_Latn-arz_Arab_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/english-african/flores_eng_Latn-arz_Arab.yaml |generate_until | | |
| |flores_eng_Latn-arz_Arab_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/english-african/flores_eng_Latn-arz_Arab.yaml |generate_until | | |
| |flores_eng_Latn-bam_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/english-african/flores_eng_Latn-bam_Latn.yaml |generate_until | | |
| |flores_eng_Latn-bam_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/english-african/flores_eng_Latn-bam_Latn.yaml |generate_until | | |
| |flores_eng_Latn-bam_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/english-african/flores_eng_Latn-bam_Latn.yaml |generate_until | | |
| |flores_eng_Latn-ban_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/english-african/flores_eng_Latn-ban_Latn.yaml |generate_until | | |
| |flores_eng_Latn-ban_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/english-african/flores_eng_Latn-ban_Latn.yaml |generate_until | | |
| |flores_eng_Latn-ban_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/english-african/flores_eng_Latn-ban_Latn.yaml |generate_until | | |
| |flores_eng_Latn-bem_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/english-african/flores_eng_Latn-bem_Latn.yaml |generate_until | | |
| |flores_eng_Latn-bem_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/english-african/flores_eng_Latn-bem_Latn.yaml |generate_until | | |
| |flores_eng_Latn-bem_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/english-african/flores_eng_Latn-bem_Latn.yaml |generate_until | | |
| |flores_eng_Latn-cjk_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/english-african/flores_eng_Latn-cjk_Latn.yaml |generate_until | | |
| |flores_eng_Latn-cjk_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/english-african/flores_eng_Latn-cjk_Latn.yaml |generate_until | | |
| |flores_eng_Latn-cjk_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/english-african/flores_eng_Latn-cjk_Latn.yaml |generate_until | | |
| |flores_eng_Latn-dik_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/english-african/flores_eng_Latn-dik_Latn.yaml |generate_until | | |
| |flores_eng_Latn-dik_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/english-african/flores_eng_Latn-dik_Latn.yaml |generate_until | | |
| |flores_eng_Latn-dik_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/english-african/flores_eng_Latn-dik_Latn.yaml |generate_until | | |
| |flores_eng_Latn-dyu_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/english-african/flores_eng_Latn-dyu_Latn.yaml |generate_until | | |
| |flores_eng_Latn-dyu_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/english-african/flores_eng_Latn-dyu_Latn.yaml |generate_until | | |
| |flores_eng_Latn-dyu_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/english-african/flores_eng_Latn-dyu_Latn.yaml |generate_until | | |
| |flores_eng_Latn-ewe_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/english-african/flores_eng_Latn-ewe_Latn.yaml |generate_until | | |
| |flores_eng_Latn-ewe_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/english-african/flores_eng_Latn-ewe_Latn.yaml |generate_until | | |
| |flores_eng_Latn-ewe_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/english-african/flores_eng_Latn-ewe_Latn.yaml |generate_until | | |
| |flores_eng_Latn-fon_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/english-african/flores_eng_Latn-fon_Latn.yaml |generate_until | | |
| |flores_eng_Latn-fon_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/english-african/flores_eng_Latn-fon_Latn.yaml |generate_until | | |
| |flores_eng_Latn-fon_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/english-african/flores_eng_Latn-fon_Latn.yaml |generate_until | | |
| |flores_eng_Latn-fra_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/english-african/flores_eng_Latn-fra_Latn.yaml |generate_until | | |
| |flores_eng_Latn-fra_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/english-african/flores_eng_Latn-fra_Latn.yaml |generate_until | | |
| |flores_eng_Latn-fra_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/english-african/flores_eng_Latn-fra_Latn.yaml |generate_until | | |
| |flores_eng_Latn-fuv_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/english-african/flores_eng_Latn-fuv_Latn.yaml |generate_until | | |
| |flores_eng_Latn-fuv_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/english-african/flores_eng_Latn-fuv_Latn.yaml |generate_until | | |
| |flores_eng_Latn-fuv_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/english-african/flores_eng_Latn-fuv_Latn.yaml |generate_until | | |
| |flores_eng_Latn-gaz_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/english-african/flores_eng_Latn-gaz_Latn.yaml |generate_until | | |
| |flores_eng_Latn-gaz_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/english-african/flores_eng_Latn-gaz_Latn.yaml |generate_until | | |
| |flores_eng_Latn-gaz_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/english-african/flores_eng_Latn-gaz_Latn.yaml |generate_until | | |
| |flores_eng_Latn-hau_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/english-african/flores_eng_Latn-hau_Latn.yaml |generate_until | | |
| |flores_eng_Latn-hau_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/english-african/flores_eng_Latn-hau_Latn.yaml |generate_until | | |
| |flores_eng_Latn-hau_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/english-african/flores_eng_Latn-hau_Latn.yaml |generate_until | | |
| |flores_eng_Latn-ibo_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/english-african/flores_eng_Latn-ibo_Latn.yaml |generate_until | | |
| |flores_eng_Latn-ibo_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/english-african/flores_eng_Latn-ibo_Latn.yaml |generate_until | | |
| |flores_eng_Latn-ibo_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/english-african/flores_eng_Latn-ibo_Latn.yaml |generate_until | | |
| |flores_eng_Latn-kab_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/english-african/flores_eng_Latn-kab_Latn.yaml |generate_until | | |
| |flores_eng_Latn-kab_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/english-african/flores_eng_Latn-kab_Latn.yaml |generate_until | | |
| |flores_eng_Latn-kab_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/english-african/flores_eng_Latn-kab_Latn.yaml |generate_until | | |
| |flores_eng_Latn-kam_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/english-african/flores_eng_Latn-kam_Latn.yaml |generate_until | | |
| |flores_eng_Latn-kam_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/english-african/flores_eng_Latn-kam_Latn.yaml |generate_until | | |
| |flores_eng_Latn-kam_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/english-african/flores_eng_Latn-kam_Latn.yaml |generate_until | | |
| |flores_eng_Latn-kbp_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/english-african/flores_eng_Latn-kbp_Latn.yaml |generate_until | | |
| |flores_eng_Latn-kbp_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/english-african/flores_eng_Latn-kbp_Latn.yaml |generate_until | | |
| |flores_eng_Latn-kbp_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/english-african/flores_eng_Latn-kbp_Latn.yaml |generate_until | | |
| |flores_eng_Latn-kea_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/english-african/flores_eng_Latn-kea_Latn.yaml |generate_until | | |
| |flores_eng_Latn-kea_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/english-african/flores_eng_Latn-kea_Latn.yaml |generate_until | | |
| |flores_eng_Latn-kea_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/english-african/flores_eng_Latn-kea_Latn.yaml |generate_until | | |
| |flores_eng_Latn-kik_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/english-african/flores_eng_Latn-kik_Latn.yaml |generate_until | | |
| |flores_eng_Latn-kik_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/english-african/flores_eng_Latn-kik_Latn.yaml |generate_until | | |
| |flores_eng_Latn-kik_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/english-african/flores_eng_Latn-kik_Latn.yaml |generate_until | | |
| |flores_eng_Latn-kin_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/english-african/flores_eng_Latn-kin_Latn.yaml |generate_until | | |
| |flores_eng_Latn-kin_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/english-african/flores_eng_Latn-kin_Latn.yaml |generate_until | | |
| |flores_eng_Latn-kin_Latn_prompt_3 |lm_eval/tasks/afrobench/flores/prompt_3/english-african/flores_eng_Latn-kin_Latn.yaml |generate_until | | |
| |flores_eng_Latn-kmb_Latn_prompt_1 |lm_eval/tasks/afrobench/flores/prompt_1/english-african/flores_eng_Latn-kmb_Latn.yaml |generate_until | | |
| |flores_eng_Latn-kmb_Latn_prompt_2 |lm_eval/tasks/afrobench/flores/prompt_2/english-african/flore |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment