Merge branch 'big-refactor' into verbosity-rework

574e565a · Lintang Sutawika · GitHub · 73f3029c · b7a4ea06 · 574e565a
Unverified commit 574e565a, authored Nov 10, 2023 by Lintang Sutawika; committed by GitHub on Nov 10, 2023.
20 changed files
--- a/lm_eval/tasks/mmlu/default/mmlu_high_school_psychology.yaml
+++ b/lm_eval/tasks/mmlu/default/mmlu_high_school_psychology.yaml
 "dataset_name": "high_school_psychology"
-"description": "The following are multiple choice questions (with answers) about high school psychology.\n\n"
+"description": "The following are multiple choice questions (with answers) about high\
+  \ school psychology.\n\n"
+"group": "mmlu_social_sciences"
+"group_alias": "social_sciences"
 "include": "_default_template_yaml"
 "task": "mmlu_high_school_psychology"
+"task_alias": "high_school_psychology"
--- a/lm_eval/tasks/mmlu/default/mmlu_high_school_statistics.yaml
+++ b/lm_eval/tasks/mmlu/default/mmlu_high_school_statistics.yaml
 "dataset_name": "high_school_statistics"
-"description": "The following are multiple choice questions (with answers) about high school statistics.\n\n"
+"description": "The following are multiple choice questions (with answers) about high\
+  \ school statistics.\n\n"
+"group": "mmlu_stem"
+"group_alias": "stem"
 "include": "_default_template_yaml"
 "task": "mmlu_high_school_statistics"
+"task_alias": "high_school_statistics"
--- a/lm_eval/tasks/mmlu/default/mmlu_high_school_us_history.yaml
+++ b/lm_eval/tasks/mmlu/default/mmlu_high_school_us_history.yaml
 "dataset_name": "high_school_us_history"
-"description": "The following are multiple choice questions (with answers) about high school us history.\n\n"
+"description": "The following are multiple choice questions (with answers) about high\
+  \ school us history.\n\n"
+"group": "mmlu_humanities"
+"group_alias": "humanities"
 "include": "_default_template_yaml"
 "task": "mmlu_high_school_us_history"
+"task_alias": "high_school_us_history"
--- a/lm_eval/tasks/mmlu/default/mmlu_high_school_world_history.yaml
+++ b/lm_eval/tasks/mmlu/default/mmlu_high_school_world_history.yaml
 "dataset_name": "high_school_world_history"
-"description": "The following are multiple choice questions (with answers) about high school world history.\n\n"
+"description": "The following are multiple choice questions (with answers) about high\
+  \ school world history.\n\n"
+"group": "mmlu_humanities"
+"group_alias": "humanities"
 "include": "_default_template_yaml"
 "task": "mmlu_high_school_world_history"
+"task_alias": "high_school_world_history"
--- a/lm_eval/tasks/mmlu/default/mmlu_human_aging.yaml
+++ b/lm_eval/tasks/mmlu/default/mmlu_human_aging.yaml
 "dataset_name": "human_aging"
-"description": "The following are multiple choice questions (with answers) about human aging.\n\n"
+"description": "The following are multiple choice questions (with answers) about human\
+  \ aging.\n\n"
+"group": "mmlu_other"
+"group_alias": "other"
 "include": "_default_template_yaml"
 "task": "mmlu_human_aging"
+"task_alias": "human_aging"
--- a/lm_eval/tasks/mmlu/default/mmlu_human_sexuality.yaml
+++ b/lm_eval/tasks/mmlu/default/mmlu_human_sexuality.yaml
 "dataset_name": "human_sexuality"
-"description": "The following are multiple choice questions (with answers) about human sexuality.\n\n"
+"description": "The following are multiple choice questions (with answers) about human\
+  \ sexuality.\n\n"
+"group": "mmlu_social_sciences"
+"group_alias": "social_sciences"
 "include": "_default_template_yaml"
 "task": "mmlu_human_sexuality"
+"task_alias": "human_sexuality"
--- a/lm_eval/tasks/mmlu/default/mmlu_international_law.yaml
+++ b/lm_eval/tasks/mmlu/default/mmlu_international_law.yaml
 "dataset_name": "international_law"
-"description": "The following are multiple choice questions (with answers) about international law.\n\n"
+"description": "The following are multiple choice questions (with answers) about international\
+  \ law.\n\n"
+"group": "mmlu_humanities"
+"group_alias": "humanities"
 "include": "_default_template_yaml"
 "task": "mmlu_international_law"
+"task_alias": "international_law"
--- a/lm_eval/tasks/mmlu/default/mmlu_jurisprudence.yaml
+++ b/lm_eval/tasks/mmlu/default/mmlu_jurisprudence.yaml
 "dataset_name": "jurisprudence"
-"description": "The following are multiple choice questions (with answers) about jurisprudence.\n\n"
+"description": "The following are multiple choice questions (with answers) about jurisprudence.\n\
+  \n"
+"group": "mmlu_humanities"
+"group_alias": "humanities"
 "include": "_default_template_yaml"
 "task": "mmlu_jurisprudence"
+"task_alias": "jurisprudence"
--- a/lm_eval/tasks/mmlu/default/mmlu_logical_fallacies.yaml
+++ b/lm_eval/tasks/mmlu/default/mmlu_logical_fallacies.yaml
 "dataset_name": "logical_fallacies"
-"description": "The following are multiple choice questions (with answers) about logical fallacies.\n\n"
+"description": "The following are multiple choice questions (with answers) about logical\
+  \ fallacies.\n\n"
+"group": "mmlu_humanities"
+"group_alias": "humanities"
 "include": "_default_template_yaml"
 "task": "mmlu_logical_fallacies"
+"task_alias": "logical_fallacies"
--- a/lm_eval/tasks/mmlu/default/mmlu_machine_learning.yaml
+++ b/lm_eval/tasks/mmlu/default/mmlu_machine_learning.yaml
 "dataset_name": "machine_learning"
-"description": "The following are multiple choice questions (with answers) about machine learning.\n\n"
+"description": "The following are multiple choice questions (with answers) about machine\
+  \ learning.\n\n"
+"group": "mmlu_stem"
+"group_alias": "stem"
 "include": "_default_template_yaml"
 "task": "mmlu_machine_learning"
+"task_alias": "machine_learning"
--- a/lm_eval/tasks/mmlu/default/mmlu_management.yaml
+++ b/lm_eval/tasks/mmlu/default/mmlu_management.yaml
 "dataset_name": "management"
-"description": "The following are multiple choice questions (with answers) about management.\n\n"
+"description": "The following are multiple choice questions (with answers) about management.\n\
+  \n"
+"group": "mmlu_other"
+"group_alias": "other"
 "include": "_default_template_yaml"
 "task": "mmlu_management"
+"task_alias": "management"
--- a/lm_eval/tasks/mmlu/default/mmlu_marketing.yaml
+++ b/lm_eval/tasks/mmlu/default/mmlu_marketing.yaml
 "dataset_name": "marketing"
-"description": "The following are multiple choice questions (with answers) about marketing.\n\n"
+"description": "The following are multiple choice questions (with answers) about marketing.\n\
+  \n"
+"group": "mmlu_other"
+"group_alias": "other"
 "include": "_default_template_yaml"
 "task": "mmlu_marketing"
+"task_alias": "marketing"
--- a/lm_eval/tasks/mmlu/default/mmlu_medical_genetics.yaml
+++ b/lm_eval/tasks/mmlu/default/mmlu_medical_genetics.yaml
 "dataset_name": "medical_genetics"
-"description": "The following are multiple choice questions (with answers) about medical genetics.\n\n"
+"description": "The following are multiple choice questions (with answers) about medical\
+  \ genetics.\n\n"
+"group": "mmlu_other"
+"group_alias": "other"
 "include": "_default_template_yaml"
 "task": "mmlu_medical_genetics"
+"task_alias": "medical_genetics"
--- a/lm_eval/tasks/mmlu/default/mmlu_miscellaneous.yaml
+++ b/lm_eval/tasks/mmlu/default/mmlu_miscellaneous.yaml
 "dataset_name": "miscellaneous"
-"description": "The following are multiple choice questions (with answers) about miscellaneous.\n\n"
+"description": "The following are multiple choice questions (with answers) about miscellaneous.\n\
+  \n"
+"group": "mmlu_other"
+"group_alias": "other"
 "include": "_default_template_yaml"
 "task": "mmlu_miscellaneous"
+"task_alias": "miscellaneous"
--- a/lm_eval/tasks/mmlu/default/mmlu_moral_disputes.yaml
+++ b/lm_eval/tasks/mmlu/default/mmlu_moral_disputes.yaml
 "dataset_name": "moral_disputes"
-"description": "The following are multiple choice questions (with answers) about moral disputes.\n\n"
+"description": "The following are multiple choice questions (with answers) about moral\
+  \ disputes.\n\n"
+"group": "mmlu_humanities"
+"group_alias": "humanities"
 "include": "_default_template_yaml"
 "task": "mmlu_moral_disputes"
+"task_alias": "moral_disputes"
--- a/lm_eval/tasks/mmlu/default/mmlu_moral_scenarios.yaml
+++ b/lm_eval/tasks/mmlu/default/mmlu_moral_scenarios.yaml
 "dataset_name": "moral_scenarios"
-"description": "The following are multiple choice questions (with answers) about moral scenarios.\n\n"
+"description": "The following are multiple choice questions (with answers) about moral\
+  \ scenarios.\n\n"
+"group": "mmlu_humanities"
+"group_alias": "humanities"
 "include": "_default_template_yaml"
 "task": "mmlu_moral_scenarios"
+"task_alias": "moral_scenarios"
--- a/lm_eval/tasks/mmlu/default/mmlu_nutrition.yaml
+++ b/lm_eval/tasks/mmlu/default/mmlu_nutrition.yaml
 "dataset_name": "nutrition"
-"description": "The following are multiple choice questions (with answers) about nutrition.\n\n"
+"description": "The following are multiple choice questions (with answers) about nutrition.\n\
+  \n"
+"group": "mmlu_other"
+"group_alias": "other"
 "include": "_default_template_yaml"
 "task": "mmlu_nutrition"
+"task_alias": "nutrition"
--- a/lm_eval/tasks/mmlu/default/mmlu_philosophy.yaml
+++ b/lm_eval/tasks/mmlu/default/mmlu_philosophy.yaml
 "dataset_name": "philosophy"
-"description": "The following are multiple choice questions (with answers) about philosophy.\n\n"
+"description": "The following are multiple choice questions (with answers) about philosophy.\n\
+  \n"
+"group": "mmlu_humanities"
+"group_alias": "humanities"
 "include": "_default_template_yaml"
 "task": "mmlu_philosophy"
+"task_alias": "philosophy"
--- a/lm_eval/tasks/mmlu/default/mmlu_prehistory.yaml
+++ b/lm_eval/tasks/mmlu/default/mmlu_prehistory.yaml
 "dataset_name": "prehistory"
-"description": "The following are multiple choice questions (with answers) about prehistory.\n\n"
+"description": "The following are multiple choice questions (with answers) about prehistory.\n\
+  \n"
+"group": "mmlu_humanities"
+"group_alias": "humanities"
 "include": "_default_template_yaml"
 "task": "mmlu_prehistory"
+"task_alias": "prehistory"
--- a/lm_eval/tasks/mmlu/default/mmlu_professional_accounting.yaml
+++ b/lm_eval/tasks/mmlu/default/mmlu_professional_accounting.yaml
 "dataset_name": "professional_accounting"
-"description": "The following are multiple choice questions (with answers) about professional accounting.\n\n"
+"description": "The following are multiple choice questions (with answers) about professional\
+  \ accounting.\n\n"
+"group": "mmlu_other"
+"group_alias": "other"
 "include": "_default_template_yaml"
 "task": "mmlu_professional_accounting"
+"task_alias": "professional_accounting"