Unverified commit 815f59e6, authored by Lintang Sutawika and committed by GitHub
Browse files

Merge pull request #922 from EleutherAI/mmlu_subgroups

[Refactor] Mmlu subgroups and weight avg
parents 3533e4b9 44124d95
"dataset_name": "international_law"
"description": "The following are multiple choice questions (with answers) about international law.\n\n"
"description": "The following are multiple choice questions (with answers) about international\
\ law.\n\n"
"group": "mmlu_humanities"
"group_alias": "humanities"
"include": "_default_template_yaml"
"task": "mmlu_international_law"
"task_alias": "international_law"
"dataset_name": "jurisprudence"
"description": "The following are multiple choice questions (with answers) about jurisprudence.\n\n"
"description": "The following are multiple choice questions (with answers) about jurisprudence.\n\
\n"
"group": "mmlu_humanities"
"group_alias": "humanities"
"include": "_default_template_yaml"
"task": "mmlu_jurisprudence"
"task_alias": "jurisprudence"
"dataset_name": "logical_fallacies"
"description": "The following are multiple choice questions (with answers) about logical fallacies.\n\n"
"description": "The following are multiple choice questions (with answers) about logical\
\ fallacies.\n\n"
"group": "mmlu_humanities"
"group_alias": "humanities"
"include": "_default_template_yaml"
"task": "mmlu_logical_fallacies"
"task_alias": "logical_fallacies"
"dataset_name": "machine_learning"
"description": "The following are multiple choice questions (with answers) about machine learning.\n\n"
"description": "The following are multiple choice questions (with answers) about machine\
\ learning.\n\n"
"group": "mmlu_stem"
"group_alias": "stem"
"include": "_default_template_yaml"
"task": "mmlu_machine_learning"
"task_alias": "machine_learning"
"dataset_name": "management"
"description": "The following are multiple choice questions (with answers) about management.\n\n"
"description": "The following are multiple choice questions (with answers) about management.\n\
\n"
"group": "mmlu_other"
"group_alias": "other"
"include": "_default_template_yaml"
"task": "mmlu_management"
"task_alias": "management"
"dataset_name": "marketing"
"description": "The following are multiple choice questions (with answers) about marketing.\n\n"
"description": "The following are multiple choice questions (with answers) about marketing.\n\
\n"
"group": "mmlu_other"
"group_alias": "other"
"include": "_default_template_yaml"
"task": "mmlu_marketing"
"task_alias": "marketing"
"dataset_name": "medical_genetics"
"description": "The following are multiple choice questions (with answers) about medical genetics.\n\n"
"description": "The following are multiple choice questions (with answers) about medical\
\ genetics.\n\n"
"group": "mmlu_other"
"group_alias": "other"
"include": "_default_template_yaml"
"task": "mmlu_medical_genetics"
"task_alias": "medical_genetics"
"dataset_name": "miscellaneous"
"description": "The following are multiple choice questions (with answers) about miscellaneous.\n\n"
"description": "The following are multiple choice questions (with answers) about miscellaneous.\n\
\n"
"group": "mmlu_other"
"group_alias": "other"
"include": "_default_template_yaml"
"task": "mmlu_miscellaneous"
"task_alias": "miscellaneous"
"dataset_name": "moral_disputes"
"description": "The following are multiple choice questions (with answers) about moral disputes.\n\n"
"description": "The following are multiple choice questions (with answers) about moral\
\ disputes.\n\n"
"group": "mmlu_humanities"
"group_alias": "humanities"
"include": "_default_template_yaml"
"task": "mmlu_moral_disputes"
"task_alias": "moral_disputes"
"dataset_name": "moral_scenarios"
"description": "The following are multiple choice questions (with answers) about moral scenarios.\n\n"
"description": "The following are multiple choice questions (with answers) about moral\
\ scenarios.\n\n"
"group": "mmlu_humanities"
"group_alias": "humanities"
"include": "_default_template_yaml"
"task": "mmlu_moral_scenarios"
"task_alias": "moral_scenarios"
"dataset_name": "nutrition"
"description": "The following are multiple choice questions (with answers) about nutrition.\n\n"
"description": "The following are multiple choice questions (with answers) about nutrition.\n\
\n"
"group": "mmlu_other"
"group_alias": "other"
"include": "_default_template_yaml"
"task": "mmlu_nutrition"
"task_alias": "nutrition"
"dataset_name": "philosophy"
"description": "The following are multiple choice questions (with answers) about philosophy.\n\n"
"description": "The following are multiple choice questions (with answers) about philosophy.\n\
\n"
"group": "mmlu_humanities"
"group_alias": "humanities"
"include": "_default_template_yaml"
"task": "mmlu_philosophy"
"task_alias": "philosophy"
"dataset_name": "prehistory"
"description": "The following are multiple choice questions (with answers) about prehistory.\n\n"
"description": "The following are multiple choice questions (with answers) about prehistory.\n\
\n"
"group": "mmlu_humanities"
"group_alias": "humanities"
"include": "_default_template_yaml"
"task": "mmlu_prehistory"
"task_alias": "prehistory"
"dataset_name": "professional_accounting"
"description": "The following are multiple choice questions (with answers) about professional accounting.\n\n"
"description": "The following are multiple choice questions (with answers) about professional\
\ accounting.\n\n"
"group": "mmlu_other"
"group_alias": "other"
"include": "_default_template_yaml"
"task": "mmlu_professional_accounting"
"task_alias": "professional_accounting"
"dataset_name": "professional_law"
"description": "The following are multiple choice questions (with answers) about professional law.\n\n"
"description": "The following are multiple choice questions (with answers) about professional\
\ law.\n\n"
"group": "mmlu_humanities"
"group_alias": "humanities"
"include": "_default_template_yaml"
"task": "mmlu_professional_law"
"task_alias": "professional_law"
"dataset_name": "professional_medicine"
"description": "The following are multiple choice questions (with answers) about professional medicine.\n\n"
"description": "The following are multiple choice questions (with answers) about professional\
\ medicine.\n\n"
"group": "mmlu_other"
"group_alias": "other"
"include": "_default_template_yaml"
"task": "mmlu_professional_medicine"
"task_alias": "professional_medicine"
"dataset_name": "professional_psychology"
"description": "The following are multiple choice questions (with answers) about professional psychology.\n\n"
"description": "The following are multiple choice questions (with answers) about professional\
\ psychology.\n\n"
"group": "mmlu_social_sciences"
"group_alias": "social_sciences"
"include": "_default_template_yaml"
"task": "mmlu_professional_psychology"
"task_alias": "professional_psychology"
"dataset_name": "public_relations"
"description": "The following are multiple choice questions (with answers) about public relations.\n\n"
"description": "The following are multiple choice questions (with answers) about public\
\ relations.\n\n"
"group": "mmlu_social_sciences"
"group_alias": "social_sciences"
"include": "_default_template_yaml"
"task": "mmlu_public_relations"
"task_alias": "public_relations"
"dataset_name": "security_studies"
"description": "The following are multiple choice questions (with answers) about security studies.\n\n"
"description": "The following are multiple choice questions (with answers) about security\
\ studies.\n\n"
"group": "mmlu_social_sciences"
"group_alias": "social_sciences"
"include": "_default_template_yaml"
"task": "mmlu_security_studies"
"task_alias": "security_studies"
"dataset_name": "sociology"
"description": "The following are multiple choice questions (with answers) about sociology.\n\n"
"description": "The following are multiple choice questions (with answers) about sociology.\n\
\n"
"group": "mmlu_social_sciences"
"group_alias": "social_sciences"
"include": "_default_template_yaml"
"task": "mmlu_sociology"
"task_alias": "sociology"
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment