Unverified commit 815f59e6, authored by Lintang Sutawika and committed by GitHub
Browse files

Merge pull request #922 from EleutherAI/mmlu_subgroups

[Refactor] Mmlu subgroups and weight avg
parents 3533e4b9 44124d95
# logical_fallacies: first of two back-to-back stanzas defining the same task keys.
# NOTE(review): presumably the pre-change side of a diff hunk — confirm.
dataset_name: logical_fallacies
description: 'The following are multiple choice questions (with answers) about logical
fallacies.
'
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_logical_fallacies
# logical_fallacies: second stanza. Compared with the one above, keys and values
# are double-quoted, a "group" key is added (mmlu_flan_cot_zeroshot_humanities),
# and "include" names _mmlu_flan_cot_zeroshot_template_yaml instead of
# _mmlu_flan_generative_template_yaml; "task" keeps the same value.
# NOTE(review): loaded as a single mapping, these keys would duplicate the
# stanza above — confirm only one revision is meant to be active.
"dataset_name": "logical_fallacies"
"description": "The following are multiple choice questions (with answers) about logical\
\ fallacies.\n\n"
"group": "mmlu_flan_cot_zeroshot_humanities"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
"task": "mmlu_flan_cot_zeroshot_logical_fallacies"
# machine_learning: first of two back-to-back stanzas defining the same task keys.
# NOTE(review): presumably the pre-change side of a diff hunk — confirm.
dataset_name: machine_learning
description: 'The following are multiple choice questions (with answers) about machine
learning.
'
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_machine_learning
# machine_learning: second stanza. Compared with the one above, keys and values
# are double-quoted, a "group" key is added (mmlu_flan_cot_zeroshot_stem),
# and "include" names _mmlu_flan_cot_zeroshot_template_yaml instead of
# _mmlu_flan_generative_template_yaml; "task" keeps the same value.
# NOTE(review): loaded as a single mapping, these keys would duplicate the
# stanza above — confirm only one revision is meant to be active.
"dataset_name": "machine_learning"
"description": "The following are multiple choice questions (with answers) about machine\
\ learning.\n\n"
"group": "mmlu_flan_cot_zeroshot_stem"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
"task": "mmlu_flan_cot_zeroshot_machine_learning"
# management: first of two back-to-back stanzas defining the same task keys.
# NOTE(review): presumably the pre-change side of a diff hunk — confirm.
dataset_name: management
description: 'The following are multiple choice questions (with answers) about management.
'
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_management
# management: second stanza. Compared with the one above, keys and values
# are double-quoted, a "group" key is added (mmlu_flan_cot_zeroshot_other),
# and "include" names _mmlu_flan_cot_zeroshot_template_yaml instead of
# _mmlu_flan_generative_template_yaml; "task" keeps the same value.
# NOTE(review): loaded as a single mapping, these keys would duplicate the
# stanza above — confirm only one revision is meant to be active.
"dataset_name": "management"
"description": "The following are multiple choice questions (with answers) about management.\n\
\n"
"group": "mmlu_flan_cot_zeroshot_other"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
"task": "mmlu_flan_cot_zeroshot_management"
# marketing: first of two back-to-back stanzas defining the same task keys.
# NOTE(review): presumably the pre-change side of a diff hunk — confirm.
dataset_name: marketing
description: 'The following are multiple choice questions (with answers) about marketing.
'
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_marketing
# marketing: second stanza. Compared with the one above, keys and values
# are double-quoted, a "group" key is added (mmlu_flan_cot_zeroshot_other),
# and "include" names _mmlu_flan_cot_zeroshot_template_yaml instead of
# _mmlu_flan_generative_template_yaml; "task" keeps the same value.
# NOTE(review): loaded as a single mapping, these keys would duplicate the
# stanza above — confirm only one revision is meant to be active.
"dataset_name": "marketing"
"description": "The following are multiple choice questions (with answers) about marketing.\n\
\n"
"group": "mmlu_flan_cot_zeroshot_other"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
"task": "mmlu_flan_cot_zeroshot_marketing"
# medical_genetics: first of two back-to-back stanzas defining the same task keys.
# NOTE(review): presumably the pre-change side of a diff hunk — confirm.
dataset_name: medical_genetics
description: 'The following are multiple choice questions (with answers) about medical
genetics.
'
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_medical_genetics
# medical_genetics: second stanza. Compared with the one above, keys and values
# are double-quoted, a "group" key is added (mmlu_flan_cot_zeroshot_other),
# and "include" names _mmlu_flan_cot_zeroshot_template_yaml instead of
# _mmlu_flan_generative_template_yaml; "task" keeps the same value.
# NOTE(review): loaded as a single mapping, these keys would duplicate the
# stanza above — confirm only one revision is meant to be active.
"dataset_name": "medical_genetics"
"description": "The following are multiple choice questions (with answers) about medical\
\ genetics.\n\n"
"group": "mmlu_flan_cot_zeroshot_other"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
"task": "mmlu_flan_cot_zeroshot_medical_genetics"
# miscellaneous: first of two back-to-back stanzas defining the same task keys.
# NOTE(review): presumably the pre-change side of a diff hunk — confirm.
dataset_name: miscellaneous
description: 'The following are multiple choice questions (with answers) about miscellaneous.
'
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_miscellaneous
# miscellaneous: second stanza. Compared with the one above, keys and values
# are double-quoted, a "group" key is added (mmlu_flan_cot_zeroshot_other),
# and "include" names _mmlu_flan_cot_zeroshot_template_yaml instead of
# _mmlu_flan_generative_template_yaml; "task" keeps the same value.
# NOTE(review): loaded as a single mapping, these keys would duplicate the
# stanza above — confirm only one revision is meant to be active.
"dataset_name": "miscellaneous"
"description": "The following are multiple choice questions (with answers) about miscellaneous.\n\
\n"
"group": "mmlu_flan_cot_zeroshot_other"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
"task": "mmlu_flan_cot_zeroshot_miscellaneous"
# moral_disputes: first of two back-to-back stanzas defining the same task keys.
# NOTE(review): presumably the pre-change side of a diff hunk — confirm.
dataset_name: moral_disputes
description: 'The following are multiple choice questions (with answers) about moral
disputes.
'
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_moral_disputes
# moral_disputes: second stanza. Compared with the one above, keys and values
# are double-quoted, a "group" key is added (mmlu_flan_cot_zeroshot_humanities),
# and "include" names _mmlu_flan_cot_zeroshot_template_yaml instead of
# _mmlu_flan_generative_template_yaml; "task" keeps the same value.
# NOTE(review): loaded as a single mapping, these keys would duplicate the
# stanza above — confirm only one revision is meant to be active.
"dataset_name": "moral_disputes"
"description": "The following are multiple choice questions (with answers) about moral\
\ disputes.\n\n"
"group": "mmlu_flan_cot_zeroshot_humanities"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
"task": "mmlu_flan_cot_zeroshot_moral_disputes"
# moral_scenarios: first of two back-to-back stanzas defining the same task keys.
# NOTE(review): presumably the pre-change side of a diff hunk — confirm.
dataset_name: moral_scenarios
description: 'The following are multiple choice questions (with answers) about moral
scenarios.
'
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_moral_scenarios
# moral_scenarios: second stanza. Compared with the one above, keys and values
# are double-quoted, a "group" key is added (mmlu_flan_cot_zeroshot_humanities),
# and "include" names _mmlu_flan_cot_zeroshot_template_yaml instead of
# _mmlu_flan_generative_template_yaml; "task" keeps the same value.
# NOTE(review): loaded as a single mapping, these keys would duplicate the
# stanza above — confirm only one revision is meant to be active.
"dataset_name": "moral_scenarios"
"description": "The following are multiple choice questions (with answers) about moral\
\ scenarios.\n\n"
"group": "mmlu_flan_cot_zeroshot_humanities"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
"task": "mmlu_flan_cot_zeroshot_moral_scenarios"
# nutrition: first of two back-to-back stanzas defining the same task keys.
# NOTE(review): presumably the pre-change side of a diff hunk — confirm.
dataset_name: nutrition
description: 'The following are multiple choice questions (with answers) about nutrition.
'
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_nutrition
# nutrition: second stanza. Compared with the one above, keys and values
# are double-quoted, a "group" key is added (mmlu_flan_cot_zeroshot_other),
# and "include" names _mmlu_flan_cot_zeroshot_template_yaml instead of
# _mmlu_flan_generative_template_yaml; "task" keeps the same value.
# NOTE(review): loaded as a single mapping, these keys would duplicate the
# stanza above — confirm only one revision is meant to be active.
"dataset_name": "nutrition"
"description": "The following are multiple choice questions (with answers) about nutrition.\n\
\n"
"group": "mmlu_flan_cot_zeroshot_other"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
"task": "mmlu_flan_cot_zeroshot_nutrition"
# philosophy: first of two back-to-back stanzas defining the same task keys.
# NOTE(review): presumably the pre-change side of a diff hunk — confirm.
dataset_name: philosophy
description: 'The following are multiple choice questions (with answers) about philosophy.
'
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_philosophy
# philosophy: second stanza. Compared with the one above, keys and values
# are double-quoted, a "group" key is added (mmlu_flan_cot_zeroshot_humanities),
# and "include" names _mmlu_flan_cot_zeroshot_template_yaml instead of
# _mmlu_flan_generative_template_yaml; "task" keeps the same value.
# NOTE(review): loaded as a single mapping, these keys would duplicate the
# stanza above — confirm only one revision is meant to be active.
"dataset_name": "philosophy"
"description": "The following are multiple choice questions (with answers) about philosophy.\n\
\n"
"group": "mmlu_flan_cot_zeroshot_humanities"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
"task": "mmlu_flan_cot_zeroshot_philosophy"
# prehistory: first of two back-to-back stanzas defining the same task keys.
# NOTE(review): presumably the pre-change side of a diff hunk — confirm.
dataset_name: prehistory
description: 'The following are multiple choice questions (with answers) about prehistory.
'
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_prehistory
# prehistory: second stanza. Compared with the one above, keys and values
# are double-quoted, a "group" key is added (mmlu_flan_cot_zeroshot_humanities),
# and "include" names _mmlu_flan_cot_zeroshot_template_yaml instead of
# _mmlu_flan_generative_template_yaml; "task" keeps the same value.
# NOTE(review): loaded as a single mapping, these keys would duplicate the
# stanza above — confirm only one revision is meant to be active.
"dataset_name": "prehistory"
"description": "The following are multiple choice questions (with answers) about prehistory.\n\
\n"
"group": "mmlu_flan_cot_zeroshot_humanities"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
"task": "mmlu_flan_cot_zeroshot_prehistory"
# professional_accounting: first of two back-to-back stanzas defining the same task keys.
# NOTE(review): presumably the pre-change side of a diff hunk — confirm.
dataset_name: professional_accounting
description: 'The following are multiple choice questions (with answers) about professional
accounting.
'
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_professional_accounting
# professional_accounting: second stanza. Compared with the one above, keys and values
# are double-quoted, a "group" key is added (mmlu_flan_cot_zeroshot_other),
# and "include" names _mmlu_flan_cot_zeroshot_template_yaml instead of
# _mmlu_flan_generative_template_yaml; "task" keeps the same value.
# NOTE(review): loaded as a single mapping, these keys would duplicate the
# stanza above — confirm only one revision is meant to be active.
"dataset_name": "professional_accounting"
"description": "The following are multiple choice questions (with answers) about professional\
\ accounting.\n\n"
"group": "mmlu_flan_cot_zeroshot_other"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
"task": "mmlu_flan_cot_zeroshot_professional_accounting"
# professional_law: first of two back-to-back stanzas defining the same task keys.
# NOTE(review): presumably the pre-change side of a diff hunk — confirm.
dataset_name: professional_law
description: 'The following are multiple choice questions (with answers) about professional
law.
'
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_professional_law
# professional_law: second stanza. Compared with the one above, keys and values
# are double-quoted, a "group" key is added (mmlu_flan_cot_zeroshot_humanities),
# and "include" names _mmlu_flan_cot_zeroshot_template_yaml instead of
# _mmlu_flan_generative_template_yaml; "task" keeps the same value.
# NOTE(review): loaded as a single mapping, these keys would duplicate the
# stanza above — confirm only one revision is meant to be active.
"dataset_name": "professional_law"
"description": "The following are multiple choice questions (with answers) about professional\
\ law.\n\n"
"group": "mmlu_flan_cot_zeroshot_humanities"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
"task": "mmlu_flan_cot_zeroshot_professional_law"
# professional_medicine: first of two back-to-back stanzas defining the same task keys.
# NOTE(review): presumably the pre-change side of a diff hunk — confirm.
dataset_name: professional_medicine
description: 'The following are multiple choice questions (with answers) about professional
medicine.
'
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_professional_medicine
# professional_medicine: second stanza. Compared with the one above, keys and values
# are double-quoted, a "group" key is added (mmlu_flan_cot_zeroshot_other),
# and "include" names _mmlu_flan_cot_zeroshot_template_yaml instead of
# _mmlu_flan_generative_template_yaml; "task" keeps the same value.
# NOTE(review): loaded as a single mapping, these keys would duplicate the
# stanza above — confirm only one revision is meant to be active.
"dataset_name": "professional_medicine"
"description": "The following are multiple choice questions (with answers) about professional\
\ medicine.\n\n"
"group": "mmlu_flan_cot_zeroshot_other"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
"task": "mmlu_flan_cot_zeroshot_professional_medicine"
# professional_psychology: first of two back-to-back stanzas defining the same task keys.
# NOTE(review): presumably the pre-change side of a diff hunk — confirm.
dataset_name: professional_psychology
description: 'The following are multiple choice questions (with answers) about professional
psychology.
'
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_professional_psychology
# professional_psychology: second stanza. Compared with the one above, keys and values
# are double-quoted, a "group" key is added (mmlu_flan_cot_zeroshot_social_sciences),
# and "include" names _mmlu_flan_cot_zeroshot_template_yaml instead of
# _mmlu_flan_generative_template_yaml; "task" keeps the same value.
# NOTE(review): loaded as a single mapping, these keys would duplicate the
# stanza above — confirm only one revision is meant to be active.
"dataset_name": "professional_psychology"
"description": "The following are multiple choice questions (with answers) about professional\
\ psychology.\n\n"
"group": "mmlu_flan_cot_zeroshot_social_sciences"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
"task": "mmlu_flan_cot_zeroshot_professional_psychology"
# public_relations: first of two back-to-back stanzas defining the same task keys.
# NOTE(review): presumably the pre-change side of a diff hunk — confirm.
dataset_name: public_relations
description: 'The following are multiple choice questions (with answers) about public
relations.
'
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_public_relations
# public_relations: second stanza. Compared with the one above, keys and values
# are double-quoted, a "group" key is added (mmlu_flan_cot_zeroshot_social_sciences),
# and "include" names _mmlu_flan_cot_zeroshot_template_yaml instead of
# _mmlu_flan_generative_template_yaml; "task" keeps the same value.
# NOTE(review): loaded as a single mapping, these keys would duplicate the
# stanza above — confirm only one revision is meant to be active.
"dataset_name": "public_relations"
"description": "The following are multiple choice questions (with answers) about public\
\ relations.\n\n"
"group": "mmlu_flan_cot_zeroshot_social_sciences"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
"task": "mmlu_flan_cot_zeroshot_public_relations"
# security_studies: first of two back-to-back stanzas defining the same task keys.
# NOTE(review): presumably the pre-change side of a diff hunk — confirm.
dataset_name: security_studies
description: 'The following are multiple choice questions (with answers) about security
studies.
'
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_security_studies
# security_studies: second stanza. Compared with the one above, keys and values
# are double-quoted, a "group" key is added (mmlu_flan_cot_zeroshot_social_sciences),
# and "include" names _mmlu_flan_cot_zeroshot_template_yaml instead of
# _mmlu_flan_generative_template_yaml; "task" keeps the same value.
# NOTE(review): loaded as a single mapping, these keys would duplicate the
# stanza above — confirm only one revision is meant to be active.
"dataset_name": "security_studies"
"description": "The following are multiple choice questions (with answers) about security\
\ studies.\n\n"
"group": "mmlu_flan_cot_zeroshot_social_sciences"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
"task": "mmlu_flan_cot_zeroshot_security_studies"
# sociology: first of two back-to-back stanzas defining the same task keys.
# NOTE(review): presumably the pre-change side of a diff hunk — confirm.
dataset_name: sociology
description: 'The following are multiple choice questions (with answers) about sociology.
'
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_sociology
# sociology: second stanza. Compared with the one above, keys and values
# are double-quoted, a "group" key is added (mmlu_flan_cot_zeroshot_social_sciences),
# and "include" names _mmlu_flan_cot_zeroshot_template_yaml instead of
# _mmlu_flan_generative_template_yaml; "task" keeps the same value.
# NOTE(review): loaded as a single mapping, these keys would duplicate the
# stanza above — confirm only one revision is meant to be active.
"dataset_name": "sociology"
"description": "The following are multiple choice questions (with answers) about sociology.\n\
\n"
"group": "mmlu_flan_cot_zeroshot_social_sciences"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
"task": "mmlu_flan_cot_zeroshot_sociology"
# us_foreign_policy: first of two back-to-back stanzas defining the same task keys.
# NOTE(review): presumably the pre-change side of a diff hunk — confirm.
dataset_name: us_foreign_policy
description: 'The following are multiple choice questions (with answers) about us
foreign policy.
'
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_us_foreign_policy
# us_foreign_policy: second stanza. Compared with the one above, keys and values
# are double-quoted, a "group" key is added (mmlu_flan_cot_zeroshot_social_sciences),
# and "include" names _mmlu_flan_cot_zeroshot_template_yaml instead of
# _mmlu_flan_generative_template_yaml; "task" keeps the same value.
# NOTE(review): loaded as a single mapping, these keys would duplicate the
# stanza above — confirm only one revision is meant to be active.
"dataset_name": "us_foreign_policy"
"description": "The following are multiple choice questions (with answers) about us\
\ foreign policy.\n\n"
"group": "mmlu_flan_cot_zeroshot_social_sciences"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
"task": "mmlu_flan_cot_zeroshot_us_foreign_policy"
# virology: first of two back-to-back stanzas defining the same task keys.
# NOTE(review): presumably the pre-change side of a diff hunk — confirm.
dataset_name: virology
description: 'The following are multiple choice questions (with answers) about virology.
'
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_virology
# virology: second stanza. Compared with the one above, keys and values
# are double-quoted, a "group" key is added (mmlu_flan_cot_zeroshot_other),
# and "include" names _mmlu_flan_cot_zeroshot_template_yaml instead of
# _mmlu_flan_generative_template_yaml; "task" keeps the same value.
# NOTE(review): loaded as a single mapping, these keys would duplicate the
# stanza above — confirm only one revision is meant to be active.
"dataset_name": "virology"
"description": "The following are multiple choice questions (with answers) about virology.\n\
\n"
"group": "mmlu_flan_cot_zeroshot_other"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
"task": "mmlu_flan_cot_zeroshot_virology"
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment