Commit 2184b8de authored by lintangsutawika's avatar lintangsutawika
Browse files

Merge branch 'cont-metrics' of https://github.com/EleutherAI/lm-evaluation-harness into alt_worlds

parents b1ba4e71 1522009c
dataset_name: high_school_macroeconomics "dataset_name": "high_school_macroeconomics"
description: 'The following are multiple choice questions (with answers) about high "description": "The following are multiple choice questions (with answers) about high\
school macroeconomics. \ school macroeconomics.\n\n"
"group": "mmlu_flan_cot_zeroshot_social_sciences"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
' "task": "mmlu_flan_cot_zeroshot_high_school_macroeconomics"
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_high_school_macroeconomics
dataset_name: high_school_mathematics "dataset_name": "high_school_mathematics"
description: 'The following are multiple choice questions (with answers) about high "description": "The following are multiple choice questions (with answers) about high\
school mathematics. \ school mathematics.\n\n"
"group": "mmlu_flan_cot_zeroshot_stem"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
' "task": "mmlu_flan_cot_zeroshot_high_school_mathematics"
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_high_school_mathematics
dataset_name: high_school_microeconomics "dataset_name": "high_school_microeconomics"
description: 'The following are multiple choice questions (with answers) about high "description": "The following are multiple choice questions (with answers) about high\
school microeconomics. \ school microeconomics.\n\n"
"group": "mmlu_flan_cot_zeroshot_social_sciences"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
' "task": "mmlu_flan_cot_zeroshot_high_school_microeconomics"
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_high_school_microeconomics
dataset_name: high_school_physics "dataset_name": "high_school_physics"
description: 'The following are multiple choice questions (with answers) about high "description": "The following are multiple choice questions (with answers) about high\
school physics. \ school physics.\n\n"
"group": "mmlu_flan_cot_zeroshot_stem"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
' "task": "mmlu_flan_cot_zeroshot_high_school_physics"
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_high_school_physics
dataset_name: high_school_psychology "dataset_name": "high_school_psychology"
description: 'The following are multiple choice questions (with answers) about high "description": "The following are multiple choice questions (with answers) about high\
school psychology. \ school psychology.\n\n"
"group": "mmlu_flan_cot_zeroshot_social_sciences"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
' "task": "mmlu_flan_cot_zeroshot_high_school_psychology"
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_high_school_psychology
dataset_name: high_school_statistics "dataset_name": "high_school_statistics"
description: 'The following are multiple choice questions (with answers) about high "description": "The following are multiple choice questions (with answers) about high\
school statistics. \ school statistics.\n\n"
"group": "mmlu_flan_cot_zeroshot_stem"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
' "task": "mmlu_flan_cot_zeroshot_high_school_statistics"
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_high_school_statistics
dataset_name: high_school_us_history "dataset_name": "high_school_us_history"
description: 'The following are multiple choice questions (with answers) about high "description": "The following are multiple choice questions (with answers) about high\
school us history. \ school us history.\n\n"
"group": "mmlu_flan_cot_zeroshot_humanities"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
' "task": "mmlu_flan_cot_zeroshot_high_school_us_history"
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_high_school_us_history
dataset_name: high_school_world_history "dataset_name": "high_school_world_history"
description: 'The following are multiple choice questions (with answers) about high "description": "The following are multiple choice questions (with answers) about high\
school world history. \ school world history.\n\n"
"group": "mmlu_flan_cot_zeroshot_humanities"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
' "task": "mmlu_flan_cot_zeroshot_high_school_world_history"
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_high_school_world_history
dataset_name: human_aging "dataset_name": "human_aging"
description: 'The following are multiple choice questions (with answers) about human "description": "The following are multiple choice questions (with answers) about human\
aging. \ aging.\n\n"
"group": "mmlu_flan_cot_zeroshot_other"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
' "task": "mmlu_flan_cot_zeroshot_human_aging"
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_human_aging
dataset_name: human_sexuality "dataset_name": "human_sexuality"
description: 'The following are multiple choice questions (with answers) about human "description": "The following are multiple choice questions (with answers) about human\
sexuality. \ sexuality.\n\n"
"group": "mmlu_flan_cot_zeroshot_social_sciences"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
' "task": "mmlu_flan_cot_zeroshot_human_sexuality"
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_human_sexuality
dataset_name: international_law "dataset_name": "international_law"
description: 'The following are multiple choice questions (with answers) about international "description": "The following are multiple choice questions (with answers) about international\
law. \ law.\n\n"
"group": "mmlu_flan_cot_zeroshot_humanities"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
' "task": "mmlu_flan_cot_zeroshot_international_law"
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_international_law
dataset_name: jurisprudence "dataset_name": "jurisprudence"
description: 'The following are multiple choice questions (with answers) about jurisprudence. "description": "The following are multiple choice questions (with answers) about jurisprudence.\n\
\n"
"group": "mmlu_flan_cot_zeroshot_humanities"
' "include": "_mmlu_flan_cot_zeroshot_template_yaml"
include: _mmlu_flan_generative_template_yaml "task": "mmlu_flan_cot_zeroshot_jurisprudence"
task: mmlu_flan_cot_zeroshot_jurisprudence
dataset_name: logical_fallacies "dataset_name": "logical_fallacies"
description: 'The following are multiple choice questions (with answers) about logical "description": "The following are multiple choice questions (with answers) about logical\
fallacies. \ fallacies.\n\n"
"group": "mmlu_flan_cot_zeroshot_humanities"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
' "task": "mmlu_flan_cot_zeroshot_logical_fallacies"
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_logical_fallacies
dataset_name: machine_learning "dataset_name": "machine_learning"
description: 'The following are multiple choice questions (with answers) about machine "description": "The following are multiple choice questions (with answers) about machine\
learning. \ learning.\n\n"
"group": "mmlu_flan_cot_zeroshot_stem"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
' "task": "mmlu_flan_cot_zeroshot_machine_learning"
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_machine_learning
dataset_name: management "dataset_name": "management"
description: 'The following are multiple choice questions (with answers) about management. "description": "The following are multiple choice questions (with answers) about management.\n\
\n"
"group": "mmlu_flan_cot_zeroshot_other"
' "include": "_mmlu_flan_cot_zeroshot_template_yaml"
include: _mmlu_flan_generative_template_yaml "task": "mmlu_flan_cot_zeroshot_management"
task: mmlu_flan_cot_zeroshot_management
dataset_name: marketing "dataset_name": "marketing"
description: 'The following are multiple choice questions (with answers) about marketing. "description": "The following are multiple choice questions (with answers) about marketing.\n\
\n"
"group": "mmlu_flan_cot_zeroshot_other"
' "include": "_mmlu_flan_cot_zeroshot_template_yaml"
include: _mmlu_flan_generative_template_yaml "task": "mmlu_flan_cot_zeroshot_marketing"
task: mmlu_flan_cot_zeroshot_marketing
dataset_name: medical_genetics "dataset_name": "medical_genetics"
description: 'The following are multiple choice questions (with answers) about medical "description": "The following are multiple choice questions (with answers) about medical\
genetics. \ genetics.\n\n"
"group": "mmlu_flan_cot_zeroshot_other"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
' "task": "mmlu_flan_cot_zeroshot_medical_genetics"
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_medical_genetics
dataset_name: miscellaneous "dataset_name": "miscellaneous"
description: 'The following are multiple choice questions (with answers) about miscellaneous. "description": "The following are multiple choice questions (with answers) about miscellaneous.\n\
\n"
"group": "mmlu_flan_cot_zeroshot_other"
' "include": "_mmlu_flan_cot_zeroshot_template_yaml"
include: _mmlu_flan_generative_template_yaml "task": "mmlu_flan_cot_zeroshot_miscellaneous"
task: mmlu_flan_cot_zeroshot_miscellaneous
dataset_name: moral_disputes "dataset_name": "moral_disputes"
description: 'The following are multiple choice questions (with answers) about moral "description": "The following are multiple choice questions (with answers) about moral\
disputes. \ disputes.\n\n"
"group": "mmlu_flan_cot_zeroshot_humanities"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
' "task": "mmlu_flan_cot_zeroshot_moral_disputes"
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_moral_disputes
dataset_name: moral_scenarios "dataset_name": "moral_scenarios"
description: 'The following are multiple choice questions (with answers) about moral "description": "The following are multiple choice questions (with answers) about moral\
scenarios. \ scenarios.\n\n"
"group": "mmlu_flan_cot_zeroshot_humanities"
"include": "_mmlu_flan_cot_zeroshot_template_yaml"
' "task": "mmlu_flan_cot_zeroshot_moral_scenarios"
include: _mmlu_flan_generative_template_yaml
task: mmlu_flan_cot_zeroshot_moral_scenarios
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment