Commit 89b6bdb3 authored by Baber
Browse files

Merge branch 'main' into ai2d

parents 59053d58 144a1e58
# Generated by _generate_configs.py
include: _ar_template_yaml
process_docs: !function utils.process_moral_disputes
tag: global_mmlu_full_ar_humanities_tasks
task: global_mmlu_full_ar_moral_disputes
# Generated by _generate_configs.py
include: _ar_template_yaml
process_docs: !function utils.process_moral_scenarios
tag: global_mmlu_full_ar_humanities_tasks
task: global_mmlu_full_ar_moral_scenarios
# Generated by _generate_configs.py
include: _ar_template_yaml
process_docs: !function utils.process_nutrition
tag: global_mmlu_full_ar_other_tasks
task: global_mmlu_full_ar_nutrition
# Generated by _generate_configs.py
include: _ar_template_yaml
process_docs: !function utils.process_philosophy
tag: global_mmlu_full_ar_humanities_tasks
task: global_mmlu_full_ar_philosophy
# Generated by _generate_configs.py
include: _ar_template_yaml
process_docs: !function utils.process_prehistory
tag: global_mmlu_full_ar_humanities_tasks
task: global_mmlu_full_ar_prehistory
# Generated by _generate_configs.py
include: _ar_template_yaml
process_docs: !function utils.process_professional_accounting
tag: global_mmlu_full_ar_other_tasks
task: global_mmlu_full_ar_professional_accounting
# Generated by _generate_configs.py
include: _ar_template_yaml
process_docs: !function utils.process_professional_law
tag: global_mmlu_full_ar_humanities_tasks
task: global_mmlu_full_ar_professional_law
# Generated by _generate_configs.py
include: _ar_template_yaml
process_docs: !function utils.process_professional_medicine
tag: global_mmlu_full_ar_other_tasks
task: global_mmlu_full_ar_professional_medicine
# Generated by _generate_configs.py
include: _ar_template_yaml
process_docs: !function utils.process_professional_psychology
tag: global_mmlu_full_ar_social_sciences_tasks
task: global_mmlu_full_ar_professional_psychology
# Generated by _generate_configs.py
include: _ar_template_yaml
process_docs: !function utils.process_public_relations
tag: global_mmlu_full_ar_social_sciences_tasks
task: global_mmlu_full_ar_public_relations
# Generated by _generate_configs.py
include: _ar_template_yaml
process_docs: !function utils.process_security_studies
tag: global_mmlu_full_ar_social_sciences_tasks
task: global_mmlu_full_ar_security_studies
# Generated by _generate_configs.py
include: _ar_template_yaml
process_docs: !function utils.process_sociology
tag: global_mmlu_full_ar_social_sciences_tasks
task: global_mmlu_full_ar_sociology
# Generated by _generate_configs.py
include: _ar_template_yaml
process_docs: !function utils.process_us_foreign_policy
tag: global_mmlu_full_ar_social_sciences_tasks
task: global_mmlu_full_ar_us_foreign_policy
# Generated by _generate_configs.py
include: _ar_template_yaml
process_docs: !function utils.process_virology
tag: global_mmlu_full_ar_other_tasks
task: global_mmlu_full_ar_virology
# Generated by _generate_configs.py
include: _ar_template_yaml
process_docs: !function utils.process_world_religions
tag: global_mmlu_full_ar_humanities_tasks
task: global_mmlu_full_ar_world_religions
from functools import partial
# Subject identifiers, one per generated ``process_<subject>`` filter below.
# Order is alphabetical; keep entries spelled exactly as they appear in the
# dataset's "subject" field, since they are compared with ``==``.
SUBJECTS = [
    "abstract_algebra",
    "anatomy",
    "astronomy",
    "business_ethics",
    "clinical_knowledge",
    "college_biology",
    "college_chemistry",
    "college_computer_science",
    "college_mathematics",
    "college_medicine",
    "college_physics",
    "computer_security",
    "conceptual_physics",
    "econometrics",
    "electrical_engineering",
    "elementary_mathematics",
    "formal_logic",
    "global_facts",
    "high_school_biology",
    "high_school_chemistry",
    "high_school_computer_science",
    "high_school_european_history",
    "high_school_geography",
    "high_school_government_and_politics",
    "high_school_macroeconomics",
    "high_school_mathematics",
    "high_school_microeconomics",
    "high_school_physics",
    "high_school_psychology",
    "high_school_statistics",
    "high_school_us_history",
    "high_school_world_history",
    "human_aging",
    "human_sexuality",
    "international_law",
    "jurisprudence",
    "logical_fallacies",
    "machine_learning",
    "management",
    "marketing",
    "medical_genetics",
    "miscellaneous",
    "moral_disputes",
    "moral_scenarios",
    "nutrition",
    "philosophy",
    "prehistory",
    "professional_accounting",
    "professional_law",
    "professional_medicine",
    "professional_psychology",
    "public_relations",
    "security_studies",
    "sociology",
    "us_foreign_policy",
    "virology",
    "world_religions",
]
def process_docs(dataset, subject):
    """Keep only the rows of ``dataset`` that belong to ``subject``.

    Args:
        dataset: Object exposing ``filter(predicate)``; presumably a Hugging
            Face ``datasets.Dataset`` -- confirm against the caller. Each row
            passed to the predicate must support ``row["subject"]``.
        subject: Value the row's ``"subject"`` field must equal to be kept.

    Returns:
        Whatever ``dataset.filter`` returns for the equality predicate.
    """
    return dataset.filter(lambda doc: doc["subject"] == subject)
# One pre-bound filter per subject, keyed "process_<subject>".
process_functions = {
    "process_" + name: partial(process_docs, subject=name) for name in SUBJECTS
}
# Publish every entry as a module-level attribute so it can be looked up by
# name; the task YAML configs reference names such as
# ``utils.process_moral_disputes`` (presumably this module -- confirm).
globals().update(process_functions)
# Shared settings for the `bn` Global-MMLU tasks: dataset location, splits,
# prompt layout and metric.
dataset_path: CohereForAI/Global-MMLU
dataset_name: bn
test_split: test
fewshot_split: dev
fewshot_config:
  # Nested under fewshot_config; at column 0 it would parse as a top-level key.
  sampler: first_n
output_type: multiple_choice
# Question followed by the four lettered options and an "Answer:" cue.
doc_to_text: "{{question.strip()}}\nA. {{option_a}}\nB. {{option_b}}\nC. {{option_c}}\nD. {{option_d}}\nAnswer:"
doc_to_choice: ["A", "B", "C", "D"]
doc_to_target: answer
metric_list:
  # All three keys belong to the single list entry.
  - metric: acc
    aggregation: mean
    higher_is_better: true
metadata:
  version: 0.0
# Top-level `bn` group: aggregates the four category sub-groups listed below.
group: global_mmlu_full_bn
task:
  - global_mmlu_full_bn_stem
  - global_mmlu_full_bn_other
  - global_mmlu_full_bn_social_sciences
  - global_mmlu_full_bn_humanities
aggregate_metric_list:
  # weight_by_size is part of the `acc` entry, not a top-level key.
  - metric: acc
    weight_by_size: true
metadata:
  version: 0.0
# Humanities sub-group: collects every task tagged
# `global_mmlu_full_bn_humanities_tasks`.
group: global_mmlu_full_bn_humanities
task:
  - global_mmlu_full_bn_humanities_tasks
aggregate_metric_list:
  # weight_by_size is part of the `acc` entry, not a top-level key.
  - metric: acc
    weight_by_size: true
metadata:
  version: 0.0
# "Other" sub-group: collects every task tagged
# `global_mmlu_full_bn_other_tasks`.
group: global_mmlu_full_bn_other
task:
  - global_mmlu_full_bn_other_tasks
aggregate_metric_list:
  # weight_by_size is part of the `acc` entry, not a top-level key.
  - metric: acc
    weight_by_size: true
metadata:
  version: 0.0
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment