Unverified commit 5c006ed4, authored by Minho Ryu and committed by GitHub
Browse files

separate category for `global_mmlu` (#2652)

* separate category

* set version 0.0

* apply precommit
parent 370e2f9e
# Group definition collecting the six per-category global_mmlu_de subtasks.
group: global_mmlu_de
task:
  - global_mmlu_de_business
  - global_mmlu_de_humanities
  - global_mmlu_de_medical
  - global_mmlu_de_other
  - global_mmlu_de_stem
  - global_mmlu_de_social_sciences
aggregate_metric_list:
  # `weight_by_size` is an attribute of the `acc` entry, so it must be nested
  # under the same list item rather than sit at the top level.
  # NOTE(review): presumably this makes the group score a size-weighted mean
  # of the subtask scores -- confirm against the harness documentation.
  - metric: acc
    weight_by_size: true
metadata:
  version: 0.0
# Generated by _generate_configs.py
task: global_mmlu_de_business
# Remaining settings are pulled in from the _de_template_yaml file.
include: _de_template_yaml
# Document filter resolved by name (process_business) from the utils module.
process_docs: !function utils.process_business
# Generated by _generate_configs.py
task: global_mmlu_de_humanities
# Remaining settings are pulled in from the _de_template_yaml file.
include: _de_template_yaml
# Document filter resolved by name (process_humanities) from the utils module.
process_docs: !function utils.process_humanities
# Generated by _generate_configs.py
task: global_mmlu_de_medical
# Remaining settings are pulled in from the _de_template_yaml file.
include: _de_template_yaml
# Document filter resolved by name (process_medical) from the utils module.
process_docs: !function utils.process_medical
# Generated by _generate_configs.py
task: global_mmlu_de_other
# Remaining settings are pulled in from the _de_template_yaml file.
include: _de_template_yaml
# Document filter resolved by name (process_other) from the utils module.
process_docs: !function utils.process_other
# Generated by _generate_configs.py
task: global_mmlu_de_social_sciences
# Remaining settings are pulled in from the _de_template_yaml file.
include: _de_template_yaml
# Document filter resolved by name (process_social_sciences) from the utils module.
process_docs: !function utils.process_social_sciences
# Generated by _generate_configs.py
task: global_mmlu_de_stem
# Remaining settings are pulled in from the _de_template_yaml file.
include: _de_template_yaml
# Document filter resolved by name (process_stem) from the utils module.
process_docs: !function utils.process_stem
from functools import partial
# Category labels compared against each row's "subject_category" field.
CATEGORIES = ["Business", "Humanities", "Medical", "Other", "STEM", "Social Sciences"]


def process_docs(dataset, category):
    """Return the rows of ``dataset`` whose ``subject_category`` equals ``category``.

    Args:
        dataset: Any object exposing ``filter(predicate)``; the predicate is
            called with one row and indexes it by ``"subject_category"``.
        category: Label to keep; compared with ``==`` (exact, case-sensitive).

    Returns:
        Whatever ``dataset.filter`` returns for that predicate.
    """
    return dataset.filter(lambda x: x["subject_category"] == category)


# One single-argument filter per category, keyed by a snake_case name:
# "Social Sciences" -> "process_social_sciences", "STEM" -> "process_stem".
process_functions = {
    f"process_{category.lower().replace(' ', '_')}": partial(
        process_docs, category=category
    )
    for category in CATEGORIES
}

# Publish each generated filter as a module-level attribute so it can be
# looked up by name on this module (e.g. ``utils.process_business``).
globals().update(process_functions)
# Shared task settings for the `en` configuration of the dataset.
# NOTE(review): presumably this is the `_en_template_yaml` file that the
# global_mmlu_en_* task configs include -- confirm the file name.
dataset_path: CohereForAI/Global-MMLU-Lite
dataset_name: en
test_split: test
fewshot_split: dev
fewshot_config:
  sampler: default
output_type: multiple_choice
# Prompt layout: stripped question, the four lettered options, then "Answer:".
doc_to_text: "{{question.strip()}}\nA. {{option_a}}\nB. {{option_b}}\nC. {{option_c}}\nD. {{option_d}}\nAnswer:"
doc_to_choice: ["A", "B", "C", "D"]
doc_to_target: answer
metric_list:
  # `aggregation` and `higher_is_better` describe the `acc` entry, so they are
  # nested under the same list item.
  - metric: acc
    aggregation: mean
    higher_is_better: true
metadata:
  version: 0.0
# Group definition collecting the six per-category global_mmlu_en subtasks.
group: global_mmlu_en
task:
  - global_mmlu_en_business
  - global_mmlu_en_humanities
  - global_mmlu_en_medical
  - global_mmlu_en_other
  - global_mmlu_en_stem
  - global_mmlu_en_social_sciences
aggregate_metric_list:
  # `weight_by_size` is an attribute of the `acc` entry, so it must be nested
  # under the same list item rather than sit at the top level.
  # NOTE(review): presumably this makes the group score a size-weighted mean
  # of the subtask scores -- confirm against the harness documentation.
  - metric: acc
    weight_by_size: true
metadata:
  version: 0.0
# Generated by _generate_configs.py
task: global_mmlu_en_business
# Remaining settings are pulled in from the _en_template_yaml file.
include: _en_template_yaml
# Document filter resolved by name (process_business) from the utils module.
process_docs: !function utils.process_business
# Generated by _generate_configs.py
task: global_mmlu_en_humanities
# Remaining settings are pulled in from the _en_template_yaml file.
include: _en_template_yaml
# Document filter resolved by name (process_humanities) from the utils module.
process_docs: !function utils.process_humanities
# Generated by _generate_configs.py
task: global_mmlu_en_medical
# Remaining settings are pulled in from the _en_template_yaml file.
include: _en_template_yaml
# Document filter resolved by name (process_medical) from the utils module.
process_docs: !function utils.process_medical
# Generated by _generate_configs.py
task: global_mmlu_en_other
# Remaining settings are pulled in from the _en_template_yaml file.
include: _en_template_yaml
# Document filter resolved by name (process_other) from the utils module.
process_docs: !function utils.process_other
# Generated by _generate_configs.py
task: global_mmlu_en_social_sciences
# Remaining settings are pulled in from the _en_template_yaml file.
include: _en_template_yaml
# Document filter resolved by name (process_social_sciences) from the utils module.
process_docs: !function utils.process_social_sciences
# Generated by _generate_configs.py
task: global_mmlu_en_stem
# Remaining settings are pulled in from the _en_template_yaml file.
include: _en_template_yaml
# Document filter resolved by name (process_stem) from the utils module.
process_docs: !function utils.process_stem
from functools import partial
# Category labels compared against each row's "subject_category" field.
CATEGORIES = ["Business", "Humanities", "Medical", "Other", "STEM", "Social Sciences"]


def process_docs(dataset, category):
    """Filter ``dataset`` down to the rows belonging to one subject category.

    Args:
        dataset: Any object exposing ``filter(predicate)``; the predicate is
            called with one row and reads its ``"subject_category"`` entry.
        category: Label to keep; matched with ``==`` (exact, case-sensitive).

    Returns:
        The result of ``dataset.filter`` for that predicate.
    """
    return dataset.filter(lambda x: x["subject_category"] == category)


# Map "process_<snake_case category>" to process_docs with the category
# pre-bound, e.g. "Social Sciences" -> "process_social_sciences".
process_functions = {
    f"process_{category.lower().replace(' ', '_')}": partial(
        process_docs, category=category
    )
    for category in CATEGORIES
}

# Expose every generated filter as a module attribute so it can be fetched
# by name from this module (e.g. ``utils.process_stem``).
globals().update(process_functions)
# Shared task settings for the `es` configuration of the dataset.
# NOTE(review): presumably this is the `_es_template_yaml` file that the
# global_mmlu_es_* task configs include -- confirm the file name.
dataset_path: CohereForAI/Global-MMLU-Lite
dataset_name: es
test_split: test
fewshot_split: dev
fewshot_config:
  sampler: default
output_type: multiple_choice
# Prompt layout: stripped question, the four lettered options, then "Answer:".
doc_to_text: "{{question.strip()}}\nA. {{option_a}}\nB. {{option_b}}\nC. {{option_c}}\nD. {{option_d}}\nAnswer:"
doc_to_choice: ["A", "B", "C", "D"]
doc_to_target: answer
metric_list:
  # `aggregation` and `higher_is_better` describe the `acc` entry, so they are
  # nested under the same list item.
  - metric: acc
    aggregation: mean
    higher_is_better: true
metadata:
  version: 0.0
# Group definition collecting the six per-category global_mmlu_es subtasks.
group: global_mmlu_es
task:
  - global_mmlu_es_business
  - global_mmlu_es_humanities
  - global_mmlu_es_medical
  - global_mmlu_es_other
  - global_mmlu_es_stem
  - global_mmlu_es_social_sciences
aggregate_metric_list:
  # `weight_by_size` is an attribute of the `acc` entry, so it must be nested
  # under the same list item rather than sit at the top level.
  # NOTE(review): presumably this makes the group score a size-weighted mean
  # of the subtask scores -- confirm against the harness documentation.
  - metric: acc
    weight_by_size: true
metadata:
  version: 0.0
# Generated by _generate_configs.py
task: global_mmlu_es_business
# Remaining settings are pulled in from the _es_template_yaml file.
include: _es_template_yaml
# Document filter resolved by name (process_business) from the utils module.
process_docs: !function utils.process_business
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment