"test/vscode:/vscode.git/clone" did not exist on "9a7bb6d233a13be69b1db43adc6a6be9aac7cd4d"
Unverified Commit 5c006ed4 authored by Minho Ryu's avatar Minho Ryu Committed by GitHub
Browse files

separate category for `global_mmlu` (#2652)

* separate category

* set version 0.0

* apply precommit
parent 370e2f9e
# Generated by _generate_configs.py
# Declares the task `global_mmlu_fr`, which selects the `fr` dataset
# configuration. Every other setting comes from the included `_default_yaml`
# (not shown here).
dataset_name: fr
include: _default_yaml
task: global_mmlu_fr
# Generated by _generate_configs.py
# Declares the task `global_mmlu_hi`, which selects the `hi` dataset
# configuration. Every other setting comes from the included `_default_yaml`
# (not shown here).
dataset_name: hi
include: _default_yaml
task: global_mmlu_hi
# Generated by _generate_configs.py
# Declares the task `global_mmlu_id`, which selects the `id` dataset
# configuration. Every other setting comes from the included `_default_yaml`
# (not shown here).
dataset_name: id
include: _default_yaml
task: global_mmlu_id
# Generated by _generate_configs.py
# Declares the task `global_mmlu_it`, which selects the `it` dataset
# configuration. Every other setting comes from the included `_default_yaml`
# (not shown here).
dataset_name: it
include: _default_yaml
task: global_mmlu_it
# Generated by _generate_configs.py
# Declares the task `global_mmlu_ja`, which selects the `ja` dataset
# configuration. Every other setting comes from the included `_default_yaml`
# (not shown here).
dataset_name: ja
include: _default_yaml
task: global_mmlu_ja
# Generated by _generate_configs.py
# Declares the task `global_mmlu_ko`, which selects the `ko` dataset
# configuration. Every other setting comes from the included `_default_yaml`
# (not shown here).
dataset_name: ko
include: _default_yaml
task: global_mmlu_ko
# Generated by _generate_configs.py
# Declares the task `global_mmlu_pt`, which selects the `pt` dataset
# configuration. Every other setting comes from the included `_default_yaml`
# (not shown here).
dataset_name: pt
include: _default_yaml
task: global_mmlu_pt
# Generated by _generate_configs.py
# Declares the task `global_mmlu_sw`, which selects the `sw` dataset
# configuration. Every other setting comes from the included `_default_yaml`
# (not shown here).
dataset_name: sw
include: _default_yaml
task: global_mmlu_sw
# Generated by _generate_configs.py
# Declares the task `global_mmlu_yo`, which selects the `yo` dataset
# configuration. Every other setting comes from the included `_default_yaml`
# (not shown here).
dataset_name: yo
include: _default_yaml
task: global_mmlu_yo
# Generated by _generate_configs.py
# Declares the task `global_mmlu_zh`, which selects the `zh` dataset
# configuration. Every other setting comes from the included `_default_yaml`
# (not shown here).
dataset_name: zh
include: _default_yaml
task: global_mmlu_zh
# Group config: bundles the six per-category `hi` subtasks under the single
# name `global_mmlu_hi` so they can be run and reported together.
group: global_mmlu_hi
task:
  - global_mmlu_hi_business
  - global_mmlu_hi_humanities
  - global_mmlu_hi_medical
  - global_mmlu_hi_other
  - global_mmlu_hi_stem
  - global_mmlu_hi_social_sciences
# One group-level accuracy is reported. `weight_by_size` must stay nested under
# the `acc` entry: it is a per-metric option, not a top-level key.
aggregate_metric_list:
  - metric: acc
    weight_by_size: True
# `version` belongs to the `metadata` mapping.
metadata:
  version: 0.0
# Shared template for the per-category `hi` tasks, which pull it in with
# `include: _hi_template_yaml` and add their own `task` and `process_docs`.
dataset_path: CohereForAI/Global-MMLU-Lite
dataset_name: hi
# Evaluate on `test`; draw few-shot examples from `dev`.
test_split: test
fewshot_split: dev
fewshot_config:
  sampler: default
output_type: multiple_choice
# Prompt: the stripped question, the four lettered options, then "Answer:".
doc_to_text: "{{question.strip()}}\nA. {{option_a}}\nB. {{option_b}}\nC. {{option_c}}\nD. {{option_d}}\nAnswer:"
doc_to_choice: ["A", "B", "C", "D"]
# Gold label is read from the document's `answer` field.
doc_to_target: answer
# `aggregation` and `higher_is_better` are options of the `acc` entry and must
# stay nested under it.
metric_list:
  - metric: acc
    aggregation: mean
    higher_is_better: true
metadata:
  version: 0.0
# Generated by _generate_configs.py
# Declares the task `global_mmlu_hi_business`: inherits `_hi_template_yaml` and
# passes the documents through `utils.process_business` before evaluation
# (expected to keep only the Business category — confirm against utils).
include: _hi_template_yaml
process_docs: !function utils.process_business
task: global_mmlu_hi_business
# Generated by _generate_configs.py
# Declares the task `global_mmlu_hi_humanities`: inherits `_hi_template_yaml`
# and passes the documents through `utils.process_humanities` before evaluation
# (expected to keep only the Humanities category — confirm against utils).
include: _hi_template_yaml
process_docs: !function utils.process_humanities
task: global_mmlu_hi_humanities
# Generated by _generate_configs.py
# Declares the task `global_mmlu_hi_medical`: inherits `_hi_template_yaml` and
# passes the documents through `utils.process_medical` before evaluation
# (expected to keep only the Medical category — confirm against utils).
include: _hi_template_yaml
process_docs: !function utils.process_medical
task: global_mmlu_hi_medical
# Generated by _generate_configs.py
# Declares the task `global_mmlu_hi_other`: inherits `_hi_template_yaml` and
# passes the documents through `utils.process_other` before evaluation
# (expected to keep only the Other category — confirm against utils).
include: _hi_template_yaml
process_docs: !function utils.process_other
task: global_mmlu_hi_other
# Generated by _generate_configs.py
# Declares the task `global_mmlu_hi_social_sciences`: inherits
# `_hi_template_yaml` and passes the documents through
# `utils.process_social_sciences` before evaluation (expected to keep only the
# Social Sciences category — confirm against utils).
include: _hi_template_yaml
process_docs: !function utils.process_social_sciences
task: global_mmlu_hi_social_sciences
# Generated by _generate_configs.py
# Declares the task `global_mmlu_hi_stem`: inherits `_hi_template_yaml` and
# passes the documents through `utils.process_stem` before evaluation
# (expected to keep only the STEM category — confirm against utils).
include: _hi_template_yaml
process_docs: !function utils.process_stem
task: global_mmlu_hi_stem
from functools import partial
CATEGORIES = ["Business", "Humanities", "Medical", "Other", "STEM", "Social Sciences"]
def process_docs(dataset, category):
    """Return the documents of *dataset* whose subject category is *category*.

    Args:
        dataset: Object exposing ``filter(predicate)``. Each document handed
            to the predicate must support ``doc["subject_category"]``.
        category: Value compared for exact equality against the document's
            ``subject_category`` field (e.g. ``"STEM"``).

    Returns:
        Whatever ``dataset.filter`` returns for the matching documents.
    """
    return dataset.filter(lambda doc: doc["subject_category"] == category)
# One pre-bound filter per entry of CATEGORIES, keyed by the name the task
# configs refer to: "process_" + the category lower-cased with spaces turned
# into underscores (e.g. "Social Sciences" -> "process_social_sciences").
process_functions = dict(
    (
        "process_" + category.lower().replace(" ", "_"),
        partial(process_docs, category=category),
    )
    for category in CATEGORIES
)

# Publish every generated filter as a module-level name so that references
# such as `!function utils.process_business` can be resolved.
globals().update(process_functions)
# Group config: bundles the six per-category `id` subtasks under the single
# name `global_mmlu_id` so they can be run and reported together.
group: global_mmlu_id
task:
  - global_mmlu_id_business
  - global_mmlu_id_humanities
  - global_mmlu_id_medical
  - global_mmlu_id_other
  - global_mmlu_id_stem
  - global_mmlu_id_social_sciences
# One group-level accuracy is reported. `weight_by_size` must stay nested under
# the `acc` entry: it is a per-metric option, not a top-level key.
aggregate_metric_list:
  - metric: acc
    weight_by_size: True
# `version` belongs to the `metadata` mapping.
metadata:
  version: 0.0
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment