Commit 4288b53e authored by Baber
Browse files

Merge branch 'main' into llama

parents 37eb9c9d 94344a61
# Shared settings for the `pt` tasks; the per-category task files pull this in
# through `include: _pt_template_yaml`.
dataset_path: CohereForAI/Global-MMLU-Lite
dataset_name: pt
test_split: test
fewshot_split: dev
fewshot_config:
  sampler: default
output_type: multiple_choice
# Prompt layout: the stripped question, four lettered options, then "Answer:".
doc_to_text: "{{question.strip()}}\nA. {{option_a}}\nB. {{option_b}}\nC. {{option_c}}\nD. {{option_d}}\nAnswer:"
doc_to_choice: ["A", "B", "C", "D"]
# Presumably the name of the dataset field holding the gold label -- confirm.
doc_to_target: answer
metric_list:
  # `aggregation` and `higher_is_better` belong to this metric entry, so they
  # must be nested under the list item rather than sit at the top level.
  - metric: acc
    aggregation: mean
    higher_is_better: true
metadata:
  version: 0.0
# Generated by _generate_configs.py
# Business category task of the `pt` family.
task: global_mmlu_pt_business
# Remaining settings presumably come from the included template file.
include: _pt_template_yaml
# Custom `!function` tag pointing at `process_business` in the `utils` module.
process_docs: !function utils.process_business
# Generated by _generate_configs.py
# Humanities category task of the `pt` family.
task: global_mmlu_pt_humanities
# Remaining settings presumably come from the included template file.
include: _pt_template_yaml
# Custom `!function` tag pointing at `process_humanities` in the `utils` module.
process_docs: !function utils.process_humanities
# Generated by _generate_configs.py
# Medical category task of the `pt` family.
task: global_mmlu_pt_medical
# Remaining settings presumably come from the included template file.
include: _pt_template_yaml
# Custom `!function` tag pointing at `process_medical` in the `utils` module.
process_docs: !function utils.process_medical
# Generated by _generate_configs.py
# "Other" category task of the `pt` family.
task: global_mmlu_pt_other
# Remaining settings presumably come from the included template file.
include: _pt_template_yaml
# Custom `!function` tag pointing at `process_other` in the `utils` module.
process_docs: !function utils.process_other
# Generated by _generate_configs.py
# Social Sciences category task of the `pt` family.
task: global_mmlu_pt_social_sciences
# Remaining settings presumably come from the included template file.
include: _pt_template_yaml
# Custom `!function` tag pointing at `process_social_sciences` in the `utils`
# module.
process_docs: !function utils.process_social_sciences
# Generated by _generate_configs.py
# STEM category task of the `pt` family.
task: global_mmlu_pt_stem
# Remaining settings presumably come from the included template file.
include: _pt_template_yaml
# Custom `!function` tag pointing at `process_stem` in the `utils` module.
process_docs: !function utils.process_stem
from functools import partial
# Subject categories; each one gets its own generated ``process_<slug>`` filter.
CATEGORIES = ["Business", "Humanities", "Medical", "Other", "STEM", "Social Sciences"]


def process_docs(dataset, category):
    """Return the rows of ``dataset`` whose ``subject_category`` equals ``category``.

    Args:
        dataset: Object exposing ``filter(predicate)``; the predicate receives
            one row and indexes it with ``"subject_category"``. (Presumably a
            Hugging Face ``datasets.Dataset`` -- confirm against the caller.)
        category: Category label to keep; compared with ``==``, so the match
            is exact and case-sensitive.

    Returns:
        Whatever ``dataset.filter`` returns for that predicate.
    """
    return dataset.filter(lambda doc: doc["subject_category"] == category)


# Build one filter per category: the key is "process_" plus the lower-cased
# category with spaces turned into underscores (e.g. "process_social_sciences"),
# the value is ``process_docs`` with ``category`` pre-bound.
process_functions = {
    f"process_{category.lower().replace(' ', '_')}": partial(
        process_docs, category=category
    )
    for category in CATEGORIES
}

# Publish every generated filter as a module-level name so it can be looked up
# as an attribute of this module (presumably how the task YAML entries such as
# ``!function utils.process_business`` are resolved -- confirm).
globals().update(process_functions)
# Group definition collecting the six `sw` category tasks under one name.
group: global_mmlu_sw
task:
  - global_mmlu_sw_business
  - global_mmlu_sw_humanities
  - global_mmlu_sw_medical
  - global_mmlu_sw_other
  - global_mmlu_sw_stem
  - global_mmlu_sw_social_sciences
aggregate_metric_list:
  # `weight_by_size` is an option of this metric entry, so it is nested under
  # the list item. Presumably it weights each subtask by its number of
  # documents when averaging -- confirm against the harness documentation.
  - metric: acc
    weight_by_size: true
metadata:
  version: 0.0
# Shared settings for the `sw` tasks; the per-category task files pull this in
# through `include: _sw_template_yaml`.
dataset_path: CohereForAI/Global-MMLU-Lite
dataset_name: sw
test_split: test
fewshot_split: dev
fewshot_config:
  sampler: default
output_type: multiple_choice
# Prompt layout: the stripped question, four lettered options, then "Answer:".
doc_to_text: "{{question.strip()}}\nA. {{option_a}}\nB. {{option_b}}\nC. {{option_c}}\nD. {{option_d}}\nAnswer:"
doc_to_choice: ["A", "B", "C", "D"]
# Presumably the name of the dataset field holding the gold label -- confirm.
doc_to_target: answer
metric_list:
  # `aggregation` and `higher_is_better` belong to this metric entry, so they
  # must be nested under the list item rather than sit at the top level.
  - metric: acc
    aggregation: mean
    higher_is_better: true
metadata:
  version: 0.0
# Generated by _generate_configs.py
# Business category task of the `sw` family.
task: global_mmlu_sw_business
# Remaining settings presumably come from the included template file.
include: _sw_template_yaml
# Custom `!function` tag pointing at `process_business` in the `utils` module.
process_docs: !function utils.process_business
# Generated by _generate_configs.py
# Humanities category task of the `sw` family.
task: global_mmlu_sw_humanities
# Remaining settings presumably come from the included template file.
include: _sw_template_yaml
# Custom `!function` tag pointing at `process_humanities` in the `utils` module.
process_docs: !function utils.process_humanities
# Generated by _generate_configs.py
# Medical category task of the `sw` family.
task: global_mmlu_sw_medical
# Remaining settings presumably come from the included template file.
include: _sw_template_yaml
# Custom `!function` tag pointing at `process_medical` in the `utils` module.
process_docs: !function utils.process_medical
# Generated by _generate_configs.py
# "Other" category task of the `sw` family.
task: global_mmlu_sw_other
# Remaining settings presumably come from the included template file.
include: _sw_template_yaml
# Custom `!function` tag pointing at `process_other` in the `utils` module.
process_docs: !function utils.process_other
# Generated by _generate_configs.py
# Social Sciences category task of the `sw` family.
task: global_mmlu_sw_social_sciences
# Remaining settings presumably come from the included template file.
include: _sw_template_yaml
# Custom `!function` tag pointing at `process_social_sciences` in the `utils`
# module.
process_docs: !function utils.process_social_sciences
# Generated by _generate_configs.py
# STEM category task of the `sw` family.
task: global_mmlu_sw_stem
# Remaining settings presumably come from the included template file.
include: _sw_template_yaml
# Custom `!function` tag pointing at `process_stem` in the `utils` module.
process_docs: !function utils.process_stem
from functools import partial
# Subject categories; each one gets its own generated ``process_<slug>`` filter.
CATEGORIES = ["Business", "Humanities", "Medical", "Other", "STEM", "Social Sciences"]


def process_docs(dataset, category):
    """Return the rows of ``dataset`` whose ``subject_category`` equals ``category``.

    Args:
        dataset: Object exposing ``filter(predicate)``; the predicate receives
            one row and indexes it with ``"subject_category"``. (Presumably a
            Hugging Face ``datasets.Dataset`` -- confirm against the caller.)
        category: Category label to keep; compared with ``==``, so the match
            is exact and case-sensitive.

    Returns:
        Whatever ``dataset.filter`` returns for that predicate.
    """
    return dataset.filter(lambda doc: doc["subject_category"] == category)


# Build one filter per category: the key is "process_" plus the lower-cased
# category with spaces turned into underscores (e.g. "process_social_sciences"),
# the value is ``process_docs`` with ``category`` pre-bound.
process_functions = {
    f"process_{category.lower().replace(' ', '_')}": partial(
        process_docs, category=category
    )
    for category in CATEGORIES
}

# Publish every generated filter as a module-level name so it can be looked up
# as an attribute of this module (presumably how the task YAML entries such as
# ``!function utils.process_business`` are resolved -- confirm).
globals().update(process_functions)
# Group definition collecting the six `yo` category tasks under one name.
group: global_mmlu_yo
task:
  - global_mmlu_yo_business
  - global_mmlu_yo_humanities
  - global_mmlu_yo_medical
  - global_mmlu_yo_other
  - global_mmlu_yo_stem
  - global_mmlu_yo_social_sciences
aggregate_metric_list:
  # `weight_by_size` is an option of this metric entry, so it is nested under
  # the list item. Presumably it weights each subtask by its number of
  # documents when averaging -- confirm against the harness documentation.
  - metric: acc
    weight_by_size: true
metadata:
  version: 0.0
# Shared settings for the `yo` tasks; the per-category task files pull this in
# through `include: _yo_template_yaml`.
dataset_path: CohereForAI/Global-MMLU-Lite
dataset_name: yo
test_split: test
fewshot_split: dev
fewshot_config:
  sampler: default
output_type: multiple_choice
# Prompt layout: the stripped question, four lettered options, then "Answer:".
doc_to_text: "{{question.strip()}}\nA. {{option_a}}\nB. {{option_b}}\nC. {{option_c}}\nD. {{option_d}}\nAnswer:"
doc_to_choice: ["A", "B", "C", "D"]
# Presumably the name of the dataset field holding the gold label -- confirm.
doc_to_target: answer
metric_list:
  # `aggregation` and `higher_is_better` belong to this metric entry, so they
  # must be nested under the list item rather than sit at the top level.
  - metric: acc
    aggregation: mean
    higher_is_better: true
metadata:
  version: 0.0
# Generated by _generate_configs.py
# Business category task of the `yo` family.
task: global_mmlu_yo_business
# Remaining settings presumably come from the included template file.
include: _yo_template_yaml
# Custom `!function` tag pointing at `process_business` in the `utils` module.
process_docs: !function utils.process_business
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment