"...lm-evaluation-harness.git" did not exist on "a36348faf5ac0a04f5f3a0ecd0e2c00414c50d0e"
Commit 8fada609 authored by Baber's avatar Baber
Browse files

Merge branch 'main' into mathvista

parents 0007b74a 1208afd3
# Group config: reports one aggregated `acc` score for the humanities subset.
group: global_mmlu_full_ar_humanities
task:
  # Presumably a tag shared by the individual humanities task configs
  # (none of them are visible in this part of the diff) - TODO confirm.
  - global_mmlu_full_ar_humanities_tasks
aggregate_metric_list:
  # `weight_by_size` is a property of this metric entry, so it must be
  # indented under the list item rather than sit at the top level.
  - metric: acc
    weight_by_size: true
metadata:
  # `version` is nested under `metadata`; unindented it would parse as a
  # separate top-level key and leave `metadata` null.
  version: 0.0
# Group config: reports one aggregated `acc` score for the "other" subset.
group: global_mmlu_full_ar_other
task:
  # Same string the per-subject configs use as their `tag`
  # (e.g. business_ethics, clinical_knowledge, college_medicine).
  - global_mmlu_full_ar_other_tasks
aggregate_metric_list:
  # `weight_by_size` is a property of this metric entry, so it must be
  # indented under the list item rather than sit at the top level.
  - metric: acc
    weight_by_size: true
metadata:
  # `version` is nested under `metadata`; unindented it would parse as a
  # separate top-level key and leave `metadata` null.
  version: 0.0
# Group config: reports one aggregated `acc` score for the social-sciences subset.
group: global_mmlu_full_ar_social_sciences
task:
  # Same string the per-subject configs use as their `tag`
  # (e.g. econometrics).
  - global_mmlu_full_ar_social_sciences_tasks
aggregate_metric_list:
  # `weight_by_size` is a property of this metric entry, so it must be
  # indented under the list item rather than sit at the top level.
  - metric: acc
    weight_by_size: true
metadata:
  # `version` is nested under `metadata`; unindented it would parse as a
  # separate top-level key and leave `metadata` null.
  version: 0.0
# Group config: reports one aggregated `acc` score for the STEM subset.
group: global_mmlu_full_ar_stem
task:
  # Same string the per-subject configs use as their `tag`
  # (e.g. abstract_algebra, anatomy, astronomy).
  - global_mmlu_full_ar_stem_tasks
aggregate_metric_list:
  # `weight_by_size` is a property of this metric entry, so it must be
  # indented under the list item rather than sit at the top level.
  - metric: acc
    weight_by_size: true
metadata:
  # `version` is nested under `metadata`; unindented it would parse as a
  # separate top-level key and leave `metadata` null.
  version: 0.0
# Auto-generated by _generate_configs.py.
# Per-subject task entry; its tag is the string listed under `task:` in the
# global_mmlu_full_ar_stem group config.
task: global_mmlu_full_ar_abstract_algebra
tag: global_mmlu_full_ar_stem_tasks
# Presumably supplies the settings shared by all of these subject configs
# (template contents are not shown here).
include: _ar_template_yaml
# Document hook resolved from `utils`.
process_docs: !function utils.process_abstract_algebra
# Auto-generated by _generate_configs.py.
# Per-subject task entry; its tag is the string listed under `task:` in the
# global_mmlu_full_ar_stem group config.
task: global_mmlu_full_ar_anatomy
tag: global_mmlu_full_ar_stem_tasks
# Presumably supplies the settings shared by all of these subject configs
# (template contents are not shown here).
include: _ar_template_yaml
# Document hook resolved from `utils`.
process_docs: !function utils.process_anatomy
# Auto-generated by _generate_configs.py.
# Per-subject task entry; its tag is the string listed under `task:` in the
# global_mmlu_full_ar_stem group config.
task: global_mmlu_full_ar_astronomy
tag: global_mmlu_full_ar_stem_tasks
# Presumably supplies the settings shared by all of these subject configs
# (template contents are not shown here).
include: _ar_template_yaml
# Document hook resolved from `utils`.
process_docs: !function utils.process_astronomy
# Auto-generated by _generate_configs.py.
# Per-subject task entry; its tag is the string listed under `task:` in the
# global_mmlu_full_ar_other group config.
task: global_mmlu_full_ar_business_ethics
tag: global_mmlu_full_ar_other_tasks
# Presumably supplies the settings shared by all of these subject configs
# (template contents are not shown here).
include: _ar_template_yaml
# Document hook resolved from `utils`.
process_docs: !function utils.process_business_ethics
# Auto-generated by _generate_configs.py.
# Per-subject task entry; its tag is the string listed under `task:` in the
# global_mmlu_full_ar_other group config.
task: global_mmlu_full_ar_clinical_knowledge
tag: global_mmlu_full_ar_other_tasks
# Presumably supplies the settings shared by all of these subject configs
# (template contents are not shown here).
include: _ar_template_yaml
# Document hook resolved from `utils`.
process_docs: !function utils.process_clinical_knowledge
# Auto-generated by _generate_configs.py.
# Per-subject task entry; its tag is the string listed under `task:` in the
# global_mmlu_full_ar_stem group config.
task: global_mmlu_full_ar_college_biology
tag: global_mmlu_full_ar_stem_tasks
# Presumably supplies the settings shared by all of these subject configs
# (template contents are not shown here).
include: _ar_template_yaml
# Document hook resolved from `utils`.
process_docs: !function utils.process_college_biology
# Auto-generated by _generate_configs.py.
# Per-subject task entry; its tag is the string listed under `task:` in the
# global_mmlu_full_ar_stem group config.
task: global_mmlu_full_ar_college_chemistry
tag: global_mmlu_full_ar_stem_tasks
# Presumably supplies the settings shared by all of these subject configs
# (template contents are not shown here).
include: _ar_template_yaml
# Document hook resolved from `utils`.
process_docs: !function utils.process_college_chemistry
# Auto-generated by _generate_configs.py.
# Per-subject task entry; its tag is the string listed under `task:` in the
# global_mmlu_full_ar_stem group config.
task: global_mmlu_full_ar_college_computer_science
tag: global_mmlu_full_ar_stem_tasks
# Presumably supplies the settings shared by all of these subject configs
# (template contents are not shown here).
include: _ar_template_yaml
# Document hook resolved from `utils`.
process_docs: !function utils.process_college_computer_science
# Auto-generated by _generate_configs.py.
# Per-subject task entry; its tag is the string listed under `task:` in the
# global_mmlu_full_ar_stem group config.
task: global_mmlu_full_ar_college_mathematics
tag: global_mmlu_full_ar_stem_tasks
# Presumably supplies the settings shared by all of these subject configs
# (template contents are not shown here).
include: _ar_template_yaml
# Document hook resolved from `utils`.
process_docs: !function utils.process_college_mathematics
# Auto-generated by _generate_configs.py.
# Per-subject task entry; its tag is the string listed under `task:` in the
# global_mmlu_full_ar_other group config.
task: global_mmlu_full_ar_college_medicine
tag: global_mmlu_full_ar_other_tasks
# Presumably supplies the settings shared by all of these subject configs
# (template contents are not shown here).
include: _ar_template_yaml
# Document hook resolved from `utils`.
process_docs: !function utils.process_college_medicine
# Auto-generated by _generate_configs.py.
# Per-subject task entry; its tag is the string listed under `task:` in the
# global_mmlu_full_ar_stem group config.
task: global_mmlu_full_ar_college_physics
tag: global_mmlu_full_ar_stem_tasks
# Presumably supplies the settings shared by all of these subject configs
# (template contents are not shown here).
include: _ar_template_yaml
# Document hook resolved from `utils`.
process_docs: !function utils.process_college_physics
# Auto-generated by _generate_configs.py.
# Per-subject task entry; its tag is the string listed under `task:` in the
# global_mmlu_full_ar_stem group config.
task: global_mmlu_full_ar_computer_security
tag: global_mmlu_full_ar_stem_tasks
# Presumably supplies the settings shared by all of these subject configs
# (template contents are not shown here).
include: _ar_template_yaml
# Document hook resolved from `utils`.
process_docs: !function utils.process_computer_security
# Auto-generated by _generate_configs.py.
# Per-subject task entry; its tag is the string listed under `task:` in the
# global_mmlu_full_ar_stem group config.
task: global_mmlu_full_ar_conceptual_physics
tag: global_mmlu_full_ar_stem_tasks
# Presumably supplies the settings shared by all of these subject configs
# (template contents are not shown here).
include: _ar_template_yaml
# Document hook resolved from `utils`.
process_docs: !function utils.process_conceptual_physics
# Auto-generated by _generate_configs.py.
# Per-subject task entry; its tag is the string listed under `task:` in the
# global_mmlu_full_ar_social_sciences group config.
task: global_mmlu_full_ar_econometrics
tag: global_mmlu_full_ar_social_sciences_tasks
# Presumably supplies the settings shared by all of these subject configs
# (template contents are not shown here).
include: _ar_template_yaml
# Document hook resolved from `utils`.
process_docs: !function utils.process_econometrics
# Auto-generated by _generate_configs.py.
# Per-subject task entry; its tag is the string listed under `task:` in the
# global_mmlu_full_ar_stem group config.
task: global_mmlu_full_ar_electrical_engineering
tag: global_mmlu_full_ar_stem_tasks
# Presumably supplies the settings shared by all of these subject configs
# (template contents are not shown here).
include: _ar_template_yaml
# Document hook resolved from `utils`.
process_docs: !function utils.process_electrical_engineering
# Auto-generated by _generate_configs.py.
# Per-subject task entry; its tag is the string listed under `task:` in the
# global_mmlu_full_ar_stem group config.
task: global_mmlu_full_ar_elementary_mathematics
tag: global_mmlu_full_ar_stem_tasks
# Presumably supplies the settings shared by all of these subject configs
# (template contents are not shown here).
include: _ar_template_yaml
# Document hook resolved from `utils`.
process_docs: !function utils.process_elementary_mathematics
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment