Commit 44a602ab authored by haileyschoelkopf
Browse files

add many explicit group configs

parent c9801daf
...@@ -4,28 +4,28 @@ task: ...@@ -4,28 +4,28 @@ task:
- group: stem - group: stem
task: task:
- mmlu_flan_n_shot_loglikelihood_stem - mmlu_flan_n_shot_loglikelihood_stem
aggregate_metric: aggregate_metric_list:
- metric: acc - metric: acc
weight_by_size: True weight_by_size: True
- group: other - group: other
task: task:
- mmlu_flan_n_shot_loglikelihood_other - mmlu_flan_n_shot_loglikelihood_other
aggregate_metric: aggregate_metric_list:
- metric: acc - metric: acc
weight_by_size: True weight_by_size: True
- group: social sciences - group: social sciences
task: task:
- mmlu_flan_n_shot_loglikelihood_social_sciences - mmlu_flan_n_shot_loglikelihood_social_sciences
aggregate_metric: aggregate_metric_list:
- metric: acc - metric: acc
weight_by_size: True weight_by_size: True
- group: humanities - group: humanities
task: task:
- mmlu_flan_n_shot_loglikelihood_humanities - mmlu_flan_n_shot_loglikelihood_humanities
aggregate_metric: aggregate_metric_list:
- metric: acc - metric: acc
weight_by_size: True weight_by_size: True
aggregate_metric: aggregate_metric_list:
- metric: acc - metric: acc
weight_by_size: True weight_by_size: True
metadata: metadata:
......
...@@ -4,28 +4,28 @@ task: ...@@ -4,28 +4,28 @@ task:
- group: stem - group: stem
task: task:
- mmlu_stem_generative - mmlu_stem_generative
aggregate_metric: aggregate_metric_list:
- metric: acc - metric: acc
weight_by_size: True weight_by_size: True
- group: other - group: other
task: task:
- mmlu_other_generative - mmlu_other_generative
aggregate_metric: aggregate_metric_list:
- metric: acc - metric: acc
weight_by_size: True weight_by_size: True
- group: social sciences - group: social sciences
task: task:
- mmlu_social_sciences_generative - mmlu_social_sciences_generative
aggregate_metric: aggregate_metric_list:
- metric: acc - metric: acc
weight_by_size: True weight_by_size: True
- group: humanities - group: humanities
task: task:
- mmlu_humanities_generative - mmlu_humanities_generative
aggregate_metric: aggregate_metric_list:
- metric: acc - metric: acc
weight_by_size: True weight_by_size: True
aggregate_metric: aggregate_metric_list:
- metric: acc - metric: acc
weight_by_size: True weight_by_size: True
metadata: metadata:
......
group: tag:
- arc_multilingual - arc_multilingual
dataset_path: null dataset_path: null
dataset_name: null dataset_name: null
......
group: tag:
- hellaswag_multilingual - hellaswag_multilingual
dataset_path: null dataset_path: null
dataset_name: null dataset_name: null
......
group: tag:
- m_mmlu - m_mmlu
dataset_path: alexandrainst/m_mmlu dataset_path: alexandrainst/m_mmlu
test_split: test test_split: test
......
group: tag:
- truthfulqa_multilingual - truthfulqa_multilingual
dataset_path: null dataset_path: null
dataset_name: null dataset_name: null
......
# Group `pawsx`: bundles the per-language PAWS-X subtasks listed under `task`.
group: pawsx
task:
  - paws_en
  - paws_de
  - paws_es
  - paws_fr
  - paws_ja
  - paws_ko
  - paws_zh
aggregate_metric_list:
  # A single aggregated metric; `aggregation` and `weight_by_size` are
  # fields of this list entry, not top-level keys.
  - metric: acc
    aggregation: mean
    # NOTE(review): presumably weights each subtask's score by its sample
    # count when averaging -- confirm against the harness documentation.
    weight_by_size: true
metadata:
  # Kept as an unquoted number, exactly as in the original value.
  version: 0.0
# This file will be included in the generated language-specific task configs. # This file will be included in the generated language-specific task configs.
# It doesn't have a yaml file extension as it is not meant to be imported directly # It doesn't have a yaml file extension as it is not meant to be imported directly
# by the harness. # by the harness.
group: pawsx
task: null task: null
dataset_path: paws-x dataset_path: paws-x
dataset_name: null dataset_name: null
......
group: tag:
- qa4mre - qa4mre
task: qa4mre_2011 task: qa4mre_2011
dataset_path: qa4mre dataset_path: qa4mre
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment