Commit 44a602ab authored by haileyschoelkopf
Browse files

add many explicit group configs

parent c9801daf
......@@ -4,28 +4,28 @@ task:
- group: stem
task:
- mmlu_flan_n_shot_loglikelihood_stem
aggregate_metric:
aggregate_metric_list:
- metric: acc
weight_by_size: True
- group: other
task:
- mmlu_flan_n_shot_loglikelihood_other
aggregate_metric:
aggregate_metric_list:
- metric: acc
weight_by_size: True
- group: social sciences
task:
- mmlu_flan_n_shot_loglikelihood_social_sciences
aggregate_metric:
aggregate_metric_list:
- metric: acc
weight_by_size: True
- group: humanities
task:
- mmlu_flan_n_shot_loglikelihood_humanities
aggregate_metric:
aggregate_metric_list:
- metric: acc
weight_by_size: True
aggregate_metric:
aggregate_metric_list:
- metric: acc
weight_by_size: True
metadata:
......
......@@ -4,28 +4,28 @@ task:
- group: stem
task:
- mmlu_stem_generative
aggregate_metric:
aggregate_metric_list:
- metric: acc
weight_by_size: True
- group: other
task:
- mmlu_other_generative
aggregate_metric:
aggregate_metric_list:
- metric: acc
weight_by_size: True
- group: social sciences
task:
- mmlu_social_sciences_generative
aggregate_metric:
aggregate_metric_list:
- metric: acc
weight_by_size: True
- group: humanities
task:
- mmlu_humanities_generative
aggregate_metric:
aggregate_metric_list:
- metric: acc
weight_by_size: True
aggregate_metric:
aggregate_metric_list:
- metric: acc
weight_by_size: True
metadata:
......
group:
tag:
- arc_multilingual
dataset_path: null
dataset_name: null
......
group:
tag:
- hellaswag_multilingual
dataset_path: null
dataset_name: null
......
group:
tag:
- m_mmlu
dataset_path: alexandrainst/m_mmlu
test_split: test
......
group:
tag:
- truthfulqa_multilingual
dataset_path: null
dataset_name: null
......
# Group config for `pawsx`: bundles the per-language PAWS-X subtasks listed
# below under a single group name and declares how a group-level score is
# reported.
group: pawsx
# Member subtasks, one per language code suffix.
task:
  - paws_en
  - paws_de
  - paws_es
  - paws_fr
  - paws_ja
  - paws_ko
  - paws_zh
# Group-level metrics. `aggregation` and `weight_by_size` are fields of the
# `acc` entry, so they must be nested under that list item rather than sit at
# the top level.
# NOTE(review): `weight_by_size: true` presumably weights each subtask by its
# number of documents when taking the mean; confirm against the harness docs.
aggregate_metric_list:
  - metric: acc
    aggregation: mean
    weight_by_size: true
metadata:
  version: 0.0
# This file will be included in the generated language-specific task configs.
# It doesn't have a yaml file extension as it is not meant to be imported directly
# by the harness.
group: pawsx
task: null
dataset_path: paws-x
dataset_name: null
......
group:
tag:
- qa4mre
task: qa4mre_2011
dataset_path: qa4mre
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment