Commit 8fdcbc13 authored by haileyschoelkopf
Browse files

add more explicit group configs

parent 51519e40
......@@ -15,7 +15,7 @@ task:
- aclue_polysemy_resolution
- aclue_reading_comprehension
- aclue_sentence_segmentation
aggregate_metric:
aggregate_metric_list:
- metric: acc
aggregation: mean
weight_by_size: true
......
......@@ -5,7 +5,7 @@ task:
- aexams_Physics
- aexams_Science
- aexams_Social
aggregate_metric:
aggregate_metric_list:
- metric: acc
aggregation: mean
weight_by_size: true
......
group: blimp
dataset_path: blimp
output_type: multiple_choice
validation_split: train
......
tag:
- crows_pairs
- social_bias
task: crows_pairs_english
dataset_path: BigScienceBiasEval/crows_pairs_multilingual
dataset_name: english
......
include: gsm8k-cot.yaml
group:
tag:
- chain_of_thought
- self_consistency
task: gsm8k_cot_self_consistency
......
group:
tag:
- math_word_problems
task: gsm8k_cot_zeroshot
dataset_path: gsm8k
......
......@@ -61,7 +61,7 @@ generation_kwargs:
- 'Q:'
- </s>
- <|im_end|>
group:
tag:
- chain_of_thought
metadata:
version: 3.0
......
group:
tag:
- math_word_problems
task: gsm8k
dataset_path: gsm8k
......
group:
tag:
- multiple_choice
task: hellaswag
dataset_path: hellaswag
......
group:
tag:
- hendrycks_ethics
task: ethics_cm
dataset_path: EleutherAI/hendrycks_ethics
......
include: deontology.yaml
group:
tag:
- hendrycks_ethics
task: ethics_justice
dataset_name: justice
......
include: commonsense.yaml
group:
tag:
- hendrycks_ethics
task: ethics_utilitarianism
dataset_name: utilitarianism
......
include: commonsense.yaml
group:
tag:
- hendrycks_ethics
task: ethics_virtue
dataset_name: virtue
......
group:
tag:
- kobest
task: kobest_boolq
dataset_path: skt/kobest_v1
......
group:
tag:
- kobest
task: kobest_copa
dataset_path: skt/kobest_v1
......
group:
tag:
- kobest
task: kobest_hellaswag
dataset_path: skt/kobest_v1
......
group:
tag:
- kobest
task: kobest_sentineg
dataset_path: skt/kobest_v1
......
group:
tag:
- kobest
task: kobest_wic
dataset_path: skt/kobest_v1
......
group: qasper
tag: qasper
task: qasper_bool
dataset_path: allenai/qasper
output_type: multiple_choice
......
group: qasper
tag: qasper
task: qasper_freeform
dataset_path: allenai/qasper
output_type: generate_until
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment