Commit 8fdcbc13 authored by haileyschoelkopf
Browse files

add more explicit group configs

parent 51519e40
...@@ -15,7 +15,7 @@ task: ...@@ -15,7 +15,7 @@ task:
- aclue_polysemy_resolution - aclue_polysemy_resolution
- aclue_reading_comprehension - aclue_reading_comprehension
- aclue_sentence_segmentation - aclue_sentence_segmentation
aggregate_metric: aggregate_metric_list:
- metric: acc - metric: acc
aggregation: mean aggregation: mean
weight_by_size: true weight_by_size: true
......
...@@ -5,7 +5,7 @@ task: ...@@ -5,7 +5,7 @@ task:
- aexams_Physics - aexams_Physics
- aexams_Science - aexams_Science
- aexams_Social - aexams_Social
aggregate_metric: aggregate_metric_list:
- metric: acc - metric: acc
aggregation: mean aggregation: mean
weight_by_size: true weight_by_size: true
......
group: blimp
dataset_path: blimp dataset_path: blimp
output_type: multiple_choice output_type: multiple_choice
validation_split: train validation_split: train
......
tag: tag:
- crows_pairs - crows_pairs
- social_bias
task: crows_pairs_english task: crows_pairs_english
dataset_path: BigScienceBiasEval/crows_pairs_multilingual dataset_path: BigScienceBiasEval/crows_pairs_multilingual
dataset_name: english dataset_name: english
......
include: gsm8k-cot.yaml include: gsm8k-cot.yaml
group: tag:
- chain_of_thought - chain_of_thought
- self_consistency - self_consistency
task: gsm8k_cot_self_consistency task: gsm8k_cot_self_consistency
......
group: tag:
- math_word_problems - math_word_problems
task: gsm8k_cot_zeroshot task: gsm8k_cot_zeroshot
dataset_path: gsm8k dataset_path: gsm8k
......
...@@ -61,7 +61,7 @@ generation_kwargs: ...@@ -61,7 +61,7 @@ generation_kwargs:
- 'Q:' - 'Q:'
- </s> - </s>
- <|im_end|> - <|im_end|>
group: tag:
- chain_of_thought - chain_of_thought
metadata: metadata:
version: 3.0 version: 3.0
......
group: tag:
- math_word_problems - math_word_problems
task: gsm8k task: gsm8k
dataset_path: gsm8k dataset_path: gsm8k
......
group: tag:
- multiple_choice - multiple_choice
task: hellaswag task: hellaswag
dataset_path: hellaswag dataset_path: hellaswag
......
group: tag:
- hendrycks_ethics - hendrycks_ethics
task: ethics_cm task: ethics_cm
dataset_path: EleutherAI/hendrycks_ethics dataset_path: EleutherAI/hendrycks_ethics
......
include: deontology.yaml include: deontology.yaml
group: tag:
- hendrycks_ethics - hendrycks_ethics
task: ethics_justice task: ethics_justice
dataset_name: justice dataset_name: justice
......
include: commonsense.yaml include: commonsense.yaml
group: tag:
- hendrycks_ethics - hendrycks_ethics
task: ethics_utilitarianism task: ethics_utilitarianism
dataset_name: utilitarianism dataset_name: utilitarianism
......
include: commonsense.yaml include: commonsense.yaml
group: tag:
- hendrycks_ethics - hendrycks_ethics
task: ethics_virtue task: ethics_virtue
dataset_name: virtue dataset_name: virtue
......
group: tag:
- kobest - kobest
task: kobest_boolq task: kobest_boolq
dataset_path: skt/kobest_v1 dataset_path: skt/kobest_v1
......
group: tag:
- kobest - kobest
task: kobest_copa task: kobest_copa
dataset_path: skt/kobest_v1 dataset_path: skt/kobest_v1
......
group: tag:
- kobest - kobest
task: kobest_hellaswag task: kobest_hellaswag
dataset_path: skt/kobest_v1 dataset_path: skt/kobest_v1
......
group: tag:
- kobest - kobest
task: kobest_sentineg task: kobest_sentineg
dataset_path: skt/kobest_v1 dataset_path: skt/kobest_v1
......
group: tag:
- kobest - kobest
task: kobest_wic task: kobest_wic
dataset_path: skt/kobest_v1 dataset_path: skt/kobest_v1
......
group: qasper tag: qasper
task: qasper_bool task: qasper_bool
dataset_path: allenai/qasper dataset_path: allenai/qasper
output_type: multiple_choice output_type: multiple_choice
......
group: qasper tag: qasper
task: qasper_freeform task: qasper_freeform
dataset_path: allenai/qasper dataset_path: allenai/qasper
output_type: generate_until output_type: generate_until
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment