Commit 7d09b24c authored by haileyschoelkopf
Browse files

fix alllll the merge conflicts

parents 96dfe976 6348b947
group: sycophancy
tag: sycophancy
task: sycophancy_on_philpapers2020
dataset_path: EleutherAI/sycophancy
dataset_name: sycophancy_on_philpapers2020
......
group: sycophancy
tag: sycophancy
task: sycophancy_on_political_typology_quiz
dataset_path: EleutherAI/sycophancy
dataset_name: sycophancy_on_political_typology_quiz
......
group: winogenerated
tag: winogenerated
dataset_path: EleutherAI/winogenerated
output_type: multiple_choice
validation_split: validation
......
group:
tag:
- arc_multilingual
dataset_path: null
dataset_name: null
......
group:
tag:
- hellaswag_multilingual
dataset_path: null
dataset_name: null
......
group:
tag:
- m_mmlu
dataset_path: alexandrainst/m_mmlu
test_split: test
......
group:
tag:
- truthfulqa_multilingual
dataset_path: null
dataset_name: null
......
group: pawsx
task:
- paws_en
- paws_de
- paws_es
- paws_fr
- paws_ja
- paws_ko
- paws_zh
aggregate_metric_list:
- metric: acc
aggregation: mean
weight_by_size: true
metadata:
version: 0.0
# This file will be included in the generated language-specific task configs.
# It doesn't have a yaml file extension as it is not meant to be imported directly
# by the harness.
group: pawsx
task: null
dataset_path: paws-x
dataset_name: null
......
group:
- pile
task: pile_arxiv
dataset_path: EleutherAI/pile
dataset_name: pile_arxiv
......
group:
tag:
- polemo2
task: polemo2_in
dataset_path: allegro/klej-polemo2-in
......
group:
tag:
- qa4mre
task: qa4mre_2011
dataset_path: qa4mre
......
group: qasper
tag: qasper
task: qasper_bool
dataset_path: allenai/qasper
output_type: multiple_choice
......
group: qasper
tag: qasper
task: qasper_freeform
dataset_path: allenai/qasper
output_type: generate_until
......
......@@ -12,7 +12,7 @@ class SQUADCompletion(ConfigurableTask):
DATASET_PATH = "hazyresearch/based-squad"
DATASET_NAME = "default"
def __init__(self):
def __init__(self, **kwargs):
super().__init__(config={"metadata": {"version": self.VERSION}})
def has_training_docs(self):
......
group: storycloze
tag: storycloze
task: storycloze_2016
dataset_path: story_cloze
dataset_name: 2016
......
group: storycloze
tag: storycloze
task: storycloze_2018
dataset_path: story_cloze
dataset_name: 2018
......
......@@ -26,10 +26,14 @@ Homepage: https://super.gluebenchmark.com/
}
```
### Groups and Tasks
### Groups, Tags, and Tasks
#### Groups
None.
#### Tags
* `super-glue-lm-eval-v1`: SuperGLUE eval adapted from LM Eval V1
* `super-glue-t5-prompt`: SuperGLUE prompt and evaluation that match the T5 paper (when run with accelerate, this tag will error if the `record` task is included).
......
......@@ -12,7 +12,7 @@ class SWDE(ConfigurableTask):
DATASET_PATH = "hazyresearch/based-swde-v2"
DATASET_NAME = "default"
def __init__(self):
def __init__(self, **kwargs):
super().__init__(config={"metadata": {"version": self.VERSION}})
def has_training_docs(self):
......
......@@ -5,8 +5,7 @@ doc_to_target: ' {{translation["en"]}}'
doc_to_text: 'Arabic phrase: {{translation["ar"]}}
English phrase:'
group:
- generate_until
tag:
- translation
- iwslt2017
include: wmt_common_yaml
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment