Unverified commit dc5b3d5d, authored by Stella Biderman and committed by GitHub
Browse files

Merge pull request #1031 from EleutherAI/versioning

[Refactor] Versioning
parents 39c2bb4e 52f75f0e
......@@ -18,3 +18,5 @@ metric_list:
- metric: acc_norm
aggregation: mean
higher_is_better: true
metadata:
- version: 1.0
......@@ -10,3 +10,5 @@ doc_to_target: 1
doc_to_choice: ["no", "yes"]
metric_list:
- metric: f1
metadata:
- version: 1.0
......@@ -14,3 +14,5 @@ metric_list:
- metric: !function metrics.f1_abstractive
aggregation: mean
higher_is_better: true
metadata:
- version: 1.0
......@@ -10,3 +10,5 @@ metric_list:
- metric: acc
aggregation: mean
higher_is_better: true
metadata:
- version: 2.0
......@@ -13,3 +13,5 @@ generation_kwargs:
- "\n\n"
do_sample: false
temperature: 0.0
metadata:
- version: 0.0
......@@ -17,3 +17,5 @@ metric_list:
- metric: acc_norm
aggregation: mean
higher_is_better: true
metadata:
- version: 1.0
......@@ -108,7 +108,7 @@ def _num_cpu_cores():
class _SCROLLSTask(Task):
- VERSION = 0
+ VERSION = 1
DATASET_PATH = "tau/scrolls"
DATASET_NAME = None
PRUNE_TOKENIZERS = None
......
......@@ -12,3 +12,5 @@ metric_list:
- metric: acc
aggregation: mean
higher_is_better: true
metadata:
- version: 0.0
......@@ -50,7 +50,7 @@ def _squad_agg(key, items):
@register_task("squadv2")
class SQuAD2(Task):
- VERSION = 1
+ VERSION = 2
DATASET_PATH = "squad_v2"
DATASET_NAME = None
......
......@@ -14,3 +14,5 @@ metric_list:
- metric: acc
aggregation: mean
higher_is_better: true
metadata:
- version: 1.0
......@@ -13,3 +13,5 @@ should_decontaminate: true
doc_to_decontamination_query: passage
metric_list:
- metric: acc
metadata:
- version: 2.0
......@@ -22,3 +22,5 @@ metric_list:
higher_is_better: true
ignore_case: true
ignore_punctuation: true
metadata:
- version: 0.0
......@@ -18,3 +18,5 @@ metric_list:
higher_is_better: true
ignore_case: true
ignore_punctuation: true
metadata:
- version: 0.0
......@@ -13,3 +13,5 @@ metric_list:
- metric: acc
- metric: f1
aggregation: !function "aggregate.cb_multi_fi"
metadata:
- version: 1.0
......@@ -21,3 +21,5 @@ metric_list:
- metric: !function "t5_utils.mean_3class_f1"
aggregation: !function "t5_utils.agg_mean_3class_f1"
higher_is_better: true
metadata:
- version: 0.0
......@@ -11,3 +11,5 @@ doc_to_target: !function utils.doc_to_target
doc_to_choice: !function utils.doc_to_choice
metric_list:
- metric: acc
metadata:
- version: 1.0
......@@ -18,3 +18,5 @@ metric_list:
higher_is_better: true
ignore_case: true
ignore_punctuation: true
metadata:
- version: 0.0
......@@ -11,3 +11,5 @@ doc_to_target: label
doc_to_choice: "['''{{answer}}\\nIs the answer correct? yes''', '''{{answer}}\\nIs the answer correct? no''']"
metric_list:
- metric: acc
metadata:
- version: 2.0
......@@ -19,3 +19,5 @@ metric_list:
- metric: !function t5_utils.em
aggregation: !function t5_utils.agg_em
higher_is_better: true
metadata:
- version: 0.0
......@@ -16,3 +16,5 @@ metric_list:
- metric: em
higher_is_better: True
aggregation: mean
metadata:
- version: 1.0
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment