Commit ff739414 (unverified), authored by Hailey Schoelkopf, committed by GitHub
Browse files

Fix bug in multi-token Stop Sequences (#1268)

* fix incorrect lookback protections

* bump generate_until task versions
parent 818c056b
...@@ -34,4 +34,4 @@ filter_list: ...@@ -34,4 +34,4 @@ filter_list:
regex_pattern: "#### (\\-?[0-9\\.\\,]+)" regex_pattern: "#### (\\-?[0-9\\.\\,]+)"
- function: "take_first" - function: "take_first"
metadata: metadata:
version: 1.0 version: 2.0
...@@ -26,4 +26,4 @@ metric_list: ...@@ -26,4 +26,4 @@ metric_list:
aggregation: !function utils.agg_inst_level_acc aggregation: !function utils.agg_inst_level_acc
higher_is_better: true higher_is_better: true
metadata: metadata:
version: 1.0 version: 2.0
...@@ -26,4 +26,4 @@ metric_list: ...@@ -26,4 +26,4 @@ metric_list:
ignore_case: true ignore_case: true
ignore_punctuation: true ignore_punctuation: true
metadata: metadata:
version: 0.0 version: 1.0
...@@ -28,4 +28,4 @@ filter_list: ...@@ -28,4 +28,4 @@ filter_list:
regex_pattern: "The answer is (\\-?[0-9\\.\\,]+)" regex_pattern: "The answer is (\\-?[0-9\\.\\,]+)"
- function: "take_first" - function: "take_first"
metadata: metadata:
version: 0.0 version: 1.0
...@@ -28,4 +28,4 @@ filter_list: ...@@ -28,4 +28,4 @@ filter_list:
regex_pattern: "The answer is (\\-?[0-9\\.\\,]+)" regex_pattern: "The answer is (\\-?[0-9\\.\\,]+)"
- function: "take_first" - function: "take_first"
metadata: metadata:
version: 1.0 version: 2.0
...@@ -21,4 +21,4 @@ metric_list: ...@@ -21,4 +21,4 @@ metric_list:
higher_is_better: true higher_is_better: true
num_fewshot: 0 num_fewshot: 0
metadata: metadata:
version: 0.0 version: 1.0
...@@ -29,4 +29,4 @@ metric_list: ...@@ -29,4 +29,4 @@ metric_list:
regexes_to_ignore: regexes_to_ignore:
- "\ban|a|the\b" - "\ban|a|the\b"
metadata: metadata:
version: 0.0 version: 1.0
...@@ -42,4 +42,4 @@ metric_list: ...@@ -42,4 +42,4 @@ metric_list:
aggregation: mean aggregation: mean
higher_is_better: true higher_is_better: true
metadata: metadata:
version: 0.0 version: 1.0
...@@ -15,4 +15,4 @@ metric_list: ...@@ -15,4 +15,4 @@ metric_list:
aggregation: mean aggregation: mean
higher_is_better: true higher_is_better: true
metadata: metadata:
version: 1.0 version: 2.0
...@@ -108,7 +108,7 @@ def _num_cpu_cores(): ...@@ -108,7 +108,7 @@ def _num_cpu_cores():
class _SCROLLSTask(Task): class _SCROLLSTask(Task):
VERSION = 1 VERSION = 2
DATASET_PATH = "tau/scrolls" DATASET_PATH = "tau/scrolls"
DATASET_NAME = None DATASET_NAME = None
PRUNE_TOKENIZERS = None PRUNE_TOKENIZERS = None
......
...@@ -49,7 +49,7 @@ def _squad_agg(key, items): ...@@ -49,7 +49,7 @@ def _squad_agg(key, items):
@register_task("squadv2") @register_task("squadv2")
class SQuAD2(Task): class SQuAD2(Task):
VERSION = 2 VERSION = 3
DATASET_PATH = "squad_v2" DATASET_PATH = "squad_v2"
DATASET_NAME = None DATASET_NAME = None
......
...@@ -14,4 +14,4 @@ generation_kwargs: ...@@ -14,4 +14,4 @@ generation_kwargs:
temperature: 0.0 temperature: 0.0
repeats: 1 repeats: 1
metadata: metadata:
version: 0.0 version: 1.0
...@@ -28,4 +28,4 @@ metric_list: ...@@ -28,4 +28,4 @@ metric_list:
ignore_case: true ignore_case: true
ignore_punctuation: true ignore_punctuation: true
metadata: metadata:
version: 2.0 version: 3.0
...@@ -76,4 +76,4 @@ metric_list: ...@@ -76,4 +76,4 @@ metric_list:
aggregation: mean aggregation: mean
higher_is_better: true higher_is_better: true
metadata: metadata:
version: 2.0 version: 3.0
...@@ -17,4 +17,4 @@ metric_list: ...@@ -17,4 +17,4 @@ metric_list:
ignore_case: false ignore_case: false
ignore_punctuation: false ignore_punctuation: false
metadata: metadata:
version: 1.0 version: 2.0
...@@ -17,4 +17,4 @@ metric_list: ...@@ -17,4 +17,4 @@ metric_list:
ignore_case: false ignore_case: false
ignore_punctuation: false ignore_punctuation: false
metadata: metadata:
version: 1.0 version: 2.0
...@@ -17,4 +17,4 @@ metric_list: ...@@ -17,4 +17,4 @@ metric_list:
ignore_case: false ignore_case: false
ignore_punctuation: false ignore_punctuation: false
metadata: metadata:
version: 1.0 version: 2.0
...@@ -17,4 +17,4 @@ metric_list: ...@@ -17,4 +17,4 @@ metric_list:
ignore_case: false ignore_case: false
ignore_punctuation: false ignore_punctuation: false
metadata: metadata:
version: 1.0 version: 2.0
...@@ -17,4 +17,4 @@ metric_list: ...@@ -17,4 +17,4 @@ metric_list:
ignore_case: false ignore_case: false
ignore_punctuation: false ignore_punctuation: false
metadata: metadata:
version: 1.0 version: 2.0
...@@ -17,4 +17,4 @@ metric_list: ...@@ -17,4 +17,4 @@ metric_list:
aggregation: mean aggregation: mean
higher_is_better: true higher_is_better: true
metadata: metadata:
version: 1.0 version: 2.0
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment