Unverified Commit e5dfd030 authored by Lintang Sutawika's avatar Lintang Sutawika Committed by GitHub
Browse files

Merge pull request #1074 from EleutherAI/lintangsutawika-patch-4

Update _cot_fewshot_template_yaml
parents f0b96491 965c5330
...@@ -3,7 +3,7 @@ ...@@ -3,7 +3,7 @@
[![DOI](https://zenodo.org/badge/DOI/10.5281/zenodo.10256836.svg)](https://doi.org/10.5281/zenodo.10256836) [![DOI](https://zenodo.org/badge/DOI/10.5281/zenodo.10256836.svg)](https://doi.org/10.5281/zenodo.10256836)
## Announcement ## Announcement
**A new v0.4.0 release of lm-evaluation-harness is available** ! **A new v0.4.0 release of lm-evaluation-harness is available** !
New updates and features include: New updates and features include:
......
...@@ -24,5 +24,6 @@ filter_list: ...@@ -24,5 +24,6 @@ filter_list:
- function: "regex" - function: "regex"
regex_pattern: "(?<=the answer is )(.*)(?=.)" regex_pattern: "(?<=the answer is )(.*)(?=.)"
- function: "take_first" - function: "take_first"
num_fewshot: 0
metadata: metadata:
- version: 0.0 - version: 0.0
...@@ -22,5 +22,6 @@ filter_list: ...@@ -22,5 +22,6 @@ filter_list:
- function: "regex" - function: "regex"
regex_pattern: "((?<=The answer is )(.*)(?=.)|(?<=the answer is )(.*)(?=.)|(?<=The answer: )(.*)(?=.)|(?<=The final answer: )(.*)(?=.))" regex_pattern: "((?<=The answer is )(.*)(?=.)|(?<=the answer is )(.*)(?=.)|(?<=The answer: )(.*)(?=.)|(?<=The final answer: )(.*)(?=.))"
- function: "take_first" - function: "take_first"
num_fewshot: 0
metadata: metadata:
- version: 0 - version: 0
...@@ -16,5 +16,6 @@ generation_kwargs: ...@@ -16,5 +16,6 @@ generation_kwargs:
- "\n\n" - "\n\n"
do_sample: false do_sample: false
temperature: 0.0 temperature: 0.0
num_fewshot: 0
metadata: metadata:
- version: 0 - version: 0
...@@ -16,5 +16,6 @@ generation_kwargs: ...@@ -16,5 +16,6 @@ generation_kwargs:
- "\n\n" - "\n\n"
do_sample: false do_sample: false
temperature: 0.0 temperature: 0.0
num_fewshot: 0
metadata: metadata:
- version: 0 - version: 0
...@@ -19,5 +19,6 @@ metric_list: ...@@ -19,5 +19,6 @@ metric_list:
- metric: exact_match - metric: exact_match
aggregation: mean aggregation: mean
higher_is_better: true higher_is_better: true
num_fewshot: 0
metadata: metadata:
- version: 0.0 - version: 0.0
...@@ -15,6 +15,7 @@ generation_kwargs: ...@@ -15,6 +15,7 @@ generation_kwargs:
- "</s>" - "</s>"
do_sample: false do_sample: false
temperature: 0.0 temperature: 0.0
num_fewshot: 0
metric_list: metric_list:
- metric: exact_match - metric: exact_match
aggregation: mean aggregation: mean
......
...@@ -15,6 +15,7 @@ generation_kwargs: ...@@ -15,6 +15,7 @@ generation_kwargs:
- "</s>" - "</s>"
do_sample: false do_sample: false
temperature: 0.0 temperature: 0.0
num_fewshot: 0
metric_list: metric_list:
- metric: exact_match - metric: exact_match
aggregation: mean aggregation: mean
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment