Unverified commit 26bc3eab, authored by Lintang Sutawika and committed by GitHub
Browse files

Merge branch 'big-refactor' into model-written-eval

parents 0d701496 cf617ab1
# Generated by utils.py
dataset_name: word_sorting_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_word_sorting_greedy_until
include: ../generate_until_template_yaml
task: bigbench_word_sorting_generate_until
# Generated by utils.py
dataset_name: word_unscrambling_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_word_unscrambling_greedy_until
include: ../generate_until_template_yaml
task: bigbench_word_unscrambling_generate_until
group: bigbench
dataset_path: bigbench # will switch to `hails/bigbench` when all tasks are pushed
output_type: greedy_until
output_type: generate_until
dataset_kwargs:
# num_shots: 0 # TODO: num of shots for `bigbench` HF dataset should be controlled through this, not through the typical methods
# subtask_name: null
......
......@@ -5,7 +5,7 @@ dataset_path: CM/codexglue_code2text_go
training_split: train
validation_split: validation
test_split: test
output_type: greedy_until
output_type: generate_until
generation_kwargs:
num_beams: 10
max_length: 128
......
......@@ -5,7 +5,7 @@ dataset_path: CM/codexglue_code2text_java
training_split: train
validation_split: validation
test_split: test
output_type: greedy_until
output_type: generate_until
generation_kwargs:
num_beams: 10
max_length: 128
......
......@@ -5,7 +5,7 @@ dataset_path: CM/codexglue_code2text_javascript
training_split: train
validation_split: validation
test_split: test
output_type: greedy_until
output_type: generate_until
generation_kwargs:
num_beams: 10
max_length: 128
......
......@@ -5,7 +5,7 @@ dataset_path: CM/codexglue_code2text_php
training_split: train
validation_split: validation
test_split: test
output_type: greedy_until
output_type: generate_until
generation_kwargs:
num_beams: 10
max_length: 128
......
......@@ -5,7 +5,7 @@ dataset_path: CM/codexglue_code2text_python
training_split: train
validation_split: validation
test_split: test
output_type: greedy_until
output_type: generate_until
generation_kwargs:
num_beams: 10
max_length: 128
......
......@@ -5,7 +5,7 @@ dataset_path: CM/codexglue_code2text_ruby
training_split: train
validation_split: validation
test_split: test
output_type: greedy_until
output_type: generate_until
generation_kwargs:
num_beams: 10
max_length: 128
......
task: coqa
dataset_path: EleutherAI/coqa
output_type: greedy_until
output_type: generate_until
training_split: train
validation_split: validation
doc_to_text: !function utils.doc_to_text
......
task: drop
dataset_path: EleutherAI/drop
output_type: greedy_until
output_type: generate_until
training_split: train
validation_split: validation
process_docs: !function utils.process_docs
......
......@@ -3,7 +3,7 @@ group:
task: gsm8k_cot
dataset_path: gsm8k
dataset_name: main
output_type: greedy_until
output_type: generate_until
test_split: test
doc_to_text: "Q: There are 15 trees in the grove. Grove workers will plant trees in the grove today. After they are done, there will be 21 trees. How many trees did the grove workers plant today?\n\nA: There are 15 trees originally. Then there were 21 trees after some more were planted. So there must have been 21 - 15 = 6. The answer is 6.\n\n\
Q: If there are 3 cars in the parking lot and 2 more cars arrive, how many cars are in the parking lot?\n\nA: There are originally 3 cars. 2 more cars arrive. 3 + 2 = 5. The answer is 5.\n\n\
......
......@@ -3,7 +3,7 @@ group:
task: gsm8k_yaml
dataset_path: gsm8k
dataset_name: main
output_type: greedy_until
output_type: generate_until
training_split: train
fewshot_split: train
test_split: test
......
task: logieval
dataset_path: baber/logiqa2
dataset_name: logieval
output_type: greedy_until
output_type: generate_until
training_split: train
test_split: test
# Instructions + {content}
......
......@@ -4,7 +4,7 @@
group: mgsm_direct
dataset_path: juletxara/mgsm
dataset_name: null # Overridden by language-specific config.
output_type: greedy_until
output_type: generate_until
training_split: train
test_split: test
target_delimiter: ""
......
......@@ -4,7 +4,7 @@
group: mgsm_cot_native
dataset_path: juletxara/mgsm
dataset_name: null # Overridden by language-specific config.
output_type: greedy_until
output_type: generate_until
training_split: train
test_split: test
target_delimiter: ""
......
......@@ -4,7 +4,7 @@
group: mgsm_cot_native
dataset_path: juletxara/mgsm
dataset_name: null # Overridden by language-specific config.
output_type: greedy_until
output_type: generate_until
training_split: train
test_split: test
target_delimiter: ""
......
......@@ -37,7 +37,7 @@ Eprint = {arXiv:2206.14858},
#### Groups
- `math_word_problems`
- `greedy_until`
- `generate_until`
#### Tasks
......
......@@ -4,7 +4,7 @@ task: minerva_math_algebra
dataset_path: EleutherAI/hendrycks_math
process_docs: !function utils.process_docs
dataset_name: algebra
output_type: greedy_until
output_type: generate_until
training_split: train
test_split: test
doc_to_text: !function utils.doc_to_text
......
......@@ -2,7 +2,7 @@ group: mmlu_flan_cot_fewshot
dataset_path: cais/mmlu
validation_split: validation
fewshot_split: dev
output_type: greedy_until
output_type: generate_until
doc_to_text: "Q: {{question.strip()}}\n(A) {{choices[0]}} (B) {{choices[1]}} (C) {{choices[2]}} (D) {{choices[3]}}\nA: Let's think step by step."
doc_to_target: "{{['(A)', '(B)', '(C)', '(D)'][answer]}}"
filter_list:
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment