Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
lm-evaluation-harness
Commits
8371662c
Unverified
Commit
8371662c
authored
Feb 24, 2024
by
thnkinbtfly
Committed by
GitHub
Feb 23, 2024
Browse files
update parsing logic of mgsm following gsm8k (#1462)
parent
75ac1f47
Changes
37
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
123 additions
and
3 deletions
+123
-3
lm_eval/tasks/mgsm/direct/direct_yaml
lm_eval/tasks/mgsm/direct/direct_yaml
+7
-1
lm_eval/tasks/mgsm/direct/mgsm_direct_bn.yaml
lm_eval/tasks/mgsm/direct/mgsm_direct_bn.yaml
+6
-0
lm_eval/tasks/mgsm/direct/mgsm_direct_de.yaml
lm_eval/tasks/mgsm/direct/mgsm_direct_de.yaml
+6
-0
lm_eval/tasks/mgsm/direct/mgsm_direct_en.yaml
lm_eval/tasks/mgsm/direct/mgsm_direct_en.yaml
+6
-0
lm_eval/tasks/mgsm/direct/mgsm_direct_es.yaml
lm_eval/tasks/mgsm/direct/mgsm_direct_es.yaml
+6
-0
lm_eval/tasks/mgsm/direct/mgsm_direct_fr.yaml
lm_eval/tasks/mgsm/direct/mgsm_direct_fr.yaml
+6
-0
lm_eval/tasks/mgsm/direct/mgsm_direct_ja.yaml
lm_eval/tasks/mgsm/direct/mgsm_direct_ja.yaml
+6
-0
lm_eval/tasks/mgsm/direct/mgsm_direct_ru.yaml
lm_eval/tasks/mgsm/direct/mgsm_direct_ru.yaml
+6
-0
lm_eval/tasks/mgsm/direct/mgsm_direct_sw.yaml
lm_eval/tasks/mgsm/direct/mgsm_direct_sw.yaml
+6
-0
lm_eval/tasks/mgsm/direct/mgsm_direct_te.yaml
lm_eval/tasks/mgsm/direct/mgsm_direct_te.yaml
+6
-0
lm_eval/tasks/mgsm/direct/mgsm_direct_th.yaml
lm_eval/tasks/mgsm/direct/mgsm_direct_th.yaml
+6
-0
lm_eval/tasks/mgsm/direct/mgsm_direct_zh.yaml
lm_eval/tasks/mgsm/direct/mgsm_direct_zh.yaml
+6
-0
lm_eval/tasks/mgsm/en_cot/cot_yaml
lm_eval/tasks/mgsm/en_cot/cot_yaml
+8
-2
lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_bn.yaml
lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_bn.yaml
+6
-0
lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_de.yaml
lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_de.yaml
+6
-0
lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_en.yaml
lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_en.yaml
+6
-0
lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_es.yaml
lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_es.yaml
+6
-0
lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_fr.yaml
lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_fr.yaml
+6
-0
lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_ja.yaml
lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_ja.yaml
+6
-0
lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_ru.yaml
lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_ru.yaml
+6
-0
No files found.
lm_eval/tasks/mgsm/direct/direct_yaml
View file @
8371662c
...
@@ -19,6 +19,12 @@ filter_list:
...
@@ -19,6 +19,12 @@ filter_list:
filter:
filter:
- function: remove_whitespace
- function: remove_whitespace
- function: take_first
- function: take_first
- filter:
- function: regex
group_select: -1
regex_pattern: (-?[$0-9.,]{2,})|(-?[0-9]+)
- function: take_first
name: flexible-extract
metric_list:
metric_list:
- metric: exact_match
- metric: exact_match
aggregation: mean
aggregation: mean
...
@@ -26,4 +32,4 @@ metric_list:
...
@@ -26,4 +32,4 @@ metric_list:
ignore_case: true
ignore_case: true
ignore_punctuation: true
ignore_punctuation: true
metadata:
metadata:
version:
1
.0
version:
2
.0
lm_eval/tasks/mgsm/direct/mgsm_direct_bn.yaml
View file @
8371662c
...
@@ -2,5 +2,11 @@
...
@@ -2,5 +2,11 @@
dataset_name
:
bn
dataset_name
:
bn
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[17:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[17:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nAnswer:"}}{%
else
%}{{"প্রশ্ন:
"+question+"\nAnswer:"}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nAnswer:"}}{%
else
%}{{"প্রশ্ন:
"+question+"\nAnswer:"}}{%
endif
%}'
generation_kwargs
:
do_sample
:
false
until
:
-
'
প্রশ্ন:'
-
</s>
-
<|im_end|>
include
:
direct_yaml
include
:
direct_yaml
task
:
mgsm_direct_bn
task
:
mgsm_direct_bn
lm_eval/tasks/mgsm/direct/mgsm_direct_de.yaml
View file @
8371662c
...
@@ -2,5 +2,11 @@
...
@@ -2,5 +2,11 @@
dataset_name
:
de
dataset_name
:
de
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[29:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[29:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nAntwort:"}}{%
else
%}{{"Frage:
"+question+"\nAntwort:"}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nAntwort:"}}{%
else
%}{{"Frage:
"+question+"\nAntwort:"}}{%
endif
%}'
generation_kwargs
:
do_sample
:
false
until
:
-
'
Frage:'
-
</s>
-
<|im_end|>
include
:
direct_yaml
include
:
direct_yaml
task
:
mgsm_direct_de
task
:
mgsm_direct_de
lm_eval/tasks/mgsm/direct/mgsm_direct_en.yaml
View file @
8371662c
...
@@ -2,5 +2,11 @@
...
@@ -2,5 +2,11 @@
dataset_name
:
en
dataset_name
:
en
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[21:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[21:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nAnswer:"}}{%
else
%}{{"Question:
"+question+"\nAnswer:"}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nAnswer:"}}{%
else
%}{{"Question:
"+question+"\nAnswer:"}}{%
endif
%}'
generation_kwargs
:
do_sample
:
false
until
:
-
'
Question:'
-
</s>
-
<|im_end|>
include
:
direct_yaml
include
:
direct_yaml
task
:
mgsm_direct_en
task
:
mgsm_direct_en
lm_eval/tasks/mgsm/direct/mgsm_direct_es.yaml
View file @
8371662c
...
@@ -2,5 +2,11 @@
...
@@ -2,5 +2,11 @@
dataset_name
:
es
dataset_name
:
es
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[23:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[23:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nRespuesta:"}}{%
else
%}{{"Pregunta:
"+question+"\nRespuesta:"}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nRespuesta:"}}{%
else
%}{{"Pregunta:
"+question+"\nRespuesta:"}}{%
endif
%}'
generation_kwargs
:
do_sample
:
false
until
:
-
'
Pregunta:'
-
</s>
-
<|im_end|>
include
:
direct_yaml
include
:
direct_yaml
task
:
mgsm_direct_es
task
:
mgsm_direct_es
lm_eval/tasks/mgsm/direct/mgsm_direct_fr.yaml
View file @
8371662c
...
@@ -2,5 +2,11 @@
...
@@ -2,5 +2,11 @@
dataset_name
:
fr
dataset_name
:
fr
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[26:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[26:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nRéponse
:"}}{%
else
%}{{"Question
:
"+question+"\nRéponse
:"}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nRéponse
:"}}{%
else
%}{{"Question
:
"+question+"\nRéponse
:"}}{%
endif
%}'
generation_kwargs
:
do_sample
:
false
until
:
-
'
Question
:'
-
</s>
-
<|im_end|>
include
:
direct_yaml
include
:
direct_yaml
task
:
mgsm_direct_fr
task
:
mgsm_direct_fr
lm_eval/tasks/mgsm/direct/mgsm_direct_ja.yaml
View file @
8371662c
...
@@ -2,5 +2,11 @@
...
@@ -2,5 +2,11 @@
dataset_name
:
ja
dataset_name
:
ja
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[11:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[11:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nAnswer:"}}{%
else
%}{{"問題:
"+question+"\nAnswer:"}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nAnswer:"}}{%
else
%}{{"問題:
"+question+"\nAnswer:"}}{%
endif
%}'
generation_kwargs
:
do_sample
:
false
until
:
-
'
問題:'
-
</s>
-
<|im_end|>
include
:
direct_yaml
include
:
direct_yaml
task
:
mgsm_direct_ja
task
:
mgsm_direct_ja
lm_eval/tasks/mgsm/direct/mgsm_direct_ru.yaml
View file @
8371662c
...
@@ -2,5 +2,11 @@
...
@@ -2,5 +2,11 @@
dataset_name
:
ru
dataset_name
:
ru
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[18:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[18:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nAnswer:"}}{%
else
%}{{"Задача:
"+question+"\nAnswer:"}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nAnswer:"}}{%
else
%}{{"Задача:
"+question+"\nAnswer:"}}{%
endif
%}'
generation_kwargs
:
do_sample
:
false
until
:
-
'
Задача:'
-
</s>
-
<|im_end|>
include
:
direct_yaml
include
:
direct_yaml
task
:
mgsm_direct_ru
task
:
mgsm_direct_ru
lm_eval/tasks/mgsm/direct/mgsm_direct_sw.yaml
View file @
8371662c
...
@@ -2,5 +2,11 @@
...
@@ -2,5 +2,11 @@
dataset_name
:
sw
dataset_name
:
sw
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[25:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[25:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nAnswer:"}}{%
else
%}{{"Swali:
"+question+"\nAnswer:"}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nAnswer:"}}{%
else
%}{{"Swali:
"+question+"\nAnswer:"}}{%
endif
%}'
generation_kwargs
:
do_sample
:
false
until
:
-
'
Swali:'
-
</s>
-
<|im_end|>
include
:
direct_yaml
include
:
direct_yaml
task
:
mgsm_direct_sw
task
:
mgsm_direct_sw
lm_eval/tasks/mgsm/direct/mgsm_direct_te.yaml
View file @
8371662c
...
@@ -2,5 +2,11 @@
...
@@ -2,5 +2,11 @@
dataset_name
:
te
dataset_name
:
te
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[19:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[19:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nAnswer:"}}{%
else
%}{{"ప్రశ్న:
"+question+"\nAnswer:"}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nAnswer:"}}{%
else
%}{{"ప్రశ్న:
"+question+"\nAnswer:"}}{%
endif
%}'
generation_kwargs
:
do_sample
:
false
until
:
-
'
ప్రశ్న:'
-
</s>
-
<|im_end|>
include
:
direct_yaml
include
:
direct_yaml
task
:
mgsm_direct_te
task
:
mgsm_direct_te
lm_eval/tasks/mgsm/direct/mgsm_direct_th.yaml
View file @
8371662c
...
@@ -2,5 +2,11 @@
...
@@ -2,5 +2,11 @@
dataset_name
:
th
dataset_name
:
th
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[18:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[18:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nAnswer:"}}{%
else
%}{{"โจทย์:
"+question+"\nAnswer:"}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nAnswer:"}}{%
else
%}{{"โจทย์:
"+question+"\nAnswer:"}}{%
endif
%}'
generation_kwargs
:
do_sample
:
false
until
:
-
'
โจทย์:'
-
</s>
-
<|im_end|>
include
:
direct_yaml
include
:
direct_yaml
task
:
mgsm_direct_th
task
:
mgsm_direct_th
lm_eval/tasks/mgsm/direct/mgsm_direct_zh.yaml
View file @
8371662c
...
@@ -2,5 +2,11 @@
...
@@ -2,5 +2,11 @@
dataset_name
:
zh
dataset_name
:
zh
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[6:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[6:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nAnswer:"}}{%
else
%}{{"问题:
"+question+"\nAnswer:"}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nAnswer:"}}{%
else
%}{{"问题:
"+question+"\nAnswer:"}}{%
endif
%}'
generation_kwargs
:
do_sample
:
false
until
:
-
'
问题:'
-
</s>
-
<|im_end|>
include
:
direct_yaml
include
:
direct_yaml
task
:
mgsm_direct_zh
task
:
mgsm_direct_zh
lm_eval/tasks/mgsm/en_cot/cot_yaml
View file @
8371662c
...
@@ -21,10 +21,16 @@ metric_list:
...
@@ -21,10 +21,16 @@ metric_list:
ignore_case: true
ignore_case: true
ignore_punctuation: true
ignore_punctuation: true
filter_list:
filter_list:
- name: "
get-answer
"
- name: "
strict-match
"
filter:
filter:
- function: "regex"
- function: "regex"
regex_pattern: "The answer is (\\-?[0-9\\.\\,]+)"
regex_pattern: "The answer is (\\-?[0-9\\.\\,]+)"
- function: "take_first"
- function: "take_first"
- filter:
- function: regex
group_select: -1
regex_pattern: (-?[$0-9.,]{2,})|(-?[0-9]+)
- function: take_first
name: flexible-extract
metadata:
metadata:
version:
1
.0
version:
2
.0
lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_bn.yaml
View file @
8371662c
...
@@ -2,5 +2,11 @@
...
@@ -2,5 +2,11 @@
dataset_name
:
bn
dataset_name
:
bn
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[17:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[17:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nStep-by-Step
Answer:"}}{%
else
%}{{"প্রশ্ন:
"+question+"\nStep-by-Step
Answer:"}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nStep-by-Step
Answer:"}}{%
else
%}{{"প্রশ্ন:
"+question+"\nStep-by-Step
Answer:"}}{%
endif
%}'
generation_kwargs
:
do_sample
:
false
until
:
-
'
প্রশ্ন:'
-
</s>
-
<|im_end|>
include
:
cot_yaml
include
:
cot_yaml
task
:
mgsm_en_cot_bn
task
:
mgsm_en_cot_bn
lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_de.yaml
View file @
8371662c
...
@@ -2,5 +2,11 @@
...
@@ -2,5 +2,11 @@
dataset_name
:
de
dataset_name
:
de
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[29:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[29:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nStep-by-Step
Answer:"}}{%
else
%}{{"Frage:
"+question+"\nStep-by-Step
Answer:"}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nStep-by-Step
Answer:"}}{%
else
%}{{"Frage:
"+question+"\nStep-by-Step
Answer:"}}{%
endif
%}'
generation_kwargs
:
do_sample
:
false
until
:
-
'
Frage:'
-
</s>
-
<|im_end|>
include
:
cot_yaml
include
:
cot_yaml
task
:
mgsm_en_cot_de
task
:
mgsm_en_cot_de
lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_en.yaml
View file @
8371662c
...
@@ -2,5 +2,11 @@
...
@@ -2,5 +2,11 @@
dataset_name
:
en
dataset_name
:
en
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[21:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[21:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nStep-by-Step
Answer:"}}{%
else
%}{{"Question:
"+question+"\nStep-by-Step
Answer:"}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nStep-by-Step
Answer:"}}{%
else
%}{{"Question:
"+question+"\nStep-by-Step
Answer:"}}{%
endif
%}'
generation_kwargs
:
do_sample
:
false
until
:
-
'
Question:'
-
</s>
-
<|im_end|>
include
:
cot_yaml
include
:
cot_yaml
task
:
mgsm_en_cot_en
task
:
mgsm_en_cot_en
lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_es.yaml
View file @
8371662c
...
@@ -2,5 +2,11 @@
...
@@ -2,5 +2,11 @@
dataset_name
:
es
dataset_name
:
es
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[23:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[23:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nStep-by-Step
Answer:"}}{%
else
%}{{"Pregunta:
"+question+"\nStep-by-Step
Answer:"}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nStep-by-Step
Answer:"}}{%
else
%}{{"Pregunta:
"+question+"\nStep-by-Step
Answer:"}}{%
endif
%}'
generation_kwargs
:
do_sample
:
false
until
:
-
'
Pregunta:'
-
</s>
-
<|im_end|>
include
:
cot_yaml
include
:
cot_yaml
task
:
mgsm_en_cot_es
task
:
mgsm_en_cot_es
lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_fr.yaml
View file @
8371662c
...
@@ -2,5 +2,11 @@
...
@@ -2,5 +2,11 @@
dataset_name
:
fr
dataset_name
:
fr
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[26:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[26:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nStep-by-Step
Answer:"}}{%
else
%}{{"Question
:
"+question+"\nStep-by-Step
Answer:"}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nStep-by-Step
Answer:"}}{%
else
%}{{"Question
:
"+question+"\nStep-by-Step
Answer:"}}{%
endif
%}'
generation_kwargs
:
do_sample
:
false
until
:
-
'
Question
:'
-
</s>
-
<|im_end|>
include
:
cot_yaml
include
:
cot_yaml
task
:
mgsm_en_cot_fr
task
:
mgsm_en_cot_fr
lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_ja.yaml
View file @
8371662c
...
@@ -2,5 +2,11 @@
...
@@ -2,5 +2,11 @@
dataset_name
:
ja
dataset_name
:
ja
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[11:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[11:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nStep-by-Step
Answer:"}}{%
else
%}{{"問題:
"+question+"\nStep-by-Step
Answer:"}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nStep-by-Step
Answer:"}}{%
else
%}{{"問題:
"+question+"\nStep-by-Step
Answer:"}}{%
endif
%}'
generation_kwargs
:
do_sample
:
false
until
:
-
'
問題:'
-
</s>
-
<|im_end|>
include
:
cot_yaml
include
:
cot_yaml
task
:
mgsm_en_cot_ja
task
:
mgsm_en_cot_ja
lm_eval/tasks/mgsm/en_cot/mgsm_en_cot_ru.yaml
View file @
8371662c
...
@@ -2,5 +2,11 @@
...
@@ -2,5 +2,11 @@
dataset_name
:
ru
dataset_name
:
ru
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[18:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_target
:
'
{%
if
answer
is
not
none
%}{{answer[18:]}}{%
else
%}{{answer_number|string}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nStep-by-Step
Answer:"}}{%
else
%}{{"Задача:
"+question+"\nStep-by-Step
Answer:"}}{%
endif
%}'
doc_to_text
:
'
{%
if
answer
is
not
none
%}{{question+"\nStep-by-Step
Answer:"}}{%
else
%}{{"Задача:
"+question+"\nStep-by-Step
Answer:"}}{%
endif
%}'
generation_kwargs
:
do_sample
:
false
until
:
-
'
Задача:'
-
</s>
-
<|im_end|>
include
:
cot_yaml
include
:
cot_yaml
task
:
mgsm_en_cot_ru
task
:
mgsm_en_cot_ru
Prev
1
2
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment