Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
lm-evaluation-harness
Commits
3e9c9a95
Commit
3e9c9a95
authored
Aug 16, 2023
by
lintangsutawika
Browse files
add mgsm yamls
parent
416a3ca1
Changes
13
Hide whitespace changes
Inline
Side-by-side
Showing
13 changed files
with
105 additions
and
17 deletions
+105
-17
lm_eval/tasks/mgsm/common_template_yaml
lm_eval/tasks/mgsm/common_template_yaml
+6
-0
lm_eval/tasks/mgsm/mgsm_bn.yaml
lm_eval/tasks/mgsm/mgsm_bn.yaml
+8
-0
lm_eval/tasks/mgsm/mgsm_de.yaml
lm_eval/tasks/mgsm/mgsm_de.yaml
+8
-0
lm_eval/tasks/mgsm/mgsm_en.yaml
lm_eval/tasks/mgsm/mgsm_en.yaml
+8
-0
lm_eval/tasks/mgsm/mgsm_es.yaml
lm_eval/tasks/mgsm/mgsm_es.yaml
+8
-0
lm_eval/tasks/mgsm/mgsm_fr.yaml
lm_eval/tasks/mgsm/mgsm_fr.yaml
+8
-0
lm_eval/tasks/mgsm/mgsm_ja.yaml
lm_eval/tasks/mgsm/mgsm_ja.yaml
+8
-0
lm_eval/tasks/mgsm/mgsm_ru.yaml
lm_eval/tasks/mgsm/mgsm_ru.yaml
+8
-0
lm_eval/tasks/mgsm/mgsm_sw.yaml
lm_eval/tasks/mgsm/mgsm_sw.yaml
+8
-0
lm_eval/tasks/mgsm/mgsm_te.yaml
lm_eval/tasks/mgsm/mgsm_te.yaml
+8
-0
lm_eval/tasks/mgsm/mgsm_th.yaml
lm_eval/tasks/mgsm/mgsm_th.yaml
+8
-0
lm_eval/tasks/mgsm/mgsm_zh.yaml
lm_eval/tasks/mgsm/mgsm_zh.yaml
+8
-0
lm_eval/tasks/mgsm/utils.py
lm_eval/tasks/mgsm/utils.py
+11
-17
No files found.
lm_eval/tasks/mgsm/common_template_yaml
View file @
3e9c9a95
...
...
@@ -14,6 +14,12 @@ generation_kwargs:
- "\n"
do_sample: false
temperature: 0.0
filter_list:
- name: remove_whitespace
filter:
- function: remove_whitespace
- function: take_first
target_delimiter: " "
metric_list:
- metric: exact_match
aggregation: mean
...
...
lm_eval/tasks/mgsm/mgsm_bn.yaml
0 → 100644
View file @
3e9c9a95
# Generated by utils.py
dataset_name: bn
# Target: when `answer` is present, keep everything after its first 16+1
# characters (slice `[16+1:]`; a bare index `[16+1]` would yield a single
# character). Otherwise fall back to `answer_number` rendered as a string.
doc_to_target: '{% if answer is not none %}{{answer[16+1:]}}{% else %}{{answer_number|string}}{% endif %}'
# Prompt: the question followed by the step-by-step answer cue; the question
# label is prepended only when `answer` is none.
doc_to_text: '{% if answer is not none %}{{question+"\nধাপে ধাপে উত্তর:"}}{% else %}{{"প্রশ্ন: "+question+"\nধাপে ধাপে উত্তর:"}}{% endif %}'
include: common_template_yaml
task: mgsm_bn
lm_eval/tasks/mgsm/mgsm_de.yaml
0 → 100644
View file @
3e9c9a95
# Generated by utils.py
dataset_name: de
# Target: when `answer` is present, keep everything after its first 28+1
# characters (slice `[28+1:]`; a bare index `[28+1]` would yield a single
# character). Otherwise fall back to `answer_number` rendered as a string.
doc_to_target: '{% if answer is not none %}{{answer[28+1:]}}{% else %}{{answer_number|string}}{% endif %}'
# Prompt: the question followed by the step-by-step answer cue; the question
# label is prepended only when `answer` is none.
doc_to_text: '{% if answer is not none %}{{question+"\nSchritt-für-Schritt-Antwort:"}}{% else %}{{"Frage: "+question+"\nSchritt-für-Schritt-Antwort:"}}{% endif %}'
include: common_template_yaml
task: mgsm_de
lm_eval/tasks/mgsm/mgsm_en.yaml
0 → 100644
View file @
3e9c9a95
# Generated by utils.py
dataset_name: en
# Target: when `answer` is present, keep everything after its first 20+1
# characters (slice `[20+1:]`; a bare index `[20+1]` would yield a single
# character). Otherwise fall back to `answer_number` rendered as a string.
doc_to_target: '{% if answer is not none %}{{answer[20+1:]}}{% else %}{{answer_number|string}}{% endif %}'
# Prompt: the question followed by the step-by-step answer cue; the question
# label is prepended only when `answer` is none.
doc_to_text: '{% if answer is not none %}{{question+"\nStep-by-Step Answer:"}}{% else %}{{"Question: "+question+"\nStep-by-Step Answer:"}}{% endif %}'
include: common_template_yaml
task: mgsm_en
lm_eval/tasks/mgsm/mgsm_es.yaml
0 → 100644
View file @
3e9c9a95
# Generated by utils.py
dataset_name: es
# Target: when `answer` is present, keep everything after its first 22+1
# characters (slice `[22+1:]`; a bare index `[22+1]` would yield a single
# character). Otherwise fall back to `answer_number` rendered as a string.
doc_to_target: '{% if answer is not none %}{{answer[22+1:]}}{% else %}{{answer_number|string}}{% endif %}'
# Prompt: the question followed by the step-by-step answer cue; the question
# label is prepended only when `answer` is none.
doc_to_text: '{% if answer is not none %}{{question+"\nRespuesta paso a paso:"}}{% else %}{{"Pregunta: "+question+"\nRespuesta paso a paso:"}}{% endif %}'
include: common_template_yaml
task: mgsm_es
lm_eval/tasks/mgsm/mgsm_fr.yaml
0 → 100644
View file @
3e9c9a95
# Generated by utils.py
dataset_name: fr
# Target: when `answer` is present, keep everything after its first 25+1
# characters (slice `[25+1:]`; a bare index `[25+1]` would yield a single
# character). Otherwise fall back to `answer_number` rendered as a string.
doc_to_target: '{% if answer is not none %}{{answer[25+1:]}}{% else %}{{answer_number|string}}{% endif %}'
# Prompt: the question followed by the step-by-step answer cue; the question
# label is prepended only when `answer` is none.
doc_to_text: '{% if answer is not none %}{{question+"\nRéponse étape par étape :"}}{% else %}{{"Question : "+question+"\nRéponse étape par étape :"}}{% endif %}'
include: common_template_yaml
task: mgsm_fr
lm_eval/tasks/mgsm/mgsm_ja.yaml
0 → 100644
View file @
3e9c9a95
# Generated by utils.py
dataset_name: ja
# Target: when `answer` is present, keep everything after its first 10+1
# characters (slice `[10+1:]`; a bare index `[10+1]` would yield a single
# character). Otherwise fall back to `answer_number` rendered as a string.
doc_to_target: '{% if answer is not none %}{{answer[10+1:]}}{% else %}{{answer_number|string}}{% endif %}'
# Prompt: the question followed by the step-by-step answer cue; the question
# label is prepended only when `answer` is none.
doc_to_text: '{% if answer is not none %}{{question+"\nステップごとの答え:"}}{% else %}{{"問題: "+question+"\nステップごとの答え:"}}{% endif %}'
include: common_template_yaml
task: mgsm_ja
lm_eval/tasks/mgsm/mgsm_ru.yaml
0 → 100644
View file @
3e9c9a95
# Generated by utils.py
dataset_name: ru
# Target: when `answer` is present, keep everything after its first 17+1
# characters (slice `[17+1:]`; a bare index `[17+1]` would yield a single
# character). Otherwise fall back to `answer_number` rendered as a string.
doc_to_target: '{% if answer is not none %}{{answer[17+1:]}}{% else %}{{answer_number|string}}{% endif %}'
# Prompt: the question followed by the step-by-step answer cue; the question
# label is prepended only when `answer` is none.
doc_to_text: '{% if answer is not none %}{{question+"\nПошаговоерешение:"}}{% else %}{{"Задача: "+question+"\nПошаговоерешение:"}}{% endif %}'
include: common_template_yaml
task: mgsm_ru
lm_eval/tasks/mgsm/mgsm_sw.yaml
0 → 100644
View file @
3e9c9a95
# Generated by utils.py
dataset_name: sw
# Target: when `answer` is present, keep everything after its first 24+1
# characters (slice `[24+1:]`; a bare index `[24+1]` would yield a single
# character). Otherwise fall back to `answer_number` rendered as a string.
doc_to_target: '{% if answer is not none %}{{answer[24+1:]}}{% else %}{{answer_number|string}}{% endif %}'
# Prompt: the question followed by the step-by-step answer cue; the question
# label is prepended only when `answer` is none.
doc_to_text: '{% if answer is not none %}{{question+"\nJibu la Hatua kwa Hatua:"}}{% else %}{{"Swali: "+question+"\nJibu la Hatua kwa Hatua:"}}{% endif %}'
include: common_template_yaml
task: mgsm_sw
lm_eval/tasks/mgsm/mgsm_te.yaml
0 → 100644
View file @
3e9c9a95
# Generated by utils.py
dataset_name: te
# Target: when `answer` is present, keep everything after its first 18+1
# characters (slice `[18+1:]`; a bare index `[18+1]` would yield a single
# character). Otherwise fall back to `answer_number` rendered as a string.
doc_to_target: '{% if answer is not none %}{{answer[18+1:]}}{% else %}{{answer_number|string}}{% endif %}'
# Prompt: the question followed by the step-by-step answer cue; the question
# label is prepended only when `answer` is none.
doc_to_text: '{% if answer is not none %}{{question+"\nదశలవారీగా సమాధానం:"}}{% else %}{{"ప్రశ్న: "+question+"\nదశలవారీగా సమాధానం:"}}{% endif %}'
include: common_template_yaml
task: mgsm_te
lm_eval/tasks/mgsm/mgsm_th.yaml
0 → 100644
View file @
3e9c9a95
# Generated by utils.py
dataset_name: th
# Target: when `answer` is present, keep everything after its first 17+1
# characters (slice `[17+1:]`; a bare index `[17+1]` would yield a single
# character). Otherwise fall back to `answer_number` rendered as a string.
doc_to_target: '{% if answer is not none %}{{answer[17+1:]}}{% else %}{{answer_number|string}}{% endif %}'
# Prompt: the question followed by the step-by-step answer cue; the question
# label is prepended only when `answer` is none.
doc_to_text: '{% if answer is not none %}{{question+"\nคำตอบทีละขั้นตอน:"}}{% else %}{{"โจทย์: "+question+"\nคำตอบทีละขั้นตอน:"}}{% endif %}'
include: common_template_yaml
task: mgsm_th
lm_eval/tasks/mgsm/mgsm_zh.yaml
0 → 100644
View file @
3e9c9a95
# Generated by utils.py
dataset_name: zh
# Target: when `answer` is present, keep everything after its first 5+1
# characters (slice `[5+1:]`; a bare index `[5+1]` would yield a single
# character). Otherwise fall back to `answer_number` rendered as a string.
doc_to_target: '{% if answer is not none %}{{answer[5+1:]}}{% else %}{{answer_number|string}}{% endif %}'
# Prompt: the question followed by the step-by-step answer cue; the question
# label is prepended only when `answer` is none.
doc_to_text: '{% if answer is not none %}{{question+"\n逐步解答:"}}{% else %}{{"问题: "+question+"\n逐步解答:"}}{% endif %}'
include: common_template_yaml
task: mgsm_zh
lm_eval/tasks/mgsm/utils.py
View file @
3e9c9a95
import
argparse
from
typing
import
Dict
,
List
import
yaml
import
argparse
LANGUAGES
=
{
...
...
@@ -51,18 +49,6 @@ LANGUAGES = {
},
}
def doc_to_text(doc, QUESTION, ANSWER):
    """Build the prompt string for a single document.

    Args:
        doc: Mapping with a "question" entry and an "answer" entry
            (the latter may be None).
        QUESTION: Question label, prepended (followed by one space) only
            when ``doc["answer"]`` is None.
        ANSWER: Answer cue appended on a new line after the question.

    Returns:
        ``question + "\\n" + ANSWER``, prefixed with ``QUESTION + " "`` when
        the document carries no answer.
    """
    # Look up "answer" first so a missing key surfaces before anything else.
    has_answer = doc["answer"] is not None
    prompt_body = doc["question"] + "\n" + ANSWER
    return prompt_body if has_answer else QUESTION + " " + prompt_body
def doc_to_target(doc, QUESTION, ANSWER):
    """Build the target string for a single document.

    Args:
        doc: Mapping with an "answer" entry (may be None) and, when the
            answer is None, an "answer_number" entry.
        QUESTION: Unused here; kept so the signature mirrors doc_to_text.
        ANSWER: Answer cue; only its length is used, to decide how many
            leading characters of ``doc["answer"]`` to drop.

    Returns:
        A single space followed by either ``doc["answer"]`` with its first
        ``len(ANSWER) + 1`` characters removed, or ``str(doc["answer_number"])``
        when the answer is None.
    """
    worked_answer = doc["answer"]
    if worked_answer is None:
        return " " + str(doc["answer_number"])
    # Purely length-based: drops len(ANSWER) characters plus one more.
    skip = len(ANSWER) + 1
    return " " + worked_answer[skip:]
def
gen_lang_yamls
(
output_dir
:
str
,
overwrite
:
bool
)
->
None
:
"""
...
...
@@ -86,8 +72,16 @@ def gen_lang_yamls(output_dir: str, overwrite: bool) -> None:
"include"
:
"common_template_yaml"
,
"dataset_name"
:
lang
,
"task"
:
f
"mgsm_
{
lang
}
"
,
"doc_to_text"
:
doc_to_text
(
doc
,
QUESTION
,
ANSWER
),
"doc_to_target"
:
doc_to_target
(
doc
,
QUESTION
,
ANSWER
),
"doc_to_text"
:
f
"""{{% if answer is not none %}}"""
\
f
"""{{{{question+"
\\
n
{
ANSWER
}
"}}}}"""
\
f
"""{{% else %}}"""
\
f
"""{{{{"
{
QUESTION
}
"+question+"
\\
n
{
ANSWER
}
"}}}}"""
\
f
"""{{% endif %}}"""
,
"doc_to_target"
:
f
"""{{% if answer is not none %}}"""
\
f
"""{{{{answer[
{
len
(
ANSWER
)
}
+1]}}}}"""
\
f
"""{{% else %}}"""
\
f
"""{{{{answer_number|string}}}}"""
\
f
"""{{% endif %}}"""
,
},
f
,
allow_unicode
=
True
,
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment