Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
lm-evaluation-harness
Commits
9822b06e
Unverified
Commit
9822b06e
authored
Mar 01, 2024
by
Lintang Sutawika
Committed by
GitHub
Mar 01, 2024
Browse files
Merge branch 'main' into weight_by_size
parents
51f27158
b177c82c
Changes
656
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
155 additions
and
1 deletion
+155
-1
lm_eval/tasks/okapi/arc_multilingual/arc_te.yaml
lm_eval/tasks/okapi/arc_multilingual/arc_te.yaml
+7
-0
lm_eval/tasks/okapi/arc_multilingual/arc_uk.yaml
lm_eval/tasks/okapi/arc_multilingual/arc_uk.yaml
+7
-0
lm_eval/tasks/okapi/arc_multilingual/arc_vi.yaml
lm_eval/tasks/okapi/arc_multilingual/arc_vi.yaml
+7
-0
lm_eval/tasks/okapi/arc_multilingual/arc_zh.yaml
lm_eval/tasks/okapi/arc_multilingual/arc_zh.yaml
+7
-0
lm_eval/tasks/okapi/arc_multilingual/utils.py
lm_eval/tasks/okapi/arc_multilingual/utils.py
+33
-0
lm_eval/tasks/okapi/hellaswag_multilingual/utils.py
lm_eval/tasks/okapi/hellaswag_multilingual/utils.py
+2
-1
lm_eval/tasks/okapi/mmlu_multilingual/_default_yaml
lm_eval/tasks/okapi/mmlu_multilingual/_default_yaml
+17
-0
lm_eval/tasks/okapi/mmlu_multilingual/_generate_configs.py
lm_eval/tasks/okapi/mmlu_multilingual/_generate_configs.py
+27
-0
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_ar.yaml
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_ar.yaml
+4
-0
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_bn.yaml
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_bn.yaml
+4
-0
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_ca.yaml
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_ca.yaml
+4
-0
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_da.yaml
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_da.yaml
+4
-0
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_de.yaml
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_de.yaml
+4
-0
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_en.yaml
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_en.yaml
+4
-0
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_es.yaml
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_es.yaml
+4
-0
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_eu.yaml
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_eu.yaml
+4
-0
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_fr.yaml
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_fr.yaml
+4
-0
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_gu.yaml
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_gu.yaml
+4
-0
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_hi.yaml
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_hi.yaml
+4
-0
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_hr.yaml
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_hr.yaml
+4
-0
No files found.
lm_eval/tasks/okapi/arc_multilingual/arc_te.yaml
0 → 100644
View file @
9822b06e
include
:
_arc_yaml
task
:
arc_te
dataset_path
:
alexandrainst/m_arc
dataset_name
:
te
training_split
:
train
validation_split
:
validation
test_split
:
test
lm_eval/tasks/okapi/arc_multilingual/arc_uk.yaml
0 → 100644
View file @
9822b06e
include
:
_arc_yaml
task
:
arc_uk
dataset_path
:
alexandrainst/m_arc
dataset_name
:
uk
training_split
:
train
validation_split
:
validation
test_split
:
test
lm_eval/tasks/okapi/arc_multilingual/arc_vi.yaml
0 → 100644
View file @
9822b06e
include
:
_arc_yaml
task
:
arc_vi
dataset_path
:
alexandrainst/m_arc
dataset_name
:
vi
training_split
:
train
validation_split
:
validation
test_split
:
test
lm_eval/tasks/okapi/arc_multilingual/arc_zh.yaml
0 → 100644
View file @
9822b06e
include
:
_arc_yaml
task
:
arc_zh
dataset_path
:
alexandrainst/m_arc
dataset_name
:
zh
training_split
:
train
validation_split
:
validation
test_split
:
test
lm_eval/tasks/okapi/arc_multilingual/utils.py
0 → 100644
View file @
9822b06e
import
re
import
datasets
def preprocess(text):
    """Clean a raw question/option string before it is placed in a prompt.

    Args:
        text: The raw string, or ``None`` when the field is absent.

    Returns:
        A single space when ``text`` is ``None``; otherwise the text with
        surrounding whitespace stripped, every ``" [title]"`` marker turned
        into ``". "``, every remaining ``[...]`` tag removed, and doubled
        spaces collapsed to one.
    """
    if text is None:
        return " "
    text = text.strip()
    text = text.replace(" [title]", ". ")
    # Non-greedy so that each bracketed tag is removed on its own instead of
    # swallowing everything between the first "[" and the last "]".
    text = re.sub(r"\[.*?\]", "", text)
    # The two substitutions above leave doubled spaces behind ("a [x] b"
    # becomes "a  b"); collapse them in a single pass.
    text = text.replace("  ", " ")
    return text
def process_docs(dataset: datasets.Dataset) -> datasets.Dataset:
    """Map every document of ``dataset`` to the fields used for scoring.

    Each document is expected to provide ``id``, ``instruction``,
    ``option_a`` .. ``option_e`` and ``answer``. The mapping function returns
    a dict with:

    * ``id``      - copied from the document,
    * ``query``   - ``"Question: <cleaned instruction>\\nAnswer:"``,
    * ``choices`` - the five options, each passed through ``preprocess``,
    * ``gold``    - position of ``answer`` within ``A``..``E``.

    Returns:
        The result of ``dataset.map`` applied with that mapping function.

    Raises:
        ValueError: from the mapping function when ``answer`` is not one of
            ``A``..``E``.
    """
    answer_letters = ["A", "B", "C", "D", "E"]
    option_fields = ("option_a", "option_b", "option_c", "option_d", "option_e")

    def _process_doc(doc):
        return {
            "id": doc["id"],
            "query": f"Question: {preprocess(doc['instruction'])}\nAnswer:",
            "choices": [preprocess(doc[field]) for field in option_fields],
            "gold": answer_letters.index(doc["answer"]),
        }

    return dataset.map(_process_doc)
lm_eval/tasks/okapi/hellaswag_multilingual/utils.py
View file @
9822b06e
import
datasets
import
re
import
datasets
def
preprocess
(
text
):
text
=
text
.
strip
()
...
...
lm_eval/tasks/okapi/mmlu_multilingual/_default_yaml
0 → 100644
View file @
9822b06e
group:
  - m_mmlu
dataset_path: alexandrainst/m_mmlu
test_split: test
fewshot_split: train
fewshot_config:
  sampler: first_n
output_type: multiple_choice
doc_to_text: "{{instruction.strip()}}\nA. {{option_a}}\nB. {{option_b}}\nC. {{option_c}}\nD. {{option_d}}\nAnswer:"
doc_to_choice: ["A", "B", "C", "D"]
doc_to_target: answer
metric_list:
  - metric: acc
    aggregation: mean
    higher_is_better: true
metadata:
  version: 0.0
lm_eval/tasks/okapi/mmlu_multilingual/_generate_configs.py
0 → 100644
View file @
9822b06e
import
datasets
import
yaml
from
tqdm
import
tqdm
def main() -> None:
    """Write one ``m_mmlu_<config>.yaml`` task file per dataset config.

    The config names are the keys returned by
    ``datasets.get_dataset_infos("alexandrainst/m_mmlu")``. Each file is
    written to the current working directory and contains a
    "Generated by" header comment followed by a YAML mapping with the keys
    ``include``, ``task`` and ``dataset_name``.

    Files are opened in ``"w"`` mode, so an existing file of the same name is
    overwritten.
    """
    dataset_path = "alexandrainst/m_mmlu"
    # Last path component of the dataset id ("m_mmlu") prefixes every task name.
    task_prefix = dataset_path.split("/")[-1]

    for task in tqdm(datasets.get_dataset_infos(dataset_path)):
        file_name = f"m_mmlu_{task}.yaml"
        # Mode "w" truncates an existing file and never raises
        # FileExistsError, so no handler for that exception is needed.
        with open(file_name, "w", encoding="utf-8") as f:
            f.write("# Generated by _generate_configs.py\n")
            yaml.dump(
                {
                    "include": "_default_yaml",
                    "task": f"{task_prefix}_{task}",
                    "dataset_name": task,
                },
                f,
            )


if __name__ == "__main__":
    main()
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_ar.yaml
0 → 100644
View file @
9822b06e
# Generated by _generate_configs.py
dataset_name
:
ar
include
:
_default_yaml
task
:
m_mmlu_ar
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_bn.yaml
0 → 100644
View file @
9822b06e
# Generated by _generate_configs.py
dataset_name
:
bn
include
:
_default_yaml
task
:
m_mmlu_bn
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_ca.yaml
0 → 100644
View file @
9822b06e
# Generated by _generate_configs.py
dataset_name
:
ca
include
:
_default_yaml
task
:
m_mmlu_ca
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_da.yaml
0 → 100644
View file @
9822b06e
# Generated by _generate_configs.py
dataset_name
:
da
include
:
_default_yaml
task
:
m_mmlu_da
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_de.yaml
0 → 100644
View file @
9822b06e
# Generated by _generate_configs.py
dataset_name
:
de
include
:
_default_yaml
task
:
m_mmlu_de
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_en.yaml
0 → 100644
View file @
9822b06e
# Generated by _generate_configs.py
dataset_name
:
en
include
:
_default_yaml
task
:
m_mmlu_en
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_es.yaml
0 → 100644
View file @
9822b06e
# Generated by _generate_configs.py
dataset_name
:
es
include
:
_default_yaml
task
:
m_mmlu_es
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_eu.yaml
0 → 100644
View file @
9822b06e
# Generated by _generate_configs.py
dataset_name
:
eu
include
:
_default_yaml
task
:
m_mmlu_eu
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_fr.yaml
0 → 100644
View file @
9822b06e
# Generated by _generate_configs.py
dataset_name
:
fr
include
:
_default_yaml
task
:
m_mmlu_fr
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_gu.yaml
0 → 100644
View file @
9822b06e
# Generated by _generate_configs.py
dataset_name
:
gu
include
:
_default_yaml
task
:
m_mmlu_gu
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_hi.yaml
0 → 100644
View file @
9822b06e
# Generated by _generate_configs.py
dataset_name
:
hi
include
:
_default_yaml
task
:
m_mmlu_hi
lm_eval/tasks/okapi/mmlu_multilingual/m_mmlu_hr.yaml
0 → 100644
View file @
9822b06e
# Generated by _generate_configs.py
dataset_name
:
hr
include
:
_default_yaml
task
:
m_mmlu_hr
Prev
1
…
23
24
25
26
27
28
29
30
31
…
33
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment