Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
lm-evaluation-harness
Commits
364e54d4
Commit
364e54d4
authored
Mar 22, 2021
by
Jonathan Tow
Browse files
Split `dev` and `val` sets and cleanup prompt spacing
parent
b2bab740
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
8 additions
and
12 deletions
+8
-12
lm_eval/tasks/hendrycks_test.py
lm_eval/tasks/hendrycks_test.py
+8
-12
No files found.
lm_eval/tasks/hendrycks_test.py
View file @
364e54d4
...
@@ -54,7 +54,7 @@ class GeneralHendrycksTest(MultipleChoiceTask):
...
@@ -54,7 +54,7 @@ class GeneralHendrycksTest(MultipleChoiceTask):
return
True
return
True
def
has_validation_docs
(
self
):
def
has_validation_docs
(
self
):
return
Fals
e
return
Tru
e
def
has_test_docs
(
self
):
def
has_test_docs
(
self
):
return
True
return
True
...
@@ -69,9 +69,9 @@ class GeneralHendrycksTest(MultipleChoiceTask):
...
@@ -69,9 +69,9 @@ class GeneralHendrycksTest(MultipleChoiceTask):
D. <choice4>
D. <choice4>
Answer:
Answer:
"""
"""
prompt
=
"Question: "
+
doc
[
0
]
prompt
=
"Question: "
+
doc
[
0
]
+
"
\n
"
prompt
+=
"
"
.
join
([
f
"
\n
{
choices
[
j
]
}
.
{
doc
[
j
+
1
]
}
"
for
j
in
range
(
4
)])
prompt
+=
""
.
join
([
f
"
{
choices
[
j
]
}
.
{
doc
[
j
+
1
]
}
\n
"
for
j
in
range
(
4
)])
prompt
+=
"
\n
Answer:"
prompt
+=
"Answer:"
return
prompt
return
prompt
choices
=
[
'A'
,
'B'
,
'C'
,
'D'
]
choices
=
[
'A'
,
'B'
,
'C'
,
'D'
]
return
{
return
{
...
@@ -85,16 +85,12 @@ class GeneralHendrycksTest(MultipleChoiceTask):
...
@@ -85,16 +85,12 @@ class GeneralHendrycksTest(MultipleChoiceTask):
return
(
self
.
_convert_standard
(
doc
)
for
doc
in
reader
)
return
(
self
.
_convert_standard
(
doc
)
for
doc
in
reader
)
def
training_docs
(
self
):
def
training_docs
(
self
):
# Use all files in the auxiliary_train, dev, val directories
filename
=
self
.
DATASET_PATH
/
"dev"
/
f
"
{
self
.
subject
}
_dev.csv"
# auxiliary_train includes some UnifiedQA MC tasks
return
self
.
_load_docs
(
filename
)
docs
=
[]
for
train_dir
in
[
"auxiliary_train"
,
"dev"
,
"val"
]:
for
f
in
(
self
.
DATASET_PATH
/
train_dir
).
iterdir
():
docs
.
extend
(
self
.
_load_docs
(
f
))
return
docs
def
validation_docs
(
self
):
def
validation_docs
(
self
):
raise
NotImplementedError
filename
=
self
.
DATASET_PATH
/
"val"
/
f
"
{
self
.
subject
}
_val.csv"
return
self
.
_load_docs
(
filename
)
def
test_docs
(
self
):
def
test_docs
(
self
):
filename
=
self
.
DATASET_PATH
/
"test"
/
f
"
{
self
.
subject
}
_test.csv"
filename
=
self
.
DATASET_PATH
/
"test"
/
f
"
{
self
.
subject
}
_test.csv"
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment