Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
lm-evaluation-harness
Commits
41a94e13
Commit
41a94e13
authored
Feb 24, 2021
by
Jon Tow
Browse files
Implement all word scrambling and manipulation tasks
parent
a5e135b6
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
26 additions
and
8 deletions
+26
-8
lm_eval/tasks/__init__.py
lm_eval/tasks/__init__.py
+6
-3
lm_eval/tasks/unscramble.py
lm_eval/tasks/unscramble.py
+20
-5
No files found.
lm_eval/tasks/__init__.py
View file @
41a94e13
...
...
@@ -29,7 +29,7 @@ from . import qa4mre
from
.
import
translation
from
.
import
headqa
from
.
import
mathqa
from
.
import
anagrams
from
.
import
unscramble
########################################
# Translation tasks
...
...
@@ -133,8 +133,11 @@ TASK_REGISTRY = {
**
translation
.
create_tasks_from_benchmarks
(
selected_translation_benchmarks
),
# Word Scrambling and Manipulation Tasks
"anagrams1"
:
anagrams
.
Anagrams1
,
"anagrams2"
:
anagrams
.
Anagrams2
"anagrams1"
:
unscramble
.
Anagrams1
,
"anagrams2"
:
unscramble
.
Anagrams2
,
"cycle_letters"
:
unscramble
.
CycleLetters
,
"random_insertion"
:
unscramble
.
RandomInsertion
,
"reversed_words"
:
unscramble
.
ReversedWords
,
}
...
...
lm_eval/tasks/
anagrams
.py
→
lm_eval/tasks/
unscramble
.py
View file @
41a94e13
...
...
@@ -14,8 +14,8 @@ def extract_gzip(gz, to):
shutil
.
copyfileobj
(
fin
,
fout
)
class
AnagramsB
as
e
(
Task
):
BASE_PATH
=
Path
(
"data/
anagrams
"
)
class
WordUnscrambleT
as
k
(
Task
):
BASE_PATH
=
Path
(
"data/
unscramble
"
)
FILENAME
=
None
CHECKSUM
=
None
# SHA256 Checksum.
...
...
@@ -50,7 +50,7 @@ class AnagramsBase(Task):
def
fewshot_examples
(
self
,
k
):
# Override to avoid error caused by missing `training_docs`.
return
random
.
sample
(
self
.
validation_docs
(),
k
)
return
random
.
sample
(
list
(
self
.
validation_docs
()
)
,
k
)
def
doc_to_text
(
self
,
doc
):
return
doc
[
"context"
]
...
...
@@ -80,11 +80,26 @@ class AnagramsBase(Task):
}
class
Anagrams1
(
AnagramsB
as
e
):
class
Anagrams1
(
WordUnscrambleT
as
k
):
FILENAME
=
"mid_word_1_anagrams.jsonl"
CHECKSUM
=
"6768a86896083199de4815d4964cb2f6f1046476cfd80c2a562784f182905979"
class
Anagrams2
(
AnagramsB
as
e
):
class
Anagrams2
(
WordUnscrambleT
as
k
):
FILENAME
=
"mid_word_2_anagrams.jsonl"
CHECKSUM
=
"c3d839d09a7954b78a27cd2cd75d4ed0488656c56ef4dbd741a005343826cb01"
class
CycleLetters
(
WordUnscrambleTask
):
FILENAME
=
"cycle_letters_in_word.jsonl"
CHECKSUM
=
"1689c9002bb8c5988bf5f05e977c9db92f57932c1b5a38998c29ac0dd71e1d42"
class
RandomInsertion
(
WordUnscrambleTask
):
FILENAME
=
"random_insertion_in_word.jsonl"
CHECKSUM
=
"72e65d83da53d15752ee0c47379509de149ddbad32d61184e5991df29616b78a"
class
ReversedWords
(
WordUnscrambleTask
):
FILENAME
=
"reversed_words.jsonl"
CHECKSUM
=
"133a08f875cd6c1ef8608a3233571a773881cc27b1c707de738cc6543439332a"
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment