Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
lm-evaluation-harness
Commits
45127aa7
Commit
45127aa7
authored
May 05, 2021
by
Leo Gao
Browse files
Rename a ton of stuff
parent
80a739eb
Changes
5
Hide whitespace changes
Inline
Side-by-side
Showing
5 changed files
with
52 additions
and
52 deletions
+52
-52
lm_eval/base.py
lm_eval/base.py
+3
-3
lm_eval/models/dummy.py
lm_eval/models/dummy.py
+1
-1
lm_eval/models/gpt3.py
lm_eval/models/gpt3.py
+1
-1
lm_eval/tasks/__init__.py
lm_eval/tasks/__init__.py
+23
-23
lm_eval/tasks/pile.py
lm_eval/tasks/pile.py
+24
-24
No files found.
lm_eval/base.py
View file @
45127aa7
...
@@ -35,7 +35,7 @@ class LM(abc.ABC):
...
@@ -35,7 +35,7 @@ class LM(abc.ABC):
pass
pass
@
abc
.
abstractmethod
@
abc
.
abstractmethod
def
loglikelihood_
perplexity
(
self
,
requests
):
def
loglikelihood_
rolling
(
self
,
requests
):
"""Compute full log-likelihood of a string, with no truncation, for perplexity computation
"""Compute full log-likelihood of a string, with no truncation, for perplexity computation
- We will use the full max context length of the model.
- We will use the full max context length of the model.
- For inputs that exceed the max context length, we divide the tokenized string into chunks of up to
- For inputs that exceed the max context length, we divide the tokenized string into chunks of up to
...
@@ -322,7 +322,7 @@ class PerplexityTask(Task, abc.ABC):
...
@@ -322,7 +322,7 @@ class PerplexityTask(Task, abc.ABC):
def
construct_requests
(
self
,
doc
,
ctx
):
def
construct_requests
(
self
,
doc
,
ctx
):
assert
not
ctx
assert
not
ctx
req
=
rf
.
loglikelihood_
perplexity
(
doc
)
req
=
rf
.
loglikelihood_
rolling
(
doc
)
return
req
return
req
def
process_results
(
self
,
doc
,
results
):
def
process_results
(
self
,
doc
,
results
):
...
@@ -351,7 +351,7 @@ class PerplexityTask(Task, abc.ABC):
...
@@ -351,7 +351,7 @@ class PerplexityTask(Task, abc.ABC):
req_ret_lens
=
{
req_ret_lens
=
{
'loglikelihood'
:
2
,
'loglikelihood'
:
2
,
'greedy_until'
:
None
,
'greedy_until'
:
None
,
'loglikelihood_
perplexity
'
:
None
,
'loglikelihood_
rolling
'
:
None
,
}
}
import
os
import
os
...
...
lm_eval/models/dummy.py
View file @
45127aa7
...
@@ -27,7 +27,7 @@ class DummyLM(LM):
...
@@ -27,7 +27,7 @@ class DummyLM(LM):
return
res
return
res
def
loglikelihood_
perplexity
(
self
,
requests
):
def
loglikelihood_
rolling
(
self
,
requests
):
res
=
[]
res
=
[]
for
_
in
requests
:
for
_
in
requests
:
...
...
lm_eval/models/gpt3.py
View file @
45127aa7
...
@@ -84,7 +84,7 @@ class GPT3LM(LM):
...
@@ -84,7 +84,7 @@ class GPT3LM(LM):
return
self
.
_loglikelihood_tokens
(
new_reqs
)
return
self
.
_loglikelihood_tokens
(
new_reqs
)
def
loglikelihood_
perplexity
(
self
,
requests
):
def
loglikelihood_
rolling
(
self
,
requests
):
# TODO: switch implementation to use _loglikelihood_tokens rather than having it do its own thing
# TODO: switch implementation to use _loglikelihood_tokens rather than having it do its own thing
loglikelihoods
=
[]
loglikelihoods
=
[]
...
...
lm_eval/tasks/__init__.py
View file @
45127aa7
...
@@ -174,29 +174,29 @@ TASK_REGISTRY = {
...
@@ -174,29 +174,29 @@ TASK_REGISTRY = {
"reversed_words"
:
unscramble
.
ReversedWords
,
"reversed_words"
:
unscramble
.
ReversedWords
,
# Pile
# Pile
"arxiv"
:
pile
.
PileArxiv
PerplexityTask
,
"
pile_
arxiv"
:
pile
.
PileArxiv
,
"books3"
:
pile
.
PileBooks3
PerplexityTask
,
"
pile_
books3"
:
pile
.
PileBooks3
,
"bookcorpus2"
:
pile
.
PileBookCorpus2
PerplexityTask
,
"
pile_
bookcorpus2"
:
pile
.
PileBookCorpus2
,
"commoncrawl"
:
pile
.
PileCommonCrawl
PerplexityTask
,
"
pile_
commoncrawl"
:
pile
.
PileCommonCrawl
,
"dm-mathematics"
:
pile
.
PileDmMathematics
PerplexityTask
,
"
pile_
dm-mathematics"
:
pile
.
PileDmMathematics
,
"enron"
:
pile
.
PileEnron
PerplexityTask
,
"
pile_
enron"
:
pile
.
PileEnron
,
"europarl"
:
pile
.
PileEuroparl
PerplexityTask
,
"
pile_
europarl"
:
pile
.
PileEuroparl
,
"freelaw"
:
pile
.
PileFreeLaw
PerplexityTask
,
"
pile_
freelaw"
:
pile
.
PileFreeLaw
,
"github"
:
pile
.
PileGithub
PerplexityTask
,
"
pile_
github"
:
pile
.
PileGithub
,
"gutenberg"
:
pile
.
PileGutenberg
PerplexityTask
,
"
pile_
gutenberg"
:
pile
.
PileGutenberg
,
"hackernews"
:
pile
.
PileHackernews
PerplexityTask
,
"
pile_
hackernews"
:
pile
.
PileHackernews
,
"nih-exporter"
:
pile
.
PileNIHExporter
PerplexityTask
,
"
pile_
nih-exporter"
:
pile
.
PileNIHExporter
,
"opensubtitles"
:
pile
.
PileOpenSubtitles
PerplexityTask
,
"
pile_
opensubtitles"
:
pile
.
PileOpenSubtitles
,
"openwebtext2"
:
pile
.
PileOpenWebText2
PerplexityTask
,
"
pile_
openwebtext2"
:
pile
.
PileOpenWebText2
,
"philpapers"
:
pile
.
PilePhilPapers
PerplexityTask
,
"
pile_
philpapers"
:
pile
.
PilePhilPapers
,
"pile-cc"
:
pile
.
PilePileCc
PerplexityTask
,
"pile
_pile
-cc"
:
pile
.
PilePileCc
,
"pubmed-abstracts"
:
pile
.
PilePubmedAbstracts
PerplexityTask
,
"
pile_
pubmed-abstracts"
:
pile
.
PilePubmedAbstracts
,
"pubmed-central"
:
pile
.
PilePubmedCentral
PerplexityTask
,
"
pile_
pubmed-central"
:
pile
.
PilePubmedCentral
,
"stackexchange"
:
pile
.
PileStackExchange
PerplexityTask
,
"
pile_
stackexchange"
:
pile
.
PileStackExchange
,
"uspto"
:
pile
.
PileUspto
PerplexityTask
,
"
pile_
uspto"
:
pile
.
PileUspto
,
"ubuntu-irc"
:
pile
.
PileUbuntuIrc
PerplexityTask
,
"
pile_
ubuntu-irc"
:
pile
.
PileUbuntuIrc
,
"wikipedia"
:
pile
.
PileWikipedia
PerplexityTask
,
"
pile_
wikipedia"
:
pile
.
PileWikipedia
,
"youtubesubtitles"
:
pile
.
PileYoutubeSubtitles
PerplexityTask
,
"
pile_
youtubesubtitles"
:
pile
.
PileYoutubeSubtitles
,
}
}
...
...
lm_eval/tasks/pile.py
View file @
45127aa7
...
@@ -9,7 +9,7 @@ from ..utils import general_detokenize
...
@@ -9,7 +9,7 @@ from ..utils import general_detokenize
from
best_download
import
download_file
from
best_download
import
download_file
class
Pile
PerplexityTask
(
PerplexityTask
,
abc
.
ABC
):
class
Pile
(
PerplexityTask
,
abc
.
ABC
):
PILE_SET_NAME
=
None
PILE_SET_NAME
=
None
VAL_PATH
=
'data/pile/val.jsonl.zst'
VAL_PATH
=
'data/pile/val.jsonl.zst'
...
@@ -42,93 +42,93 @@ class PilePerplexityTask(PerplexityTask, abc.ABC):
...
@@ -42,93 +42,93 @@ class PilePerplexityTask(PerplexityTask, abc.ABC):
return
True
return
True
class
PileArxiv
PerplexityTask
(
PilePerplexityTask
):
class
PileArxiv
(
PilePerplexityTask
):
PILE_SET_NAME
=
"ArXiv"
PILE_SET_NAME
=
"ArXiv"
class
PileBooks3
PerplexityTask
(
PilePerplexityTask
):
class
PileBooks3
(
PilePerplexityTask
):
PILE_SET_NAME
=
"Books3"
PILE_SET_NAME
=
"Books3"
class
PileBookCorpus2
PerplexityTask
(
PilePerplexityTask
):
class
PileBookCorpus2
(
PilePerplexityTask
):
PILE_SET_NAME
=
"BookCorpus2"
PILE_SET_NAME
=
"BookCorpus2"
class
PileCommonCrawl
PerplexityTask
(
PilePerplexityTask
):
class
PileCommonCrawl
(
PilePerplexityTask
):
PILE_SET_NAME
=
"CommonCrawl"
PILE_SET_NAME
=
"CommonCrawl"
class
PileDmMathematics
PerplexityTask
(
PilePerplexityTask
):
class
PileDmMathematics
(
PilePerplexityTask
):
PILE_SET_NAME
=
"DM Mathematics"
PILE_SET_NAME
=
"DM Mathematics"
class
PileEnron
PerplexityTask
(
PilePerplexityTask
):
class
PileEnron
(
PilePerplexityTask
):
PILE_SET_NAME
=
"Enron Emails"
PILE_SET_NAME
=
"Enron Emails"
class
PileEuroparl
PerplexityTask
(
PilePerplexityTask
):
class
PileEuroparl
(
PilePerplexityTask
):
PILE_SET_NAME
=
"EuroParl"
PILE_SET_NAME
=
"EuroParl"
class
PileFreeLaw
PerplexityTask
(
PilePerplexityTask
):
class
PileFreeLaw
(
PilePerplexityTask
):
PILE_SET_NAME
=
"FreeLaw"
PILE_SET_NAME
=
"FreeLaw"
class
PileGithub
PerplexityTask
(
PilePerplexityTask
):
class
PileGithub
(
PilePerplexityTask
):
PILE_SET_NAME
=
"Github"
PILE_SET_NAME
=
"Github"
class
PileGutenberg
PerplexityTask
(
PilePerplexityTask
):
class
PileGutenberg
(
PilePerplexityTask
):
PILE_SET_NAME
=
"Gutenberg (PG-19)"
PILE_SET_NAME
=
"Gutenberg (PG-19)"
class
PileHackernews
PerplexityTask
(
PilePerplexityTask
):
class
PileHackernews
(
PilePerplexityTask
):
PILE_SET_NAME
=
"HackerNews"
PILE_SET_NAME
=
"HackerNews"
class
PileNIHExporter
PerplexityTask
(
PilePerplexityTask
):
class
PileNIHExporter
(
PilePerplexityTask
):
PILE_SET_NAME
=
"NIH ExPorter"
PILE_SET_NAME
=
"NIH ExPorter"
class
PileOpenSubtitles
PerplexityTask
(
PilePerplexityTask
):
class
PileOpenSubtitles
(
PilePerplexityTask
):
PILE_SET_NAME
=
"OpenSubtitles"
PILE_SET_NAME
=
"OpenSubtitles"
class
PileOpenWebText2
PerplexityTask
(
PilePerplexityTask
):
class
PileOpenWebText2
(
PilePerplexityTask
):
PILE_SET_NAME
=
"OpenWebText2"
PILE_SET_NAME
=
"OpenWebText2"
class
PilePhilPapers
PerplexityTask
(
PilePerplexityTask
):
class
PilePhilPapers
(
PilePerplexityTask
):
PILE_SET_NAME
=
"PhilPapers"
PILE_SET_NAME
=
"PhilPapers"
class
PilePileCc
PerplexityTask
(
PilePerplexityTask
):
class
PilePileCc
(
PilePerplexityTask
):
PILE_SET_NAME
=
"Pile-CC"
PILE_SET_NAME
=
"Pile-CC"
class
PilePubmedAbstracts
PerplexityTask
(
PilePerplexityTask
):
class
PilePubmedAbstracts
(
PilePerplexityTask
):
PILE_SET_NAME
=
"PubMed Abstracts"
PILE_SET_NAME
=
"PubMed Abstracts"
class
PilePubmedCentral
PerplexityTask
(
PilePerplexityTask
):
class
PilePubmedCentral
(
PilePerplexityTask
):
PILE_SET_NAME
=
"PubMed Central"
PILE_SET_NAME
=
"PubMed Central"
class
PileStackExchange
PerplexityTask
(
PilePerplexityTask
):
class
PileStackExchange
(
PilePerplexityTask
):
PILE_SET_NAME
=
"StackExchange"
PILE_SET_NAME
=
"StackExchange"
class
PileUspto
PerplexityTask
(
PilePerplexityTask
):
class
PileUspto
(
PilePerplexityTask
):
PILE_SET_NAME
=
"USPTO Backgrounds"
PILE_SET_NAME
=
"USPTO Backgrounds"
class
PileUbuntuIrc
PerplexityTask
(
PilePerplexityTask
):
class
PileUbuntuIrc
(
PilePerplexityTask
):
PILE_SET_NAME
=
"Ubuntu IRC"
PILE_SET_NAME
=
"Ubuntu IRC"
class
PileWikipedia
PerplexityTask
(
PilePerplexityTask
):
class
PileWikipedia
(
PilePerplexityTask
):
PILE_SET_NAME
=
"Wikipedia (en)"
PILE_SET_NAME
=
"Wikipedia (en)"
class
PileYoutubeSubtitles
PerplexityTask
(
PilePerplexityTask
):
class
PileYoutubeSubtitles
(
PilePerplexityTask
):
PILE_SET_NAME
=
"YoutubeSubtitles"
PILE_SET_NAME
=
"YoutubeSubtitles"
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment