Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
lm-evaluation-harness
Commits
e35b0667
Unverified
Commit
e35b0667
authored
Nov 14, 2023
by
Hailey Schoelkopf
Committed by
GitHub
Nov 14, 2023
Browse files
Merge pull request #987 from EleutherAI/alias-fix
[Refactor] Alias fix
parents
8ffd2630
d9230aa8
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
8 additions
and
12 deletions
+8
-12
lm_eval/evaluator.py
lm_eval/evaluator.py
+4
-12
lm_eval/utils.py
lm_eval/utils.py
+4
-0
No files found.
lm_eval/evaluator.py
View file @
e35b0667
...
@@ -562,8 +562,6 @@ def evaluate(
...
@@ -562,8 +562,6 @@ def evaluate(
task_hierarchy
,
task_order
,
versions
,
task_group_alias
task_hierarchy
,
task_order
,
versions
,
task_group_alias
)
)
_results_agg
=
collections
.
defaultdict
(
dict
)
_versions
=
collections
.
defaultdict
(
dict
)
for
task
in
results_agg
:
for
task
in
results_agg
:
task_results
=
results_agg
[
task
]
task_results
=
results_agg
[
task
]
...
@@ -577,15 +575,10 @@ def evaluate(
...
@@ -577,15 +575,10 @@ def evaluate(
if
task
in
task_group_alias
:
if
task
in
task_group_alias
:
task_alias
=
task_group_alias
[
task
]
task_alias
=
task_group_alias
[
task
]
_results_agg
[
tab_string
+
task_alias
]
=
task_results
results_agg
[
task
][
"alias"
]
=
tab_string
+
task_alias
_versions
[
tab_string
+
task_alias
]
=
versions
[
task
]
else
:
else
:
_results_agg
[
tab_string
+
task
]
=
task_results
results_agg
[
task
][
"alias"
]
=
tab_string
+
task
_versions
[
tab_string
+
task
]
=
versions
[
task
]
results_agg
=
_results_agg
versions
=
_versions
_groups_agg
=
collections
.
defaultdict
(
dict
)
for
group
in
groups_agg
:
for
group
in
groups_agg
:
group_results
=
groups_agg
[
group
]
group_results
=
groups_agg
[
group
]
...
@@ -599,10 +592,9 @@ def evaluate(
...
@@ -599,10 +592,9 @@ def evaluate(
if
group
in
task_group_alias
:
if
group
in
task_group_alias
:
group_alias
=
task_group_alias
[
group
]
group_alias
=
task_group_alias
[
group
]
_
groups_agg
[
tab_string
+
group_alias
]
=
group_results
groups_agg
[
group
][
"alias"
]
=
tab_string
+
group_alias
else
:
else
:
_groups_agg
[
tab_string
+
group
]
=
group_results
groups_agg
[
group
][
"alias"
]
=
tab_string
+
group
groups_agg
=
_groups_agg
results_dict
=
{
results_dict
=
{
"results"
:
dict
(
results_agg
.
items
()),
"results"
:
dict
(
results_agg
.
items
()),
...
...
lm_eval/utils.py
View file @
e35b0667
...
@@ -305,6 +305,10 @@ def make_table(result_dict, column: str = "results"):
...
@@ -305,6 +305,10 @@ def make_table(result_dict, column: str = "results"):
for
k
,
dic
in
result_dict
[
column
].
items
():
for
k
,
dic
in
result_dict
[
column
].
items
():
version
=
result_dict
[
"versions"
][
k
]
version
=
result_dict
[
"versions"
][
k
]
if
"alias"
in
dic
:
k
=
dic
.
pop
(
"alias"
)
for
(
mf
),
v
in
dic
.
items
():
for
(
mf
),
v
in
dic
.
items
():
m
,
_
,
f
=
mf
.
partition
(
","
)
m
,
_
,
f
=
mf
.
partition
(
","
)
if
m
.
endswith
(
"_stderr"
):
if
m
.
endswith
(
"_stderr"
):
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment