Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
lm-evaluation-harness
Commits
29ba8cb1
Commit
29ba8cb1
authored
Nov 02, 2023
by
lintangsutawika
Browse files
fixing display name
parent
60dd33c8
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
20 additions
and
11 deletions
+20
-11
lm_eval/evaluator.py
lm_eval/evaluator.py
+20
-11
No files found.
lm_eval/evaluator.py
View file @
29ba8cb1
...
...
@@ -230,8 +230,12 @@ def evaluate(
task_hierarchy
[
group_name
].
append
(
task_name
)
versions
[
group_name
]
=
"N/A"
if
"group_alias"
in
configs
[
task_name
]:
if
(
"group_alias"
in
configs
[
task_name
])
and
(
group_name
not
in
task_group_alias
):
print
(
group_name
)
task_group_alias
[
group_name
]
=
configs
[
task_name
][
"group_alias"
]
print
(
task_group_alias
)
else
:
task_hierarchy
[
task_name
]
=
[]
...
...
@@ -537,11 +541,11 @@ def evaluate(
for
group_name
,
task_list
in
task_hierarchy
.
items
():
order
=
task_order
[
group_name
]
results_agg
[
group_name
]
=
results
[
group_name
]
results_agg
[
group_name
]
=
results
[
group_name
]
.
copy
()
results_agg
[
group_name
][
"tab"
]
=
order
if
(
order
<
max
(
task_order
.
values
()))
and
(
len
(
task_list
)
>
0
):
groups_agg
[
group_name
]
=
results
[
group_name
]
groups_agg
[
group_name
]
=
results
[
group_name
]
.
copy
()
groups_agg
[
group_name
][
"tab"
]
=
order
if
task_list
!=
[]:
...
...
@@ -564,36 +568,41 @@ def evaluate(
task_hierarchy
,
task_order
,
versions
,
task_group_alias
)
print
(
"task_group_alias"
)
print
(
task_group_alias
)
_results_agg
=
collections
.
defaultdict
(
dict
)
_versions
=
collections
.
defaultdict
(
dict
)
for
task
in
results_agg
:
task_results
=
results_agg
[
task
]
tab_string
=
""
if
"tab"
in
task_results
:
tab
=
task_results
.
pop
(
"tab"
)
tab_string
=
" "
*
tab
+
"-"
if
tab
>
0
else
""
tab_string
=
" "
*
tab
+
"-"
if
tab
>
0
else
""
if
task
in
task_group_alias
:
task_alias
=
task_group_alias
[
task
]
_results_agg
[
tab_string
+
task_alias
]
=
task_results
_versions
[
tab_string
+
task_alias
]
=
versions
[
task
]
_results_agg
[
tab_string
+
task_alias
]
=
task_results
_versions
[
tab_string
+
task_alias
]
=
versions
[
task
]
else
:
_results_agg
[
tab_string
+
task
]
=
task_results
_versions
[
tab_string
+
task
]
=
versions
[
task
]
_results_agg
[
tab_string
+
task
]
=
task_results
_versions
[
tab_string
+
task
]
=
versions
[
task
]
results_agg
=
_results_agg
versions
=
_versions
_groups_agg
=
collections
.
defaultdict
(
dict
)
for
group
in
groups_agg
:
group_results
=
groups_agg
[
group
]
tab_string
=
""
if
"tab"
in
group_results
:
tab
=
group_results
.
pop
(
"tab"
)
tab_string
=
" "
*
tab
+
"-"
if
tab
>
0
else
""
tab_string
=
" "
*
tab
+
"-"
if
tab
>
0
else
""
if
group
in
task_group_alias
:
group_alias
=
task_group_alias
[
group
]
_groups_agg
[
tab_string
+
group_alias
]
=
group_results
_groups_agg
[
tab_string
+
group_alias
]
=
group_results
else
:
_groups_agg
[
tab_string
+
group
]
=
group_results
_groups_agg
[
tab_string
+
group
]
=
group_results
groups_agg
=
_groups_agg
results_dict
=
{
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment