Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
lm-evaluation-harness
Commits
29f12dd9
Unverified
Commit
29f12dd9
authored
Aug 01, 2023
by
Lintang Sutawika
Committed by
GitHub
Aug 01, 2023
Browse files
Merge branch 'big-refactor' into benchmark-scripts
parents
e37698df
4168c05f
Changes
222
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
23 additions
and
47 deletions
+23
-47
results/xglm/xglm-7.5B/xglm-7.5B_xwinograd_0-shot.json
results/xglm/xglm-7.5B/xglm-7.5B_xwinograd_0-shot.json
+0
-47
tests/extra/test_utils.py
tests/extra/test_utils.py
+23
-0
No files found.
results/xglm/xglm-7.5B/xglm-7.5B_xwinograd_0-shot.json
deleted
100644 → 0
View file @
e37698df
{
"results"
:
{
"xwinograd_zh"
:
{
"acc"
:
0.7281746031746031
,
"acc_stderr"
:
0.01983712759311063
},
"xwinograd_ru"
:
{
"acc"
:
0.6317460317460317
,
"acc_stderr"
:
0.027219500732466696
},
"xwinograd_pt"
:
{
"acc"
:
0.6730038022813688
,
"acc_stderr"
:
0.028982074243683254
},
"xwinograd_en"
:
{
"acc"
:
0.7948387096774193
,
"acc_stderr"
:
0.008376626547826555
},
"xwinograd_jp"
:
{
"acc"
:
0.6496350364963503
,
"acc_stderr"
:
0.01541389159576608
},
"xwinograd_fr"
:
{
"acc"
:
0.6506024096385542
,
"acc_stderr"
:
0.05265151356440471
}
},
"versions"
:
{
"xwinograd_zh"
:
0
,
"xwinograd_ru"
:
0
,
"xwinograd_pt"
:
0
,
"xwinograd_en"
:
0
,
"xwinograd_jp"
:
0
,
"xwinograd_fr"
:
0
},
"config"
:
{
"model"
:
"hf-causal-experimental"
,
"model_args"
:
"pretrained=facebook/xglm-7.5B,use_accelerate=True"
,
"num_fewshot"
:
0
,
"batch_size"
:
"auto"
,
"device"
:
"cuda"
,
"no_cache"
:
true
,
"limit"
:
null
,
"bootstrap_iters"
:
100000
,
"description_dict"
:
{}
}
}
tests/extra/test_utils.py
0 → 100644
View file @
29f12dd9
import
json
from
typing
import
List
from
lm_eval.utils
import
load_yaml_config
from
pathlib
import
Path
# Default location of the changed-files listing. The lowercase alias
# ``file_path`` is kept as a module-level name for backward compatibility.
FILE_PATH = file_path = ".github/outputs/tasks_all_changed_and_modified_files.txt"


def load_changed_files(file_path: str = FILE_PATH) -> List[str]:
    """Read a whitespace-separated list of file paths from a text file.

    Args:
        file_path: Path of the text file to read. Defaults to ``FILE_PATH``.

    Returns:
        Every path found in the file, in the order encountered. Blank lines
        and repeated separators contribute no entries, so an empty file
        yields an empty list.

    Raises:
        OSError: If ``file_path`` cannot be opened for reading.
    """
    with open(file_path, "r") as f:
        # ``split()`` with no argument collapses runs of whitespace and never
        # yields "" entries, unlike ``strip().split(" ")`` which returns [""]
        # for a blank line.
        return [path for line in f for path in line.split()]
def parser(full_path: List[str]) -> List[str]:
    """Collect the task names referenced by a list of changed file paths.

    For each path ending in ``.yaml`` the file is loaded with
    ``load_yaml_config`` and its ``"task"`` entry is recorded. For each path
    ending in ``.py`` every ``*.yaml`` file in the same directory is loaded
    and its ``"task"`` entry is recorded. Paths with any other suffix are
    ignored.

    Args:
        full_path: File paths to inspect.

    Returns:
        The distinct task names, sorted so the result is deterministic
        between runs (plain set iteration order is not).

    Raises:
        KeyError: If a loaded config has no ``"task"`` entry (assuming
            ``load_yaml_config`` returns a mapping -- TODO confirm).
    """
    tasks = set()
    for changed in full_path:
        if changed.endswith(".yaml"):
            tasks.add(load_yaml_config(changed)["task"])
        elif changed.endswith(".py"):
            # A changed Python file is taken to affect every YAML config
            # that sits next to it in the same directory.
            for sibling in Path(changed).parent.glob("*.yaml"):
                tasks.add(load_yaml_config(str(sibling))["task"])
    return sorted(tasks)
Prev
1
…
8
9
10
11
12
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment