Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
lm-evaluation-harness
Commits
121b7096
Commit
121b7096
authored
May 02, 2022
by
Fabrizio Milo
Browse files
add pre-commit
parent
7a038118
Changes
732
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
20 additions
and
20 deletions
+20
-20
tests/testdata/lambada_mt_de-v0-loglikelihood
tests/testdata/lambada_mt_de-v0-loglikelihood
+1
-1
tests/testdata/lambada_mt_de-v0-res.json
tests/testdata/lambada_mt_de-v0-res.json
+1
-1
tests/testdata/lambada_mt_en-v0-loglikelihood
tests/testdata/lambada_mt_en-v0-loglikelihood
+1
-1
tests/testdata/lambada_mt_en-v0-res.json
tests/testdata/lambada_mt_en-v0-res.json
+1
-1
tests/testdata/lambada_mt_es-v0-loglikelihood
tests/testdata/lambada_mt_es-v0-loglikelihood
+1
-1
tests/testdata/lambada_mt_es-v0-res.json
tests/testdata/lambada_mt_es-v0-res.json
+1
-1
tests/testdata/lambada_mt_fr-v0-loglikelihood
tests/testdata/lambada_mt_fr-v0-loglikelihood
+1
-1
tests/testdata/lambada_mt_fr-v0-res.json
tests/testdata/lambada_mt_fr-v0-res.json
+1
-1
tests/testdata/lambada_mt_it-v0-loglikelihood
tests/testdata/lambada_mt_it-v0-loglikelihood
+1
-1
tests/testdata/lambada_mt_it-v0-res.json
tests/testdata/lambada_mt_it-v0-res.json
+1
-1
tests/testdata/logiqa-v0-loglikelihood
tests/testdata/logiqa-v0-loglikelihood
+1
-1
tests/testdata/logiqa-v0-res.json
tests/testdata/logiqa-v0-res.json
+1
-1
tests/testdata/math_algebra-v0-greedy_until
tests/testdata/math_algebra-v0-greedy_until
+1
-1
tests/testdata/math_algebra-v0-res.json
tests/testdata/math_algebra-v0-res.json
+1
-1
tests/testdata/math_algebra-v1-greedy_until
tests/testdata/math_algebra-v1-greedy_until
+1
-1
tests/testdata/math_algebra-v1-res.json
tests/testdata/math_algebra-v1-res.json
+1
-1
tests/testdata/math_counting_and_prob-v0-greedy_until
tests/testdata/math_counting_and_prob-v0-greedy_until
+1
-1
tests/testdata/math_counting_and_prob-v0-res.json
tests/testdata/math_counting_and_prob-v0-res.json
+1
-1
tests/testdata/math_counting_and_prob-v1-greedy_until
tests/testdata/math_counting_and_prob-v1-greedy_until
+1
-1
tests/testdata/math_counting_and_prob-v1-res.json
tests/testdata/math_counting_and_prob-v1-res.json
+1
-1
No files found.
tests/testdata/lambada_mt_de-v0-loglikelihood
View file @
121b7096
5ad125e1708499832b2cee8c3388f89f9c0277010fd96fbd3359039ce8105984
5ad125e1708499832b2cee8c3388f89f9c0277010fd96fbd3359039ce8105984
\ No newline at end of file
tests/testdata/lambada_mt_de-v0-res.json
View file @
121b7096
{
"results"
:
{
"lambada_mt_de"
:
{
"acc"
:
0.0
,
"acc_stderr"
:
0.0
,
"ppl"
:
1.6479047769869253
,
"ppl_stderr"
:
0.006497321146240192
}},
"versions"
:
{
"lambada_mt_de"
:
0
}}
{
"results"
:
{
"lambada_mt_de"
:
{
"acc"
:
0.0
,
"acc_stderr"
:
0.0
,
"ppl"
:
1.6479047769869253
,
"ppl_stderr"
:
0.006497321146240192
}},
"versions"
:
{
"lambada_mt_de"
:
0
}}
\ No newline at end of file
tests/testdata/lambada_mt_en-v0-loglikelihood
View file @
121b7096
6829e6a8aa5922e6c92dd31403cc060f242dc0ede4a775e085a70da095ab2e20
6829e6a8aa5922e6c92dd31403cc060f242dc0ede4a775e085a70da095ab2e20
\ No newline at end of file
tests/testdata/lambada_mt_en-v0-res.json
View file @
121b7096
{
"results"
:
{
"lambada_mt_en"
:
{
"acc"
:
0.0
,
"acc_stderr"
:
0.0
,
"ppl"
:
1.6479047769869253
,
"ppl_stderr"
:
0.006497321146240192
}},
"versions"
:
{
"lambada_mt_en"
:
0
}}
{
"results"
:
{
"lambada_mt_en"
:
{
"acc"
:
0.0
,
"acc_stderr"
:
0.0
,
"ppl"
:
1.6479047769869253
,
"ppl_stderr"
:
0.006497321146240192
}},
"versions"
:
{
"lambada_mt_en"
:
0
}}
\ No newline at end of file
tests/testdata/lambada_mt_es-v0-loglikelihood
View file @
121b7096
4a88f4b316c72fe0396c382d6cbb33568ac4d0ad225150d3536635c085359fc9
4a88f4b316c72fe0396c382d6cbb33568ac4d0ad225150d3536635c085359fc9
\ No newline at end of file
tests/testdata/lambada_mt_es-v0-res.json
View file @
121b7096
{
"results"
:
{
"lambada_mt_es"
:
{
"acc"
:
0.0
,
"acc_stderr"
:
0.0
,
"ppl"
:
1.6479047769869253
,
"ppl_stderr"
:
0.006497321146240192
}},
"versions"
:
{
"lambada_mt_es"
:
0
}}
{
"results"
:
{
"lambada_mt_es"
:
{
"acc"
:
0.0
,
"acc_stderr"
:
0.0
,
"ppl"
:
1.6479047769869253
,
"ppl_stderr"
:
0.006497321146240192
}},
"versions"
:
{
"lambada_mt_es"
:
0
}}
\ No newline at end of file
tests/testdata/lambada_mt_fr-v0-loglikelihood
View file @
121b7096
5d16f4a0c51dc6d7b6df2ebeba2bbfa51e700b843779b559b3d90183d7b02a11
5d16f4a0c51dc6d7b6df2ebeba2bbfa51e700b843779b559b3d90183d7b02a11
\ No newline at end of file
tests/testdata/lambada_mt_fr-v0-res.json
View file @
121b7096
{
"results"
:
{
"lambada_mt_fr"
:
{
"acc"
:
0.0
,
"acc_stderr"
:
0.0
,
"ppl"
:
1.6479047769869253
,
"ppl_stderr"
:
0.006497321146240192
}},
"versions"
:
{
"lambada_mt_fr"
:
0
}}
{
"results"
:
{
"lambada_mt_fr"
:
{
"acc"
:
0.0
,
"acc_stderr"
:
0.0
,
"ppl"
:
1.6479047769869253
,
"ppl_stderr"
:
0.006497321146240192
}},
"versions"
:
{
"lambada_mt_fr"
:
0
}}
\ No newline at end of file
tests/testdata/lambada_mt_it-v0-loglikelihood
View file @
121b7096
fd87c6c5cf4e0499c5f9f80e5bd7ee6a4f3d2991902a0cc3ec9e6eaf22d6760a
fd87c6c5cf4e0499c5f9f80e5bd7ee6a4f3d2991902a0cc3ec9e6eaf22d6760a
\ No newline at end of file
tests/testdata/lambada_mt_it-v0-res.json
View file @
121b7096
{
"results"
:
{
"lambada_mt_it"
:
{
"acc"
:
0.0
,
"acc_stderr"
:
0.0
,
"ppl"
:
1.6479047769869253
,
"ppl_stderr"
:
0.006497321146240192
}},
"versions"
:
{
"lambada_mt_it"
:
0
}}
{
"results"
:
{
"lambada_mt_it"
:
{
"acc"
:
0.0
,
"acc_stderr"
:
0.0
,
"ppl"
:
1.6479047769869253
,
"ppl_stderr"
:
0.006497321146240192
}},
"versions"
:
{
"lambada_mt_it"
:
0
}}
\ No newline at end of file
tests/testdata/logiqa-v0-loglikelihood
View file @
121b7096
12495c50454ba5e1ce0753bd18c09aaca516bebd27648d815e37b15229dbf198
12495c50454ba5e1ce0753bd18c09aaca516bebd27648d815e37b15229dbf198
\ No newline at end of file
tests/testdata/logiqa-v0-res.json
View file @
121b7096
{
"results"
:
{
"logiqa"
:
{
"acc"
:
0.25806451612903225
,
"acc_norm"
:
0.2764976958525346
,
"acc_norm_stderr"
:
0.017543209075825194
,
"acc_stderr"
:
0.017162894755127077
}},
"versions"
:
{
"logiqa"
:
0
}}
{
"results"
:
{
"logiqa"
:
{
"acc"
:
0.25806451612903225
,
"acc_norm"
:
0.2764976958525346
,
"acc_norm_stderr"
:
0.017543209075825194
,
"acc_stderr"
:
0.017162894755127077
}},
"versions"
:
{
"logiqa"
:
0
}}
\ No newline at end of file
tests/testdata/math_algebra-v0-greedy_until
View file @
121b7096
f19182ce697a2c095d9e5b56ee6659dc38c93994b69ca75d7c3d3f5fd87572b4
f19182ce697a2c095d9e5b56ee6659dc38c93994b69ca75d7c3d3f5fd87572b4
\ No newline at end of file
tests/testdata/math_algebra-v0-res.json
View file @
121b7096
{
"results"
:
{
"math_algebra"
:
{
"acc"
:
0.0
,
"acc_stderr"
:
0.0
}},
"versions"
:
{
"math_algebra"
:
0
}}
{
"results"
:
{
"math_algebra"
:
{
"acc"
:
0.0
,
"acc_stderr"
:
0.0
}},
"versions"
:
{
"math_algebra"
:
0
}}
\ No newline at end of file
tests/testdata/math_algebra-v1-greedy_until
View file @
121b7096
f19182ce697a2c095d9e5b56ee6659dc38c93994b69ca75d7c3d3f5fd87572b4
f19182ce697a2c095d9e5b56ee6659dc38c93994b69ca75d7c3d3f5fd87572b4
\ No newline at end of file
tests/testdata/math_algebra-v1-res.json
View file @
121b7096
{
"results"
:
{
"math_algebra"
:
{
"acc"
:
0.0
,
"acc_stderr"
:
0.0
}},
"versions"
:
{
"math_algebra"
:
1
}}
{
"results"
:
{
"math_algebra"
:
{
"acc"
:
0.0
,
"acc_stderr"
:
0.0
}},
"versions"
:
{
"math_algebra"
:
1
}}
\ No newline at end of file
tests/testdata/math_counting_and_prob-v0-greedy_until
View file @
121b7096
2aa9ae43ee9dbb2457525247d7b65358632c5eaa9cbfc40cf95a4f17f5d942ad
2aa9ae43ee9dbb2457525247d7b65358632c5eaa9cbfc40cf95a4f17f5d942ad
\ No newline at end of file
tests/testdata/math_counting_and_prob-v0-res.json
View file @
121b7096
{
"results"
:
{
"math_counting_and_prob"
:
{
"acc"
:
0.0
,
"acc_stderr"
:
0.0
}},
"versions"
:
{
"math_counting_and_prob"
:
0
}}
{
"results"
:
{
"math_counting_and_prob"
:
{
"acc"
:
0.0
,
"acc_stderr"
:
0.0
}},
"versions"
:
{
"math_counting_and_prob"
:
0
}}
\ No newline at end of file
tests/testdata/math_counting_and_prob-v1-greedy_until
View file @
121b7096
2aa9ae43ee9dbb2457525247d7b65358632c5eaa9cbfc40cf95a4f17f5d942ad
2aa9ae43ee9dbb2457525247d7b65358632c5eaa9cbfc40cf95a4f17f5d942ad
\ No newline at end of file
tests/testdata/math_counting_and_prob-v1-res.json
View file @
121b7096
{
"results"
:
{
"math_counting_and_prob"
:
{
"acc"
:
0.0
,
"acc_stderr"
:
0.0
}},
"versions"
:
{
"math_counting_and_prob"
:
1
}}
{
"results"
:
{
"math_counting_and_prob"
:
{
"acc"
:
0.0
,
"acc_stderr"
:
0.0
}},
"versions"
:
{
"math_counting_and_prob"
:
1
}}
\ No newline at end of file
Prev
1
…
13
14
15
16
17
18
19
20
21
…
37
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment