Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
lm-evaluation-harness
Commits
720cdf90
Commit
720cdf90
authored
Aug 15, 2024
by
lintangsutawika
Browse files
adjust tag name
parent
09e5f519
Changes
32
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
19 additions
and
19 deletions
+19
-19
lm_eval/tasks/tmlu/default/_tmlu.yaml
lm_eval/tasks/tmlu/default/_tmlu.yaml
+0
-0
lm_eval/tasks/tmlu/default/tmlu_AST_biology.yaml
lm_eval/tasks/tmlu/default/tmlu_AST_biology.yaml
+1
-1
lm_eval/tasks/tmlu/default/tmlu_AST_chemistry.yaml
lm_eval/tasks/tmlu/default/tmlu_AST_chemistry.yaml
+1
-1
lm_eval/tasks/tmlu/default/tmlu_AST_chinese.yaml
lm_eval/tasks/tmlu/default/tmlu_AST_chinese.yaml
+1
-1
lm_eval/tasks/tmlu/default/tmlu_AST_civics.yaml
lm_eval/tasks/tmlu/default/tmlu_AST_civics.yaml
+1
-1
lm_eval/tasks/tmlu/default/tmlu_AST_geography.yaml
lm_eval/tasks/tmlu/default/tmlu_AST_geography.yaml
+1
-1
lm_eval/tasks/tmlu/default/tmlu_AST_history.yaml
lm_eval/tasks/tmlu/default/tmlu_AST_history.yaml
+1
-1
lm_eval/tasks/tmlu/default/tmlu_CAP_biology.yaml
lm_eval/tasks/tmlu/default/tmlu_CAP_biology.yaml
+1
-1
lm_eval/tasks/tmlu/default/tmlu_CAP_chemistry.yaml
lm_eval/tasks/tmlu/default/tmlu_CAP_chemistry.yaml
+1
-1
lm_eval/tasks/tmlu/default/tmlu_CAP_chinese.yaml
lm_eval/tasks/tmlu/default/tmlu_CAP_chinese.yaml
+1
-1
lm_eval/tasks/tmlu/default/tmlu_CAP_civics.yaml
lm_eval/tasks/tmlu/default/tmlu_CAP_civics.yaml
+1
-1
lm_eval/tasks/tmlu/default/tmlu_CAP_earth_science.yaml
lm_eval/tasks/tmlu/default/tmlu_CAP_earth_science.yaml
+1
-1
lm_eval/tasks/tmlu/default/tmlu_CAP_geography.yaml
lm_eval/tasks/tmlu/default/tmlu_CAP_geography.yaml
+1
-1
lm_eval/tasks/tmlu/default/tmlu_CAP_history.yaml
lm_eval/tasks/tmlu/default/tmlu_CAP_history.yaml
+1
-1
lm_eval/tasks/tmlu/default/tmlu_GSAT_biology.yaml
lm_eval/tasks/tmlu/default/tmlu_GSAT_biology.yaml
+1
-1
lm_eval/tasks/tmlu/default/tmlu_GSAT_chemistry.yaml
lm_eval/tasks/tmlu/default/tmlu_GSAT_chemistry.yaml
+1
-1
lm_eval/tasks/tmlu/default/tmlu_GSAT_chinese.yaml
lm_eval/tasks/tmlu/default/tmlu_GSAT_chinese.yaml
+1
-1
lm_eval/tasks/tmlu/default/tmlu_GSAT_civics.yaml
lm_eval/tasks/tmlu/default/tmlu_GSAT_civics.yaml
+1
-1
lm_eval/tasks/tmlu/default/tmlu_GSAT_earth_science.yaml
lm_eval/tasks/tmlu/default/tmlu_GSAT_earth_science.yaml
+1
-1
lm_eval/tasks/tmlu/default/tmlu_GSAT_geography.yaml
lm_eval/tasks/tmlu/default/tmlu_GSAT_geography.yaml
+1
-1
No files found.
lm_eval/tasks/tmlu/default/tmlu.yaml
→
lm_eval/tasks/tmlu/default/
_
tmlu.yaml
View file @
720cdf90
File moved
lm_eval/tasks/tmlu/default/tmlu_AST_biology.yaml
View file @
720cdf90
...
@@ -9,7 +9,7 @@
...
@@ -9,7 +9,7 @@
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}
\n
Answer:"
\
endif
%}
\n
Answer:"
"
group
"
:
"
tmlu_
STEM
"
"
tag
"
:
"
tmlu_
stem_tasks
"
"
group_alias"
:
"
STEM"
"
group_alias"
:
"
STEM"
"
include"
:
"
_default_template_yaml"
"
include"
:
"
_default_template_yaml"
"
task"
:
"
tmlu_AST_biology"
"
task"
:
"
tmlu_AST_biology"
...
...
lm_eval/tasks/tmlu/default/tmlu_AST_chemistry.yaml
View file @
720cdf90
...
@@ -10,7 +10,7 @@
...
@@ -10,7 +10,7 @@
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}
\n
Answer:"
\
endif
%}
\n
Answer:"
"
group
"
:
"
tmlu_
STEM
"
"
tag
"
:
"
tmlu_
stem_tasks
"
"
group_alias"
:
"
STEM"
"
group_alias"
:
"
STEM"
"
include"
:
"
_default_template_yaml"
"
include"
:
"
_default_template_yaml"
"
task"
:
"
tmlu_AST_chemistry"
"
task"
:
"
tmlu_AST_chemistry"
...
...
lm_eval/tasks/tmlu/default/tmlu_AST_chinese.yaml
View file @
720cdf90
...
@@ -9,7 +9,7 @@
...
@@ -9,7 +9,7 @@
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}
\n
Answer:"
\
endif
%}
\n
Answer:"
"
group
"
:
"
tmlu_humanities"
"
tag
"
:
"
tmlu_humanities
_tasks
"
"
group_alias"
:
"
humanities"
"
group_alias"
:
"
humanities"
"
include"
:
"
_default_template_yaml"
"
include"
:
"
_default_template_yaml"
"
task"
:
"
tmlu_AST_chinese"
"
task"
:
"
tmlu_AST_chinese"
...
...
lm_eval/tasks/tmlu/default/tmlu_AST_civics.yaml
View file @
720cdf90
...
@@ -9,7 +9,7 @@
...
@@ -9,7 +9,7 @@
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}
\n
Answer:"
\
endif
%}
\n
Answer:"
"
group
"
:
"
tmlu_social_sciences"
"
tag
"
:
"
tmlu_social_sciences
_tasks
"
"
group_alias"
:
"
social
sciences"
"
group_alias"
:
"
social
sciences"
"
include"
:
"
_default_template_yaml"
"
include"
:
"
_default_template_yaml"
"
task"
:
"
tmlu_AST_civics"
"
task"
:
"
tmlu_AST_civics"
...
...
lm_eval/tasks/tmlu/default/tmlu_AST_geography.yaml
View file @
720cdf90
...
@@ -9,7 +9,7 @@
...
@@ -9,7 +9,7 @@
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}
\n
Answer:"
\
endif
%}
\n
Answer:"
"
group
"
:
"
tmlu_social_sciences"
"
tag
"
:
"
tmlu_social_sciences
_tasks
"
"
group_alias"
:
"
social
sciences"
"
group_alias"
:
"
social
sciences"
"
include"
:
"
_default_template_yaml"
"
include"
:
"
_default_template_yaml"
"
task"
:
"
tmlu_AST_geography"
"
task"
:
"
tmlu_AST_geography"
...
...
lm_eval/tasks/tmlu/default/tmlu_AST_history.yaml
View file @
720cdf90
...
@@ -9,7 +9,7 @@
...
@@ -9,7 +9,7 @@
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}
\n
Answer:"
\
endif
%}
\n
Answer:"
"
group
"
:
"
tmlu_humanities"
"
tag
"
:
"
tmlu_humanities
_tasks
"
"
group_alias"
:
"
humanities"
"
group_alias"
:
"
humanities"
"
include"
:
"
_default_template_yaml"
"
include"
:
"
_default_template_yaml"
"
task"
:
"
tmlu_AST_history"
"
task"
:
"
tmlu_AST_history"
...
...
lm_eval/tasks/tmlu/default/tmlu_CAP_biology.yaml
View file @
720cdf90
...
@@ -9,7 +9,7 @@
...
@@ -9,7 +9,7 @@
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}
\n
Answer:"
\
endif
%}
\n
Answer:"
"
group
"
:
"
tmlu_
STEM
"
"
tag
"
:
"
tmlu_
stem_tasks
"
"
group_alias"
:
"
STEM"
"
group_alias"
:
"
STEM"
"
include"
:
"
_default_template_yaml"
"
include"
:
"
_default_template_yaml"
"
task"
:
"
tmlu_CAP_biology"
"
task"
:
"
tmlu_CAP_biology"
...
...
lm_eval/tasks/tmlu/default/tmlu_CAP_chemistry.yaml
View file @
720cdf90
...
@@ -9,7 +9,7 @@
...
@@ -9,7 +9,7 @@
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}
\n
Answer:"
\
endif
%}
\n
Answer:"
"
group
"
:
"
tmlu_
STEM
"
"
tag
"
:
"
tmlu_
stem_tasks
"
"
group_alias"
:
"
STEM"
"
group_alias"
:
"
STEM"
"
include"
:
"
_default_template_yaml"
"
include"
:
"
_default_template_yaml"
"
task"
:
"
tmlu_CAP_chemistry"
"
task"
:
"
tmlu_CAP_chemistry"
...
...
lm_eval/tasks/tmlu/default/tmlu_CAP_chinese.yaml
View file @
720cdf90
...
@@ -9,7 +9,7 @@
...
@@ -9,7 +9,7 @@
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}
\n
Answer:"
\
endif
%}
\n
Answer:"
"
group
"
:
"
tmlu_humanities"
"
tag
"
:
"
tmlu_humanities
_tasks
"
"
group_alias"
:
"
humanities"
"
group_alias"
:
"
humanities"
"
include"
:
"
_default_template_yaml"
"
include"
:
"
_default_template_yaml"
"
task"
:
"
tmlu_CAP_chinese"
"
task"
:
"
tmlu_CAP_chinese"
...
...
lm_eval/tasks/tmlu/default/tmlu_CAP_civics.yaml
View file @
720cdf90
...
@@ -9,7 +9,7 @@
...
@@ -9,7 +9,7 @@
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}
\n
Answer:"
\
endif
%}
\n
Answer:"
"
group
"
:
"
tmlu_social_sciences"
"
tag
"
:
"
tmlu_social_sciences
_tasks
"
"
group_alias"
:
"
social
sciences"
"
group_alias"
:
"
social
sciences"
"
include"
:
"
_default_template_yaml"
"
include"
:
"
_default_template_yaml"
"
task"
:
"
tmlu_CAP_civics"
"
task"
:
"
tmlu_CAP_civics"
...
...
lm_eval/tasks/tmlu/default/tmlu_CAP_earth_science.yaml
View file @
720cdf90
...
@@ -9,7 +9,7 @@
...
@@ -9,7 +9,7 @@
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}
\n
Answer:"
\
endif
%}
\n
Answer:"
"
group
"
:
"
tmlu_
STEM
"
"
tag
"
:
"
tmlu_
stem_tasks
"
"
group_alias"
:
"
STEM"
"
group_alias"
:
"
STEM"
"
include"
:
"
_default_template_yaml"
"
include"
:
"
_default_template_yaml"
"
task"
:
"
tmlu_CAP_earth_science"
"
task"
:
"
tmlu_CAP_earth_science"
...
...
lm_eval/tasks/tmlu/default/tmlu_CAP_geography.yaml
View file @
720cdf90
...
@@ -9,7 +9,7 @@
...
@@ -9,7 +9,7 @@
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}
\n
Answer:"
\
endif
%}
\n
Answer:"
"
group
"
:
"
tmlu_social_sciences"
"
tag
"
:
"
tmlu_social_sciences
_tasks
"
"
group_alias"
:
"
social
sciences"
"
group_alias"
:
"
social
sciences"
"
include"
:
"
_default_template_yaml"
"
include"
:
"
_default_template_yaml"
"
task"
:
"
tmlu_CAP_geography"
"
task"
:
"
tmlu_CAP_geography"
...
...
lm_eval/tasks/tmlu/default/tmlu_CAP_history.yaml
View file @
720cdf90
...
@@ -9,7 +9,7 @@
...
@@ -9,7 +9,7 @@
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}
\n
Answer:"
\
endif
%}
\n
Answer:"
"
group
"
:
"
tmlu_humanities"
"
tag
"
:
"
tmlu_humanities
_tasks
"
"
group_alias"
:
"
humanities"
"
group_alias"
:
"
humanities"
"
include"
:
"
_default_template_yaml"
"
include"
:
"
_default_template_yaml"
"
task"
:
"
tmlu_CAP_history"
"
task"
:
"
tmlu_CAP_history"
...
...
lm_eval/tasks/tmlu/default/tmlu_GSAT_biology.yaml
View file @
720cdf90
...
@@ -10,7 +10,7 @@
...
@@ -10,7 +10,7 @@
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}
\n
Answer:"
\
endif
%}
\n
Answer:"
"
group
"
:
"
tmlu_
STEM
"
"
tag
"
:
"
tmlu_
stem_tasks
"
"
group_alias"
:
"
STEM"
"
group_alias"
:
"
STEM"
"
include"
:
"
_default_template_yaml"
"
include"
:
"
_default_template_yaml"
"
task"
:
"
tmlu_GSAT_biology"
"
task"
:
"
tmlu_GSAT_biology"
...
...
lm_eval/tasks/tmlu/default/tmlu_GSAT_chemistry.yaml
View file @
720cdf90
...
@@ -10,7 +10,7 @@
...
@@ -10,7 +10,7 @@
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}
\n
Answer:"
\
endif
%}
\n
Answer:"
"
group
"
:
"
tmlu_
STEM
"
"
tag
"
:
"
tmlu_
stem_tasks
"
"
group_alias"
:
"
STEM"
"
group_alias"
:
"
STEM"
"
include"
:
"
_default_template_yaml"
"
include"
:
"
_default_template_yaml"
"
task"
:
"
tmlu_GSAT_chemistry"
"
task"
:
"
tmlu_GSAT_chemistry"
...
...
lm_eval/tasks/tmlu/default/tmlu_GSAT_chinese.yaml
View file @
720cdf90
...
@@ -9,7 +9,7 @@
...
@@ -9,7 +9,7 @@
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}
\n
Answer:"
\
endif
%}
\n
Answer:"
"
group
"
:
"
tmlu_humanities"
"
tag
"
:
"
tmlu_humanities
_tasks
"
"
group_alias"
:
"
humanities"
"
group_alias"
:
"
humanities"
"
include"
:
"
_default_template_yaml"
"
include"
:
"
_default_template_yaml"
"
task"
:
"
tmlu_GSAT_chinese"
"
task"
:
"
tmlu_GSAT_chinese"
...
...
lm_eval/tasks/tmlu/default/tmlu_GSAT_civics.yaml
View file @
720cdf90
...
@@ -9,7 +9,7 @@
...
@@ -9,7 +9,7 @@
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}
\n
Answer:"
\
endif
%}
\n
Answer:"
"
group
"
:
"
tmlu_social_sciences"
"
tag
"
:
"
tmlu_social_sciences
_tasks
"
"
group_alias"
:
"
social
sciences"
"
group_alias"
:
"
social
sciences"
"
include"
:
"
_default_template_yaml"
"
include"
:
"
_default_template_yaml"
"
task"
:
"
tmlu_GSAT_civics"
"
task"
:
"
tmlu_GSAT_civics"
...
...
lm_eval/tasks/tmlu/default/tmlu_GSAT_earth_science.yaml
View file @
720cdf90
...
@@ -10,7 +10,7 @@
...
@@ -10,7 +10,7 @@
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}
\n
Answer:"
\
endif
%}
\n
Answer:"
"
group
"
:
"
tmlu_
STEM
"
"
tag
"
:
"
tmlu_
stem_tasks
"
"
group_alias"
:
"
STEM"
"
group_alias"
:
"
STEM"
"
include"
:
"
_default_template_yaml"
"
include"
:
"
_default_template_yaml"
"
task"
:
"
tmlu_GSAT_earth_science"
"
task"
:
"
tmlu_GSAT_earth_science"
...
...
lm_eval/tasks/tmlu/default/tmlu_GSAT_geography.yaml
View file @
720cdf90
...
@@ -9,7 +9,7 @@
...
@@ -9,7 +9,7 @@
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
D.
{{choices[3]}}{%
if
choices
is
defined
and
choices|length
>
4
%}
\n
E.
{{choices[4]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}{%
if
choices
is
defined
and
choices|length
>
5
%}
\n
F.
{{choices[5]}}{%
\
\
endif
%}
\n
Answer:"
\
endif
%}
\n
Answer:"
"
group
"
:
"
tmlu_social_sciences"
"
tag
"
:
"
tmlu_social_sciences
_tasks
"
"
group_alias"
:
"
social
sciences"
"
group_alias"
:
"
social
sciences"
"
include"
:
"
_default_template_yaml"
"
include"
:
"
_default_template_yaml"
"
task"
:
"
tmlu_GSAT_geography"
"
task"
:
"
tmlu_GSAT_geography"
...
...
Prev
1
2
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment