Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
lm-evaluation-harness
Commits
bb5b46d7
Unverified
Commit
bb5b46d7
authored
Jun 24, 2024
by
Yu Shi Jie
Committed by
GitHub
Jun 24, 2024
Browse files
Merge branch 'EleutherAI:main' into mmlu-pro
parents
1e4e058c
6f7b4a05
Changes
90
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
120 additions
and
0 deletions
+120
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_high_history.yaml
lm_eval/tasks/arabicmmlu/arabicmmlu_high_history.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_high_islamic_studies.yaml
...val/tasks/arabicmmlu/arabicmmlu_high_islamic_studies.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_high_philosophy.yaml
lm_eval/tasks/arabicmmlu/arabicmmlu_high_philosophy.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_high_physics.yaml
lm_eval/tasks/arabicmmlu/arabicmmlu_high_physics.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_islamic_studies.yaml
lm_eval/tasks/arabicmmlu/arabicmmlu_islamic_studies.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_arabic_language.yaml
...l/tasks/arabicmmlu/arabicmmlu_middle_arabic_language.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_civics.yaml
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_civics.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_computer_science.yaml
.../tasks/arabicmmlu/arabicmmlu_middle_computer_science.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_economics.yaml
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_economics.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_general_knowledge.yaml
...tasks/arabicmmlu/arabicmmlu_middle_general_knowledge.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_geography.yaml
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_geography.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_history.yaml
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_history.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_islamic_studies.yaml
...l/tasks/arabicmmlu/arabicmmlu_middle_islamic_studies.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_natural_science.yaml
...l/tasks/arabicmmlu/arabicmmlu_middle_natural_science.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_social_science.yaml
...al/tasks/arabicmmlu/arabicmmlu_middle_social_science.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_primary_arabic_language.yaml
.../tasks/arabicmmlu/arabicmmlu_primary_arabic_language.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_primary_computer_science.yaml
...tasks/arabicmmlu/arabicmmlu_primary_computer_science.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_primary_general_knowledge.yaml
...asks/arabicmmlu/arabicmmlu_primary_general_knowledge.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_primary_geography.yaml
lm_eval/tasks/arabicmmlu/arabicmmlu_primary_geography.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_primary_history.yaml
lm_eval/tasks/arabicmmlu/arabicmmlu_primary_history.yaml
+6
-0
No files found.
lm_eval/tasks/arabicmmlu/arabicmmlu_high_history.yaml
0 → 100644
View file @
bb5b46d7
"dataset_name": "High History"
"group": "arabicmmlu_humanities"
"group_alias": "humanities"
"include": "_default_template_yaml"
"task": "arabicmmlu_high_history"
"task_alias": "High History"
lm_eval/tasks/arabicmmlu/arabicmmlu_high_islamic_studies.yaml
0 → 100644
View file @
bb5b46d7
"dataset_name": "High Islamic Studies"
"group": "arabicmmlu_humanities"
"group_alias": "humanities"
"include": "_default_template_yaml"
"task": "arabicmmlu_high_islamic_studies"
"task_alias": "High Islamic Studies"
lm_eval/tasks/arabicmmlu/arabicmmlu_high_philosophy.yaml
0 → 100644
View file @
bb5b46d7
"dataset_name": "High Philosophy"
"group": "arabicmmlu_humanities"
"group_alias": "humanities"
"include": "_default_template_yaml"
"task": "arabicmmlu_high_philosophy"
"task_alias": "High Philosophy"
lm_eval/tasks/arabicmmlu/arabicmmlu_high_physics.yaml
0 → 100644
View file @
bb5b46d7
"dataset_name": "High Physics"
"group": "arabicmmlu_stem"
"group_alias": "stem"
"include": "_default_template_yaml"
"task": "arabicmmlu_high_physics"
"task_alias": "High Physics"
lm_eval/tasks/arabicmmlu/arabicmmlu_islamic_studies.yaml
0 → 100644
View file @
bb5b46d7
"dataset_name": "Islamic Studies"
"group": "arabicmmlu_humanities"
"group_alias": "humanities"
"include": "_default_template_yaml"
"task": "arabicmmlu_islamic_studies"
"task_alias": "Islamic Studies"
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_arabic_language.yaml
0 → 100644
View file @
bb5b46d7
"dataset_name": "Middle Arabic Language"
"group": "arabicmmlu_language"
"group_alias": "language"
"include": "_default_template_yaml"
"task": "arabicmmlu_middle_arabic_language"
"task_alias": "Middle Arabic Language"
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_civics.yaml
0 → 100644
View file @
bb5b46d7
"dataset_name": "Middle Civics"
"group": "arabicmmlu_social_science"
"group_alias": "social science"
"include": "_default_template_yaml"
"task": "arabicmmlu_middle_civics"
"task_alias": "Middle Civics"
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_computer_science.yaml
0 → 100644
View file @
bb5b46d7
"dataset_name": "Middle Computer Science"
"group": "arabicmmlu_stem"
"group_alias": "stem"
"include": "_default_template_yaml"
"task": "arabicmmlu_middle_computer_science"
"task_alias": "Middle Computer Science"
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_economics.yaml
0 → 100644
View file @
bb5b46d7
"dataset_name": "Middle Economics"
"group": "arabicmmlu_social_science"
"group_alias": "social science"
"include": "_default_template_yaml"
"task": "arabicmmlu_middle_economics"
"task_alias": "Middle Economics"
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_general_knowledge.yaml
0 → 100644
View file @
bb5b46d7
"dataset_name": "Middle General Knowledge"
"group": "arabicmmlu_other"
"group_alias": "other"
"include": "_default_template_yaml"
"task": "arabicmmlu_middle_general_knowledge"
"task_alias": "Middle General Knowledge"
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_geography.yaml
0 → 100644
View file @
bb5b46d7
"dataset_name": "Middle Geography"
"group": "arabicmmlu_social_science"
"group_alias": "social science"
"include": "_default_template_yaml"
"task": "arabicmmlu_middle_geography"
"task_alias": "Middle Geography"
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_history.yaml
0 → 100644
View file @
bb5b46d7
"dataset_name": "Middle History"
"group": "arabicmmlu_humanities"
"group_alias": "humanities"
"include": "_default_template_yaml"
"task": "arabicmmlu_middle_history"
"task_alias": "Middle History"
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_islamic_studies.yaml
0 → 100644
View file @
bb5b46d7
"dataset_name": "Middle Islamic Studies"
"group": "arabicmmlu_humanities"
"group_alias": "humanities"
"include": "_default_template_yaml"
"task": "arabicmmlu_middle_islamic_studies"
"task_alias": "Middle Islamic Studies"
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_natural_science.yaml
0 → 100644
View file @
bb5b46d7
"dataset_name": "Middle Natural Science"
"group": "arabicmmlu_stem"
"group_alias": "stem"
"include": "_default_template_yaml"
"task": "arabicmmlu_middle_natural_science"
"task_alias": "Middle Natural Science"
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_social_science.yaml
0 → 100644
View file @
bb5b46d7
"dataset_name": "Middle Social Science"
"group": "arabicmmlu_social_science"
"group_alias": "social science"
"include": "_default_template_yaml"
"task": "arabicmmlu_middle_social_science"
"task_alias": "Middle Social Science"
lm_eval/tasks/arabicmmlu/arabicmmlu_primary_arabic_language.yaml
0 → 100644
View file @
bb5b46d7
"dataset_name": "Primary Arabic Language"
"group": "arabicmmlu_language"
"group_alias": "language"
"include": "_default_template_yaml"
"task": "arabicmmlu_primary_arabic_language"
"task_alias": "Primary Arabic Language"
lm_eval/tasks/arabicmmlu/arabicmmlu_primary_computer_science.yaml
0 → 100644
View file @
bb5b46d7
"dataset_name": "Primary Computer Science"
"group": "arabicmmlu_stem"
"group_alias": "stem"
"include": "_default_template_yaml"
"task": "arabicmmlu_primary_computer_science"
"task_alias": "Primary Computer Science"
lm_eval/tasks/arabicmmlu/arabicmmlu_primary_general_knowledge.yaml
0 → 100644
View file @
bb5b46d7
"dataset_name": "Primary General Knowledge"
"group": "arabicmmlu_other"
"group_alias": "other"
"include": "_default_template_yaml"
"task": "arabicmmlu_primary_general_knowledge"
"task_alias": "Primary General Knowledge"
lm_eval/tasks/arabicmmlu/arabicmmlu_primary_geography.yaml
0 → 100644
View file @
bb5b46d7
"dataset_name": "Primary Geography"
"group": "arabicmmlu_social_science"
"group_alias": "social science"
"include": "_default_template_yaml"
"task": "arabicmmlu_primary_geography"
"task_alias": "Primary Geography"
lm_eval/tasks/arabicmmlu/arabicmmlu_primary_history.yaml
0 → 100644
View file @
bb5b46d7
"dataset_name": "Primary History"
"group": "arabicmmlu_humanities"
"group_alias": "humanities"
"include": "_default_template_yaml"
"task": "arabicmmlu_primary_history"
"task_alias": "Primary History"
Prev
1
2
3
4
5
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment