Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
lm-evaluation-harness
Commits
3d1b8f43
"model.properties" did not exist on "e89836bddc7d11cf406da85cd63aa9cc31e0b408"
Unverified
Commit
3d1b8f43
authored
Jul 03, 2024
by
Lintang Sutawika
Committed by
GitHub
Jul 03, 2024
Browse files
Merge branch 'main' into group-agg-rework
parents
e200c24e
d855d0ba
Changes
317
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
120 additions
and
0 deletions
+120
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_high_history.yaml
lm_eval/tasks/arabicmmlu/arabicmmlu_high_history.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_high_islamic_studies.yaml
...val/tasks/arabicmmlu/arabicmmlu_high_islamic_studies.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_high_philosophy.yaml
lm_eval/tasks/arabicmmlu/arabicmmlu_high_philosophy.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_high_physics.yaml
lm_eval/tasks/arabicmmlu/arabicmmlu_high_physics.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_islamic_studies.yaml
lm_eval/tasks/arabicmmlu/arabicmmlu_islamic_studies.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_arabic_language.yaml
...l/tasks/arabicmmlu/arabicmmlu_middle_arabic_language.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_civics.yaml
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_civics.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_computer_science.yaml
.../tasks/arabicmmlu/arabicmmlu_middle_computer_science.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_economics.yaml
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_economics.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_general_knowledge.yaml
...tasks/arabicmmlu/arabicmmlu_middle_general_knowledge.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_geography.yaml
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_geography.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_history.yaml
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_history.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_islamic_studies.yaml
...l/tasks/arabicmmlu/arabicmmlu_middle_islamic_studies.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_natural_science.yaml
...l/tasks/arabicmmlu/arabicmmlu_middle_natural_science.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_social_science.yaml
...al/tasks/arabicmmlu/arabicmmlu_middle_social_science.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_primary_arabic_language.yaml
.../tasks/arabicmmlu/arabicmmlu_primary_arabic_language.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_primary_computer_science.yaml
...tasks/arabicmmlu/arabicmmlu_primary_computer_science.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_primary_general_knowledge.yaml
...asks/arabicmmlu/arabicmmlu_primary_general_knowledge.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_primary_geography.yaml
lm_eval/tasks/arabicmmlu/arabicmmlu_primary_geography.yaml
+6
-0
lm_eval/tasks/arabicmmlu/arabicmmlu_primary_history.yaml
lm_eval/tasks/arabicmmlu/arabicmmlu_primary_history.yaml
+6
-0
No files found.
lm_eval/tasks/arabicmmlu/arabicmmlu_high_history.yaml
0 → 100644
View file @
3d1b8f43
"dataset_name": "High History"
"group": "arabicmmlu_humanities"
"group_alias": "humanities"
"include": "_default_template_yaml"
"task": "arabicmmlu_high_history"
"task_alias": "High History"
lm_eval/tasks/arabicmmlu/arabicmmlu_high_islamic_studies.yaml
0 → 100644
View file @
3d1b8f43
"dataset_name": "High Islamic Studies"
"group": "arabicmmlu_humanities"
"group_alias": "humanities"
"include": "_default_template_yaml"
"task": "arabicmmlu_high_islamic_studies"
"task_alias": "High Islamic Studies"
lm_eval/tasks/arabicmmlu/arabicmmlu_high_philosophy.yaml
0 → 100644
View file @
3d1b8f43
"dataset_name": "High Philosophy"
"group": "arabicmmlu_humanities"
"group_alias": "humanities"
"include": "_default_template_yaml"
"task": "arabicmmlu_high_philosophy"
"task_alias": "High Philosophy"
lm_eval/tasks/arabicmmlu/arabicmmlu_high_physics.yaml
0 → 100644
View file @
3d1b8f43
"dataset_name": "High Physics"
"group": "arabicmmlu_stem"
"group_alias": "stem"
"include": "_default_template_yaml"
"task": "arabicmmlu_high_physics"
"task_alias": "High Physics"
lm_eval/tasks/arabicmmlu/arabicmmlu_islamic_studies.yaml
0 → 100644
View file @
3d1b8f43
"dataset_name": "Islamic Studies"
"group": "arabicmmlu_humanities"
"group_alias": "humanities"
"include": "_default_template_yaml"
"task": "arabicmmlu_islamic_studies"
"task_alias": "Islamic Studies"
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_arabic_language.yaml
0 → 100644
View file @
3d1b8f43
"dataset_name": "Middle Arabic Language"
"group": "arabicmmlu_language"
"group_alias": "language"
"include": "_default_template_yaml"
"task": "arabicmmlu_middle_arabic_language"
"task_alias": "Middle Arabic Language"
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_civics.yaml
0 → 100644
View file @
3d1b8f43
"dataset_name": "Middle Civics"
"group": "arabicmmlu_social_science"
"group_alias": "social science"
"include": "_default_template_yaml"
"task": "arabicmmlu_middle_civics"
"task_alias": "Middle Civics"
lm_eval/tasks/ammlu/ammlu_moral_scenarios.yaml → lm_eval/tasks/arabicmmlu/arabicmmlu_middle_computer_science.yaml
View file @
3d1b8f43
"
dataset_name"
:
"
moral_scenarios"
"
dataset_name"
:
"
Middle
Computer
Science"
"
description"
:
"
فم
بعملية
التقييم
في
مجال
العلوم
الانسانية
\n\n
"
"
group"
:
"
arabicmmlu_stem"
"
group_alias"
:
"
stem"
"
include"
:
"
_default_template_yaml"
"
include"
:
"
_default_template_yaml"
"
task"
:
"
ammlu_moral_scenarios"
"
task"
:
"
arabicmmlu_middle_computer_science"
"
task_alias"
:
"
Middle
Computer
Science"
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_economics.yaml
0 → 100644
View file @
3d1b8f43
"dataset_name": "Middle Economics"
"group": "arabicmmlu_social_science"
"group_alias": "social science"
"include": "_default_template_yaml"
"task": "arabicmmlu_middle_economics"
"task_alias": "Middle Economics"
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_general_knowledge.yaml
0 → 100644
View file @
3d1b8f43
"dataset_name": "Middle General Knowledge"
"group": "arabicmmlu_other"
"group_alias": "other"
"include": "_default_template_yaml"
"task": "arabicmmlu_middle_general_knowledge"
"task_alias": "Middle General Knowledge"
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_geography.yaml
0 → 100644
View file @
3d1b8f43
"dataset_name": "Middle Geography"
"group": "arabicmmlu_social_science"
"group_alias": "social science"
"include": "_default_template_yaml"
"task": "arabicmmlu_middle_geography"
"task_alias": "Middle Geography"
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_history.yaml
0 → 100644
View file @
3d1b8f43
"dataset_name": "Middle History"
"group": "arabicmmlu_humanities"
"group_alias": "humanities"
"include": "_default_template_yaml"
"task": "arabicmmlu_middle_history"
"task_alias": "Middle History"
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_islamic_studies.yaml
0 → 100644
View file @
3d1b8f43
"dataset_name": "Middle Islamic Studies"
"group": "arabicmmlu_humanities"
"group_alias": "humanities"
"include": "_default_template_yaml"
"task": "arabicmmlu_middle_islamic_studies"
"task_alias": "Middle Islamic Studies"
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_natural_science.yaml
0 → 100644
View file @
3d1b8f43
"dataset_name": "Middle Natural Science"
"group": "arabicmmlu_stem"
"group_alias": "stem"
"include": "_default_template_yaml"
"task": "arabicmmlu_middle_natural_science"
"task_alias": "Middle Natural Science"
lm_eval/tasks/arabicmmlu/arabicmmlu_middle_social_science.yaml
0 → 100644
View file @
3d1b8f43
"dataset_name": "Middle Social Science"
"group": "arabicmmlu_social_science"
"group_alias": "social science"
"include": "_default_template_yaml"
"task": "arabicmmlu_middle_social_science"
"task_alias": "Middle Social Science"
lm_eval/tasks/arabicmmlu/arabicmmlu_primary_arabic_language.yaml
0 → 100644
View file @
3d1b8f43
"dataset_name": "Primary Arabic Language"
"group": "arabicmmlu_language"
"group_alias": "language"
"include": "_default_template_yaml"
"task": "arabicmmlu_primary_arabic_language"
"task_alias": "Primary Arabic Language"
lm_eval/tasks/arabicmmlu/arabicmmlu_primary_computer_science.yaml
0 → 100644
View file @
3d1b8f43
"dataset_name": "Primary Computer Science"
"group": "arabicmmlu_stem"
"group_alias": "stem"
"include": "_default_template_yaml"
"task": "arabicmmlu_primary_computer_science"
"task_alias": "Primary Computer Science"
lm_eval/tasks/arabicmmlu/arabicmmlu_primary_general_knowledge.yaml
0 → 100644
View file @
3d1b8f43
"dataset_name": "Primary General Knowledge"
"group": "arabicmmlu_other"
"group_alias": "other"
"include": "_default_template_yaml"
"task": "arabicmmlu_primary_general_knowledge"
"task_alias": "Primary General Knowledge"
lm_eval/tasks/arabicmmlu/arabicmmlu_primary_geography.yaml
0 → 100644
View file @
3d1b8f43
"dataset_name": "Primary Geography"
"group": "arabicmmlu_social_science"
"group_alias": "social science"
"include": "_default_template_yaml"
"task": "arabicmmlu_primary_geography"
"task_alias": "Primary Geography"
lm_eval/tasks/arabicmmlu/arabicmmlu_primary_history.yaml
0 → 100644
View file @
3d1b8f43
"dataset_name": "Primary History"
"group": "arabicmmlu_humanities"
"group_alias": "humanities"
"include": "_default_template_yaml"
"task": "arabicmmlu_primary_history"
"task_alias": "Primary History"
Prev
1
2
3
4
5
6
7
8
9
10
…
16
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment