Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
lm-evaluation-harness
Commits
90ad5db7
Commit
90ad5db7
authored
Mar 01, 2024
by
lintangsutawika
Browse files
merged main
parents
f692caa9
b177c82c
Changes
484
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
54 additions
and
6 deletions
+54
-6
lm_eval/tasks/kmmlu/hard/kmmlu_hard_machine_design_and_manufacturing.yaml
...mlu/hard/kmmlu_hard_machine_design_and_manufacturing.yaml
+3
-0
lm_eval/tasks/kmmlu/hard/kmmlu_hard_management.yaml
lm_eval/tasks/kmmlu/hard/kmmlu_hard_management.yaml
+3
-0
lm_eval/tasks/kmmlu/hard/kmmlu_hard_maritime_engineering.yaml
...val/tasks/kmmlu/hard/kmmlu_hard_maritime_engineering.yaml
+3
-0
lm_eval/tasks/kmmlu/hard/kmmlu_hard_marketing.yaml
lm_eval/tasks/kmmlu/hard/kmmlu_hard_marketing.yaml
+3
-0
lm_eval/tasks/kmmlu/hard/kmmlu_hard_materials_engineering.yaml
...al/tasks/kmmlu/hard/kmmlu_hard_materials_engineering.yaml
+3
-0
lm_eval/tasks/kmmlu/hard/kmmlu_hard_math.yaml
lm_eval/tasks/kmmlu/hard/kmmlu_hard_math.yaml
+3
-0
lm_eval/tasks/kmmlu/hard/kmmlu_hard_mechanical_engineering.yaml
...l/tasks/kmmlu/hard/kmmlu_hard_mechanical_engineering.yaml
+3
-0
lm_eval/tasks/kmmlu/hard/kmmlu_hard_nondestructive_testing.yaml
...l/tasks/kmmlu/hard/kmmlu_hard_nondestructive_testing.yaml
+3
-0
lm_eval/tasks/kmmlu/hard/kmmlu_hard_patent.yaml
lm_eval/tasks/kmmlu/hard/kmmlu_hard_patent.yaml
+3
-0
lm_eval/tasks/kmmlu/hard/kmmlu_hard_political_science_and_sociology.yaml
...mmlu/hard/kmmlu_hard_political_science_and_sociology.yaml
+3
-0
lm_eval/tasks/kmmlu/hard/kmmlu_hard_psychology.yaml
lm_eval/tasks/kmmlu/hard/kmmlu_hard_psychology.yaml
+3
-0
lm_eval/tasks/kmmlu/hard/kmmlu_hard_public_safety.yaml
lm_eval/tasks/kmmlu/hard/kmmlu_hard_public_safety.yaml
+3
-0
lm_eval/tasks/kmmlu/hard/kmmlu_hard_railway_and_automotive_engineering.yaml
...u/hard/kmmlu_hard_railway_and_automotive_engineering.yaml
+3
-0
lm_eval/tasks/kmmlu/hard/kmmlu_hard_real_estate.yaml
lm_eval/tasks/kmmlu/hard/kmmlu_hard_real_estate.yaml
+3
-0
lm_eval/tasks/kmmlu/hard/kmmlu_hard_refrigerating_machinery.yaml
.../tasks/kmmlu/hard/kmmlu_hard_refrigerating_machinery.yaml
+3
-0
lm_eval/tasks/kmmlu/hard/kmmlu_hard_social_welfare.yaml
lm_eval/tasks/kmmlu/hard/kmmlu_hard_social_welfare.yaml
+3
-0
lm_eval/tasks/kmmlu/hard/kmmlu_hard_taxation.yaml
lm_eval/tasks/kmmlu/hard/kmmlu_hard_taxation.yaml
+3
-0
lm_eval/tasks/kmmlu/hard/kmmlu_hard_telecommunications_and_wireless_technology.yaml
...mmlu_hard_telecommunications_and_wireless_technology.yaml
+3
-0
lm_eval/tasks/kmmlu/kmmlu_accounting.yaml
lm_eval/tasks/kmmlu/kmmlu_accounting.yaml
+0
-3
lm_eval/tasks/kmmlu/kmmlu_agricultural_sciences.yaml
lm_eval/tasks/kmmlu/kmmlu_agricultural_sciences.yaml
+0
-3
No files found.
lm_eval/tasks/kmmlu/hard/kmmlu_hard_machine_design_and_manufacturing.yaml
0 → 100644
View file @
90ad5db7
dataset_name
:
machine_design_and_manufacturing
include
:
_hard_kmmlu_yaml
task
:
kmmlu_hard_machine_design_and_manufacturing
lm_eval/tasks/kmmlu/hard/kmmlu_hard_management.yaml
0 → 100644
View file @
90ad5db7
dataset_name
:
management
include
:
_hard_kmmlu_yaml
task
:
kmmlu_hard_management
lm_eval/tasks/kmmlu/hard/kmmlu_hard_maritime_engineering.yaml
0 → 100644
View file @
90ad5db7
dataset_name
:
maritime_engineering
include
:
_hard_kmmlu_yaml
task
:
kmmlu_hard_maritime_engineering
lm_eval/tasks/kmmlu/hard/kmmlu_hard_marketing.yaml
0 → 100644
View file @
90ad5db7
dataset_name
:
marketing
include
:
_hard_kmmlu_yaml
task
:
kmmlu_hard_marketing
lm_eval/tasks/kmmlu/hard/kmmlu_hard_materials_engineering.yaml
0 → 100644
View file @
90ad5db7
dataset_name
:
materials_engineering
include
:
_hard_kmmlu_yaml
task
:
kmmlu_hard_materials_engineering
lm_eval/tasks/kmmlu/hard/kmmlu_hard_math.yaml
0 → 100644
View file @
90ad5db7
dataset_name
:
math
include
:
_hard_kmmlu_yaml
task
:
kmmlu_hard_math
lm_eval/tasks/kmmlu/hard/kmmlu_hard_mechanical_engineering.yaml
0 → 100644
View file @
90ad5db7
dataset_name
:
mechanical_engineering
include
:
_hard_kmmlu_yaml
task
:
kmmlu_hard_mechanical_engineering
lm_eval/tasks/kmmlu/hard/kmmlu_hard_nondestructive_testing.yaml
0 → 100644
View file @
90ad5db7
dataset_name
:
nondestructive_testing
include
:
_hard_kmmlu_yaml
task
:
kmmlu_hard_nondestructive_testing
lm_eval/tasks/kmmlu/hard/kmmlu_hard_patent.yaml
0 → 100644
View file @
90ad5db7
dataset_name
:
patent
include
:
_hard_kmmlu_yaml
task
:
kmmlu_hard_patent
lm_eval/tasks/kmmlu/hard/kmmlu_hard_political_science_and_sociology.yaml
0 → 100644
View file @
90ad5db7
dataset_name
:
political_science_and_sociology
include
:
_hard_kmmlu_yaml
task
:
kmmlu_hard_political_science_and_sociology
lm_eval/tasks/kmmlu/hard/kmmlu_hard_psychology.yaml
0 → 100644
View file @
90ad5db7
dataset_name
:
psychology
include
:
_hard_kmmlu_yaml
task
:
kmmlu_hard_psychology
lm_eval/tasks/kmmlu/hard/kmmlu_hard_public_safety.yaml
0 → 100644
View file @
90ad5db7
dataset_name
:
public_safety
include
:
_hard_kmmlu_yaml
task
:
kmmlu_hard_public_safety
lm_eval/tasks/kmmlu/hard/kmmlu_hard_railway_and_automotive_engineering.yaml
0 → 100644
View file @
90ad5db7
dataset_name
:
railway_and_automotive_engineering
include
:
_hard_kmmlu_yaml
task
:
kmmlu_hard_railway_and_automotive_engineering
lm_eval/tasks/kmmlu/hard/kmmlu_hard_real_estate.yaml
0 → 100644
View file @
90ad5db7
dataset_name
:
real_estate
include
:
_hard_kmmlu_yaml
task
:
kmmlu_hard_real_estate
lm_eval/tasks/kmmlu/hard/kmmlu_hard_refrigerating_machinery.yaml
0 → 100644
View file @
90ad5db7
dataset_name
:
refrigerating_machinery
include
:
_hard_kmmlu_yaml
task
:
kmmlu_hard_refrigerating_machinery
lm_eval/tasks/kmmlu/hard/kmmlu_hard_social_welfare.yaml
0 → 100644
View file @
90ad5db7
dataset_name
:
social_welfare
include
:
_hard_kmmlu_yaml
task
:
kmmlu_hard_social_welfare
lm_eval/tasks/kmmlu/hard/kmmlu_hard_taxation.yaml
0 → 100644
View file @
90ad5db7
dataset_name
:
taxation
include
:
_hard_kmmlu_yaml
task
:
kmmlu_hard_taxation
lm_eval/tasks/kmmlu/hard/kmmlu_hard_telecommunications_and_wireless_technology.yaml
0 → 100644
View file @
90ad5db7
dataset_name
:
telecommunications_and_wireless_technology
include
:
_hard_kmmlu_yaml
task
:
kmmlu_hard_telecommunications_and_wireless_technology
lm_eval/tasks/kmmlu/kmmlu_accounting.yaml
deleted
100644 → 0
View file @
f692caa9
"
dataset_name"
:
"
Accounting"
"
include"
:
"
_default_kmmlu_yaml"
"
task"
:
"
kmmlu_accounting"
lm_eval/tasks/kmmlu/kmmlu_agricultural_sciences.yaml
deleted
100644 → 0
View file @
f692caa9
"
dataset_name"
:
"
Agricultural-Sciences"
"
include"
:
"
_default_kmmlu_yaml"
"
task"
:
"
kmmlu_agricultural_sciences"
Prev
1
…
11
12
13
14
15
16
17
18
19
…
25
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment