Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
lm-evaluation-harness
Commits
4288b53e
Commit
4288b53e
authored
Jan 29, 2025
by
Baber
Browse files
Merge branch 'main' into llama
parents
37eb9c9d
94344a61
Changes
201
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
45 additions
and
56 deletions
+45
-56
lm_eval/tasks/global_mmlu/default/global_mmlu_bn.yaml
lm_eval/tasks/global_mmlu/default/global_mmlu_bn.yaml
+0
-4
lm_eval/tasks/global_mmlu/default/global_mmlu_de.yaml
lm_eval/tasks/global_mmlu/default/global_mmlu_de.yaml
+0
-4
lm_eval/tasks/global_mmlu/default/global_mmlu_en.yaml
lm_eval/tasks/global_mmlu/default/global_mmlu_en.yaml
+0
-4
lm_eval/tasks/global_mmlu/default/global_mmlu_es.yaml
lm_eval/tasks/global_mmlu/default/global_mmlu_es.yaml
+0
-4
lm_eval/tasks/global_mmlu/default/global_mmlu_fr.yaml
lm_eval/tasks/global_mmlu/default/global_mmlu_fr.yaml
+0
-4
lm_eval/tasks/global_mmlu/default/global_mmlu_hi.yaml
lm_eval/tasks/global_mmlu/default/global_mmlu_hi.yaml
+0
-4
lm_eval/tasks/global_mmlu/default/global_mmlu_id.yaml
lm_eval/tasks/global_mmlu/default/global_mmlu_id.yaml
+0
-4
lm_eval/tasks/global_mmlu/default/global_mmlu_it.yaml
lm_eval/tasks/global_mmlu/default/global_mmlu_it.yaml
+0
-4
lm_eval/tasks/global_mmlu/default/global_mmlu_ja.yaml
lm_eval/tasks/global_mmlu/default/global_mmlu_ja.yaml
+0
-4
lm_eval/tasks/global_mmlu/default/global_mmlu_ko.yaml
lm_eval/tasks/global_mmlu/default/global_mmlu_ko.yaml
+0
-4
lm_eval/tasks/global_mmlu/default/global_mmlu_pt.yaml
lm_eval/tasks/global_mmlu/default/global_mmlu_pt.yaml
+0
-4
lm_eval/tasks/global_mmlu/default/global_mmlu_sw.yaml
lm_eval/tasks/global_mmlu/default/global_mmlu_sw.yaml
+0
-4
lm_eval/tasks/global_mmlu/default/global_mmlu_yo.yaml
lm_eval/tasks/global_mmlu/default/global_mmlu_yo.yaml
+0
-4
lm_eval/tasks/global_mmlu/default/global_mmlu_zh.yaml
lm_eval/tasks/global_mmlu/default/global_mmlu_zh.yaml
+0
-4
lm_eval/tasks/global_mmlu/default/hi/_global_mmlu_hi.yaml
lm_eval/tasks/global_mmlu/default/hi/_global_mmlu_hi.yaml
+13
-0
lm_eval/tasks/global_mmlu/default/hi/_hi_template_yaml
lm_eval/tasks/global_mmlu/default/hi/_hi_template_yaml
+16
-0
lm_eval/tasks/global_mmlu/default/hi/global_mmlu_hi_business.yaml
...tasks/global_mmlu/default/hi/global_mmlu_hi_business.yaml
+4
-0
lm_eval/tasks/global_mmlu/default/hi/global_mmlu_hi_humanities.yaml
...sks/global_mmlu/default/hi/global_mmlu_hi_humanities.yaml
+4
-0
lm_eval/tasks/global_mmlu/default/hi/global_mmlu_hi_medical.yaml
.../tasks/global_mmlu/default/hi/global_mmlu_hi_medical.yaml
+4
-0
lm_eval/tasks/global_mmlu/default/hi/global_mmlu_hi_other.yaml
...al/tasks/global_mmlu/default/hi/global_mmlu_hi_other.yaml
+4
-0
No files found.
lm_eval/tasks/global_mmlu/default/global_mmlu_bn.yaml
deleted
100644 → 0
View file @
37eb9c9d
# Generated by _generate_configs.py
dataset_name: bn
include: _default_yaml
task: global_mmlu_bn
lm_eval/tasks/global_mmlu/default/global_mmlu_de.yaml
deleted
100644 → 0
View file @
37eb9c9d
# Generated by _generate_configs.py
dataset_name: de
include: _default_yaml
task: global_mmlu_de
lm_eval/tasks/global_mmlu/default/global_mmlu_en.yaml
deleted
100644 → 0
View file @
37eb9c9d
# Generated by _generate_configs.py
dataset_name: en
include: _default_yaml
task: global_mmlu_en
lm_eval/tasks/global_mmlu/default/global_mmlu_es.yaml
deleted
100644 → 0
View file @
37eb9c9d
# Generated by _generate_configs.py
dataset_name: es
include: _default_yaml
task: global_mmlu_es
lm_eval/tasks/global_mmlu/default/global_mmlu_fr.yaml
deleted
100644 → 0
View file @
37eb9c9d
# Generated by _generate_configs.py
dataset_name: fr
include: _default_yaml
task: global_mmlu_fr
lm_eval/tasks/global_mmlu/default/global_mmlu_hi.yaml
deleted
100644 → 0
View file @
37eb9c9d
# Generated by _generate_configs.py
dataset_name: hi
include: _default_yaml
task: global_mmlu_hi
lm_eval/tasks/global_mmlu/default/global_mmlu_id.yaml
deleted
100644 → 0
View file @
37eb9c9d
# Generated by _generate_configs.py
dataset_name: id
include: _default_yaml
task: global_mmlu_id
lm_eval/tasks/global_mmlu/default/global_mmlu_it.yaml
deleted
100644 → 0
View file @
37eb9c9d
# Generated by _generate_configs.py
dataset_name: it
include: _default_yaml
task: global_mmlu_it
lm_eval/tasks/global_mmlu/default/global_mmlu_ja.yaml
deleted
100644 → 0
View file @
37eb9c9d
# Generated by _generate_configs.py
dataset_name: ja
include: _default_yaml
task: global_mmlu_ja
lm_eval/tasks/global_mmlu/default/global_mmlu_ko.yaml
deleted
100644 → 0
View file @
37eb9c9d
# Generated by _generate_configs.py
dataset_name: ko
include: _default_yaml
task: global_mmlu_ko
lm_eval/tasks/global_mmlu/default/global_mmlu_pt.yaml
deleted
100644 → 0
View file @
37eb9c9d
# Generated by _generate_configs.py
dataset_name: pt
include: _default_yaml
task: global_mmlu_pt
lm_eval/tasks/global_mmlu/default/global_mmlu_sw.yaml
deleted
100644 → 0
View file @
37eb9c9d
# Generated by _generate_configs.py
dataset_name: sw
include: _default_yaml
task: global_mmlu_sw
lm_eval/tasks/global_mmlu/default/global_mmlu_yo.yaml
deleted
100644 → 0
View file @
37eb9c9d
# Generated by _generate_configs.py
dataset_name: yo
include: _default_yaml
task: global_mmlu_yo
lm_eval/tasks/global_mmlu/default/global_mmlu_zh.yaml
deleted
100644 → 0
View file @
37eb9c9d
# Generated by _generate_configs.py
dataset_name: zh
include: _default_yaml
task: global_mmlu_zh
lm_eval/tasks/global_mmlu/default/hi/_global_mmlu_hi.yaml
0 → 100644
View file @
4288b53e
group: global_mmlu_hi
task:
  - global_mmlu_hi_business
  - global_mmlu_hi_humanities
  - global_mmlu_hi_medical
  - global_mmlu_hi_other
  - global_mmlu_hi_stem
  - global_mmlu_hi_social_sciences
aggregate_metric_list:
  - metric: acc
    weight_by_size: True
metadata:
  version: 0.0
lm_eval/tasks/global_mmlu/default/hi/_hi_template_yaml
0 → 100644
View file @
4288b53e
# Shared base config for the Hindi (hi) Global-MMLU-Lite tasks; the
# per-category global_mmlu_hi_*.yaml configs pull it in via `include`.
dataset_path: CohereForAI/Global-MMLU-Lite
dataset_name: hi
test_split: test
fewshot_split: dev
fewshot_config:
  # Must be nested: at column 0 `sampler` would be a top-level key and
  # `fewshot_config` would parse as null.
  sampler: default
output_type: multiple_choice
# Prompt layout: the stripped question, four lettered options, then "Answer:".
doc_to_text: "{{question.strip()}}\nA. {{option_a}}\nB. {{option_b}}\nC. {{option_c}}\nD. {{option_d}}\nAnswer:"
doc_to_choice: ["A", "B", "C", "D"]
# NOTE(review): presumably the dataset's `answer` column - confirm.
doc_to_target: answer
metric_list:
  # `aggregation` and `higher_is_better` belong to the same list item as
  # `metric`, so they are indented to align with it.
  - metric: acc
    aggregation: mean
    higher_is_better: true
metadata:
  version: 0.0
lm_eval/tasks/global_mmlu/default/hi/global_mmlu_hi_business.yaml
0 → 100644
View file @
4288b53e
# Generated by _generate_configs.py
include: _hi_template_yaml
process_docs: !function utils.process_business
task: global_mmlu_hi_business
lm_eval/tasks/global_mmlu/default/hi/global_mmlu_hi_humanities.yaml
0 → 100644
View file @
4288b53e
# Generated by _generate_configs.py
include: _hi_template_yaml
process_docs: !function utils.process_humanities
task: global_mmlu_hi_humanities
lm_eval/tasks/global_mmlu/default/hi/global_mmlu_hi_medical.yaml
0 → 100644
View file @
4288b53e
# Generated by _generate_configs.py
include: _hi_template_yaml
process_docs: !function utils.process_medical
task: global_mmlu_hi_medical
lm_eval/tasks/global_mmlu/default/hi/global_mmlu_hi_other.yaml
0 → 100644
View file @
4288b53e
# Generated by _generate_configs.py
include: _hi_template_yaml
process_docs: !function utils.process_other
task: global_mmlu_hi_other
Prev
1
2
3
4
5
6
7
8
…
11
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment