Commit 5a4fc8fb authored by lintangsutawika
Browse files

Merge branch 'big-refactor' of...

Merge branch 'big-refactor' of https://github.com/EleutherAI/lm-evaluation-harness into port_master_squadv2
parents 51753750 e35b0667
"dataset_name": "us_foreign_policy"
"description": "The following are multiple choice questions (with answers) about us\
\ foreign policy.\n\n"
"group": "mmlu_flan_n_shot_generative_social_sciences"
"group": "mmlu_flan_n_shot_loglikelihood_social_sciences"
"include": "_mmlu_flan_loglikelihood_template_yaml"
"task": "mmlu_flan_n_shot_generative_us_foreign_policy"
"task": "mmlu_flan_n_shot_loglikelihood_us_foreign_policy"
"dataset_name": "virology"
"description": "The following are multiple choice questions (with answers) about virology.\n\
\n"
"group": "mmlu_flan_n_shot_generative_other"
"group": "mmlu_flan_n_shot_loglikelihood_other"
"include": "_mmlu_flan_loglikelihood_template_yaml"
"task": "mmlu_flan_n_shot_generative_virology"
"task": "mmlu_flan_n_shot_loglikelihood_virology"
"dataset_name": "world_religions"
"description": "The following are multiple choice questions (with answers) about world\
\ religions.\n\n"
"group": "mmlu_flan_n_shot_generative_humanities"
"group": "mmlu_flan_n_shot_loglikelihood_humanities"
"include": "_mmlu_flan_loglikelihood_template_yaml"
"task": "mmlu_flan_n_shot_generative_world_religions"
"task": "mmlu_flan_n_shot_loglikelihood_world_religions"
......@@ -305,6 +305,10 @@ def make_table(result_dict, column: str = "results"):
for k, dic in result_dict[column].items():
version = result_dict["versions"][k]
if "alias" in dic:
k = dic.pop("alias")
for (mf), v in dic.items():
m, _, f = mf.partition(",")
if m.endswith("_stderr"):
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment