"src/vscode:/vscode.git/clone" did not exist on "771ac86163001a158c3e50ecc5c96186f34f4876"
Unverified Commit 6769119f authored by Hailey Schoelkopf's avatar Hailey Schoelkopf Committed by GitHub
Browse files

Merge pull request #816 from EleutherAI/flan-benchmark

[Refactor] Flan benchmark
parents 4824a832 7d5e511c
"dataset_name": "medical_genetics"
"description": "The following are multiple choice questions (with answers) about medical genetics.\n\n"
"include": "_mmlu_flan_loglikelihood_template_yaml"
"task": "mmlu_flan_n_shot_loglikelihood_medical_genetics"
"dataset_name": "miscellaneous"
"description": "The following are multiple choice questions (with answers) about miscellaneous.\n\n"
"include": "_mmlu_flan_loglikelihood_template_yaml"
"task": "mmlu_flan_n_shot_loglikelihood_miscellaneous"
"dataset_name": "moral_disputes"
"description": "The following are multiple choice questions (with answers) about moral disputes.\n\n"
"include": "_mmlu_flan_loglikelihood_template_yaml"
"task": "mmlu_flan_n_shot_loglikelihood_moral_disputes"
"dataset_name": "moral_scenarios"
"description": "The following are multiple choice questions (with answers) about moral scenarios.\n\n"
"include": "_mmlu_flan_loglikelihood_template_yaml"
"task": "mmlu_flan_n_shot_loglikelihood_moral_scenarios"
"dataset_name": "nutrition"
"description": "The following are multiple choice questions (with answers) about nutrition.\n\n"
"include": "_mmlu_flan_loglikelihood_template_yaml"
"task": "mmlu_flan_n_shot_loglikelihood_nutrition"
"dataset_name": "philosophy"
"description": "The following are multiple choice questions (with answers) about philosophy.\n\n"
"include": "_mmlu_flan_loglikelihood_template_yaml"
"task": "mmlu_flan_n_shot_loglikelihood_philosophy"
"dataset_name": "prehistory"
"description": "The following are multiple choice questions (with answers) about prehistory.\n\n"
"include": "_mmlu_flan_loglikelihood_template_yaml"
"task": "mmlu_flan_n_shot_loglikelihood_prehistory"
"dataset_name": "professional_accounting"
"description": "The following are multiple choice questions (with answers) about professional accounting.\n\n"
"include": "_mmlu_flan_loglikelihood_template_yaml"
"task": "mmlu_flan_n_shot_loglikelihood_professional_accounting"
"dataset_name": "professional_law"
"description": "The following are multiple choice questions (with answers) about professional law.\n\n"
"include": "_mmlu_flan_loglikelihood_template_yaml"
"task": "mmlu_flan_n_shot_loglikelihood_professional_law"
"dataset_name": "professional_medicine"
"description": "The following are multiple choice questions (with answers) about professional medicine.\n\n"
"include": "_mmlu_flan_loglikelihood_template_yaml"
"task": "mmlu_flan_n_shot_loglikelihood_professional_medicine"
"dataset_name": "professional_psychology"
"description": "The following are multiple choice questions (with answers) about professional psychology.\n\n"
"include": "_mmlu_flan_loglikelihood_template_yaml"
"task": "mmlu_flan_n_shot_loglikelihood_professional_psychology"
"dataset_name": "public_relations"
"description": "The following are multiple choice questions (with answers) about public relations.\n\n"
"include": "_mmlu_flan_loglikelihood_template_yaml"
"task": "mmlu_flan_n_shot_loglikelihood_public_relations"
"dataset_name": "security_studies"
"description": "The following are multiple choice questions (with answers) about security studies.\n\n"
"include": "_mmlu_flan_loglikelihood_template_yaml"
"task": "mmlu_flan_n_shot_loglikelihood_security_studies"
"dataset_name": "sociology"
"description": "The following are multiple choice questions (with answers) about sociology.\n\n"
"include": "_mmlu_flan_loglikelihood_template_yaml"
"task": "mmlu_flan_n_shot_loglikelihood_sociology"
"dataset_name": "us_foreign_policy"
"description": "The following are multiple choice questions (with answers) about us foreign policy.\n\n"
"include": "_mmlu_flan_loglikelihood_template_yaml"
"task": "mmlu_flan_n_shot_loglikelihood_us_foreign_policy"
"dataset_name": "virology"
"description": "The following are multiple choice questions (with answers) about virology.\n\n"
"include": "_mmlu_flan_loglikelihood_template_yaml"
"task": "mmlu_flan_n_shot_loglikelihood_virology"
"dataset_name": "world_religions"
"description": "The following are multiple choice questions (with answers) about world religions.\n\n"
"include": "_mmlu_flan_loglikelihood_template_yaml"
"task": "mmlu_flan_n_shot_loglikelihood_world_religions"
...@@ -9,6 +9,9 @@ output_type: greedy_until ...@@ -9,6 +9,9 @@ output_type: greedy_until
doc_to_text: "boolq passage: {{passage}} question: {{question}}" doc_to_text: "boolq passage: {{passage}} question: {{question}}"
doc_to_target: label doc_to_target: label
doc_to_choice: ['False', 'True'] doc_to_choice: ['False', 'True']
generation_kwargs:
until:
- "</s>"
metric_list: metric_list:
- metric: exact_match - metric: exact_match
aggregation: mean aggregation: mean
......
...@@ -9,6 +9,9 @@ output_type: greedy_until ...@@ -9,6 +9,9 @@ output_type: greedy_until
doc_to_text: "cb hypothesis: {{hypothesis}} premise: {{premise}}" doc_to_text: "cb hypothesis: {{hypothesis}} premise: {{premise}}"
doc_to_target: label doc_to_target: label
doc_to_choice: ['entailment', 'contradiction', 'neutral'] doc_to_choice: ['entailment', 'contradiction', 'neutral']
generation_kwargs:
until:
- "</s>"
metric_list: metric_list:
- metric: exact_match - metric: exact_match
aggregation: mean aggregation: mean
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment