add bigbench

605787a9 · lintangsutawika · b8d1cef9 · 605787a9 · 605787a9 · 605787a9
Commit 605787a9 authored Sep 13, 2023 by lintangsutawika
18 changed files
--- a/lm_eval/tasks/bigbench/multiple_choice/symbol_interpretation.yaml
+++ b/lm_eval/tasks/bigbench/multiple_choice/symbol_interpretation.yaml
+# Generated by utils.py
+dataset_name: symbol_interpretation
+include: ../multiple_choice_template_yaml
+task: bigbench_symbol_interpretation_multiple_choice
--- a/lm_eval/tasks/bigbench/multiple_choice/temporal_sequences.yaml
+++ b/lm_eval/tasks/bigbench/multiple_choice/temporal_sequences.yaml
+# Generated by utils.py
+dataset_name: temporal_sequences
+include: ../multiple_choice_template_yaml
+task: bigbench_temporal_sequences_multiple_choice
--- a/lm_eval/tasks/bigbench/multiple_choice/tense.yaml
+++ b/lm_eval/tasks/bigbench/multiple_choice/tense.yaml
+# Generated by utils.py
+dataset_name: tense
+include: ../multiple_choice_template_yaml
+task: bigbench_tense_multiple_choice
--- a/lm_eval/tasks/bigbench/multiple_choice/timedial.yaml
+++ b/lm_eval/tasks/bigbench/multiple_choice/timedial.yaml
+# Generated by utils.py
+dataset_name: timedial
+include: ../multiple_choice_template_yaml
+task: bigbench_timedial_multiple_choice
--- a/lm_eval/tasks/bigbench/multiple_choice/topical_chat.yaml
+++ b/lm_eval/tasks/bigbench/multiple_choice/topical_chat.yaml
+# Generated by utils.py
+dataset_name: topical_chat
+include: ../multiple_choice_template_yaml
+task: bigbench_topical_chat_multiple_choice
--- a/lm_eval/tasks/bigbench/multiple_choice/tracking_shuffled_objects.yaml
+++ b/lm_eval/tasks/bigbench/multiple_choice/tracking_shuffled_objects.yaml
+# Generated by utils.py
+dataset_name: tracking_shuffled_objects
+include: ../multiple_choice_template_yaml
+task: bigbench_tracking_shuffled_objects_multiple_choice
--- a/lm_eval/tasks/bigbench/multiple_choice/understanding_fables.yaml
+++ b/lm_eval/tasks/bigbench/multiple_choice/understanding_fables.yaml
+# Generated by utils.py
+dataset_name: understanding_fables
+include: ../multiple_choice_template_yaml
+task: bigbench_understanding_fables_multiple_choice
--- a/lm_eval/tasks/bigbench/multiple_choice/undo_permutation.yaml
+++ b/lm_eval/tasks/bigbench/multiple_choice/undo_permutation.yaml
+# Generated by utils.py
+dataset_name: undo_permutation
+include: ../multiple_choice_template_yaml
+task: bigbench_undo_permutation_multiple_choice
--- a/lm_eval/tasks/bigbench/multiple_choice/unit_conversion.yaml
+++ b/lm_eval/tasks/bigbench/multiple_choice/unit_conversion.yaml
+# Generated by utils.py
+dataset_name: unit_conversion
+include: ../multiple_choice_template_yaml
+task: bigbench_unit_conversion_multiple_choice
--- a/lm_eval/tasks/bigbench/multiple_choice/unit_interpretation.yaml
+++ b/lm_eval/tasks/bigbench/multiple_choice/unit_interpretation.yaml
+# Generated by utils.py
+dataset_name: unit_interpretation
+include: ../multiple_choice_template_yaml
+task: bigbench_unit_interpretation_multiple_choice
--- a/lm_eval/tasks/bigbench/multiple_choice/unnatural_in_context_learning.yaml
+++ b/lm_eval/tasks/bigbench/multiple_choice/unnatural_in_context_learning.yaml
+# Generated by utils.py
+dataset_name: unnatural_in_context_learning
+include: ../multiple_choice_template_yaml
+task: bigbench_unnatural_in_context_learning_multiple_choice
--- a/lm_eval/tasks/bigbench/multiple_choice/vitaminc_fact_verification.yaml
+++ b/lm_eval/tasks/bigbench/multiple_choice/vitaminc_fact_verification.yaml
+# Generated by utils.py
+dataset_name: vitaminc_fact_verification
+include: ../multiple_choice_template_yaml
+task: bigbench_vitaminc_fact_verification_multiple_choice
--- a/lm_eval/tasks/bigbench/multiple_choice/what_is_the_tao.yaml
+++ b/lm_eval/tasks/bigbench/multiple_choice/what_is_the_tao.yaml
+# Generated by utils.py
+dataset_name: what_is_the_tao
+include: ../multiple_choice_template_yaml
+task: bigbench_what_is_the_tao_multiple_choice
--- a/lm_eval/tasks/bigbench/multiple_choice/which_wiki_edit.yaml
+++ b/lm_eval/tasks/bigbench/multiple_choice/which_wiki_edit.yaml
+# Generated by utils.py
+dataset_name: which_wiki_edit
+include: ../multiple_choice_template_yaml
+task: bigbench_which_wiki_edit_multiple_choice
--- a/lm_eval/tasks/bigbench/multiple_choice/winowhy.yaml
+++ b/lm_eval/tasks/bigbench/multiple_choice/winowhy.yaml
+# Generated by utils.py
+dataset_name: winowhy
+include: ../multiple_choice_template_yaml
+task: bigbench_winowhy_multiple_choice
--- a/lm_eval/tasks/bigbench/multiple_choice/word_sorting.yaml
+++ b/lm_eval/tasks/bigbench/multiple_choice/word_sorting.yaml
+# Generated by utils.py
+dataset_name: word_sorting
+include: ../multiple_choice_template_yaml
+task: bigbench_word_sorting_multiple_choice
--- a/lm_eval/tasks/bigbench/multiple_choice/word_unscrambling.yaml
+++ b/lm_eval/tasks/bigbench/multiple_choice/word_unscrambling.yaml
+# Generated by utils.py
+dataset_name: word_unscrambling
+include: ../multiple_choice_template_yaml
+task: bigbench_word_unscrambling_multiple_choice
--- a/lm_eval/tasks/bigbench/multiple_choice_template_yaml
+++ b/lm_eval/tasks/bigbench/multiple_choice_template_yaml
+group: bigbench  # group name shared by the per-task files that `include` this template
+dataset_path: bigbench  # per-task files set `dataset_name` alongside this path
+output_type: multiple_choice
+training_split: train
+validation_split: validation  # NOTE(review): no `test_split` is set in this template; confirm which split the harness scores
+doc_to_text: inputs  # prompt is taken from `inputs`; presumably a dataset column name, confirm against the dataset schema
+doc_to_target: "{{multiple_choice_targets.index(targets[0])}}"  # index of `targets[0]` within `multiple_choice_targets`; NOTE(review): confirm `targets[0]` is always among the choices, otherwise `.index` cannot resolve
+doc_to_choice: "{{multiple_choice_targets}}"  # answer options come from the `multiple_choice_targets` list
+metric_list:
+  - metric: acc  # only the `acc` metric is requested here