add flan_zeroshot

0d195e90 · lintangsutawika · 3531d9c1 · 0d195e90 · 0d195e90 · 0d195e90
Commit 0d195e90 authored Sep 04, 2023 by lintangsutawika
8 changed files
--- a/lm_eval/tasks/bbh/flan_zeroshot/snarks.yaml
+++ b/lm_eval/tasks/bbh/flan_zeroshot/snarks.yaml
+# Per-task settings for bbh_flan_zeroshot_snarks; includes _template_yaml.
+dataset_name: snarks
+description: "Determine which of two sentences is sarcastic.\n\n"
+doc_to_text: "Q: {{input}}\nA:"
+include: _template_yaml
+task: bbh_flan_zeroshot_snarks
--- a/lm_eval/tasks/bbh/flan_zeroshot/sports_understanding.yaml
+++ b/lm_eval/tasks/bbh/flan_zeroshot/sports_understanding.yaml
+# Per-task settings for bbh_flan_zeroshot_sports_understanding; includes
+# _template_yaml.
+dataset_name: sports_understanding
+description: "Determine whether an artificially constructed sentence relating to sports is plausible or not.\n\n"
+doc_to_text: "Q: {{input}}\nA:"
+include: _template_yaml
+task: bbh_flan_zeroshot_sports_understanding
--- a/lm_eval/tasks/bbh/flan_zeroshot/temporal_sequences.yaml
+++ b/lm_eval/tasks/bbh/flan_zeroshot/temporal_sequences.yaml
+# Per-task settings for bbh_flan_zeroshot_temporal_sequences; includes
+# _template_yaml.
+# NOTE(review): this description begins with "Task description: ", which the
+# sibling task files in this directory do not - confirm it is intentional.
+dataset_name: temporal_sequences
+description: "Task description: Answer questions about which times certain events could have occurred.\n\n"
+doc_to_text: "Q: {{input}}\nA:"
+include: _template_yaml
+task: bbh_flan_zeroshot_temporal_sequences
--- a/lm_eval/tasks/bbh/flan_zeroshot/tracking_shuffled_objects_five_objects.yaml
+++ b/lm_eval/tasks/bbh/flan_zeroshot/tracking_shuffled_objects_five_objects.yaml
+# Per-task settings for bbh_flan_zeroshot_tracking_shuffled_objects_five_objects;
+# includes _template_yaml.
+dataset_name: tracking_shuffled_objects_five_objects
+description: "A task requiring determining the final positions of a set of objects given their initial positions and a description of a sequence of swaps.\n\n"
+doc_to_text: "Q: {{input}}\nA:"
+include: _template_yaml
+task: bbh_flan_zeroshot_tracking_shuffled_objects_five_objects
--- a/lm_eval/tasks/bbh/flan_zeroshot/tracking_shuffled_objects_seven_objects.yaml
+++ b/lm_eval/tasks/bbh/flan_zeroshot/tracking_shuffled_objects_seven_objects.yaml
+# Per-task settings for bbh_flan_zeroshot_tracking_shuffled_objects_seven_objects;
+# includes _template_yaml.
+dataset_name: tracking_shuffled_objects_seven_objects
+description: "A task requiring determining the final positions of a set of objects given their initial positions and a description of a sequence of swaps.\n\n"
+doc_to_text: "Q: {{input}}\nA:"
+include: _template_yaml
+task: bbh_flan_zeroshot_tracking_shuffled_objects_seven_objects
--- a/lm_eval/tasks/bbh/flan_zeroshot/tracking_shuffled_objects_three_objects.yaml
+++ b/lm_eval/tasks/bbh/flan_zeroshot/tracking_shuffled_objects_three_objects.yaml
+# Per-task settings for bbh_flan_zeroshot_tracking_shuffled_objects_three_objects;
+# includes _template_yaml.
+dataset_name: tracking_shuffled_objects_three_objects
+description: "A task requiring determining the final positions of a set of objects given their initial positions and a description of a sequence of swaps.\n\n"
+doc_to_text: "Q: {{input}}\nA:"
+include: _template_yaml
+task: bbh_flan_zeroshot_tracking_shuffled_objects_three_objects
--- a/lm_eval/tasks/bbh/flan_zeroshot/web_of_lies.yaml
+++ b/lm_eval/tasks/bbh/flan_zeroshot/web_of_lies.yaml
+# Per-task settings for bbh_flan_zeroshot_web_of_lies; includes _template_yaml.
+dataset_name: web_of_lies
+description: "Evaluate a random boolean function expressed as a word problem.\n\n"
+doc_to_text: "Q: {{input}}\nA:"
+include: _template_yaml
+task: bbh_flan_zeroshot_web_of_lies
--- a/lm_eval/tasks/bbh/flan_zeroshot/word_sorting.yaml
+++ b/lm_eval/tasks/bbh/flan_zeroshot/word_sorting.yaml
+# Per-task settings for bbh_flan_zeroshot_word_sorting; includes _template_yaml.
+dataset_name: word_sorting
+description: "Sort a list of words.\n\n"
+doc_to_text: "Q: {{input}}\nA:"
+include: _template_yaml
+task: bbh_flan_zeroshot_word_sorting