Commit f77a3a27 authored by lintangsutawika
Browse files

Merge branch 'big-refactor' of...

Merge branch 'big-refactor' of https://github.com/EleutherAI/lm-evaluation-harness into mmlu_subgroups
parents 109ed1c7 f8342178
# Generated by utils.py
dataset_name: presuppositions_as_nli_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_presuppositions_as_nli_greedy_until
include: ../generate_until_template_yaml
task: bigbench_presuppositions_as_nli_generate_until
# Generated by utils.py
dataset_name: qa_wikidata_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_qa_wikidata_greedy_until
include: ../generate_until_template_yaml
task: bigbench_qa_wikidata_generate_until
# Generated by utils.py
dataset_name: question_selection_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_question_selection_greedy_until
include: ../generate_until_template_yaml
task: bigbench_question_selection_generate_until
# Generated by utils.py
dataset_name: real_or_fake_text_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_real_or_fake_text_greedy_until
include: ../generate_until_template_yaml
task: bigbench_real_or_fake_text_generate_until
# Generated by utils.py
dataset_name: reasoning_about_colored_objects_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_reasoning_about_colored_objects_greedy_until
include: ../generate_until_template_yaml
task: bigbench_reasoning_about_colored_objects_generate_until
# Generated by utils.py
dataset_name: repeat_copy_logic_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_repeat_copy_logic_greedy_until
include: ../generate_until_template_yaml
task: bigbench_repeat_copy_logic_generate_until
# Generated by utils.py
dataset_name: rephrase_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_rephrase_greedy_until
include: ../generate_until_template_yaml
task: bigbench_rephrase_generate_until
# Generated by utils.py
dataset_name: riddle_sense_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_riddle_sense_greedy_until
include: ../generate_until_template_yaml
task: bigbench_riddle_sense_generate_until
# Generated by utils.py
dataset_name: ruin_names_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_ruin_names_greedy_until
include: ../generate_until_template_yaml
task: bigbench_ruin_names_generate_until
# Generated by utils.py
dataset_name: salient_translation_error_detection_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_salient_translation_error_detection_greedy_until
include: ../generate_until_template_yaml
task: bigbench_salient_translation_error_detection_generate_until
# Generated by utils.py
dataset_name: scientific_press_release_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_scientific_press_release_greedy_until
include: ../generate_until_template_yaml
task: bigbench_scientific_press_release_generate_until
# Generated by utils.py
dataset_name: semantic_parsing_in_context_sparc_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_semantic_parsing_in_context_sparc_greedy_until
include: ../generate_until_template_yaml
task: bigbench_semantic_parsing_in_context_sparc_generate_until
# Generated by utils.py
dataset_name: semantic_parsing_spider_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_semantic_parsing_spider_greedy_until
include: ../generate_until_template_yaml
task: bigbench_semantic_parsing_spider_generate_until
# Generated by utils.py
dataset_name: sentence_ambiguity_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_sentence_ambiguity_greedy_until
include: ../generate_until_template_yaml
task: bigbench_sentence_ambiguity_generate_until
# Generated by utils.py
dataset_name: similarities_abstraction_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_similarities_abstraction_greedy_until
include: ../generate_until_template_yaml
task: bigbench_similarities_abstraction_generate_until
# Generated by utils.py
dataset_name: simp_turing_concept_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_simp_turing_concept_greedy_until
include: ../generate_until_template_yaml
task: bigbench_simp_turing_concept_generate_until
# Generated by utils.py
dataset_name: simple_arithmetic_json_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_simple_arithmetic_json_greedy_until
include: ../generate_until_template_yaml
task: bigbench_simple_arithmetic_json_generate_until
# Generated by utils.py
dataset_name: simple_arithmetic_json_multiple_choice_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_simple_arithmetic_json_multiple_choice_greedy_until
include: ../generate_until_template_yaml
task: bigbench_simple_arithmetic_json_multiple_choice_generate_until
# Generated by utils.py
dataset_name: simple_arithmetic_json_subtasks_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_simple_arithmetic_json_subtasks_greedy_until
include: ../generate_until_template_yaml
task: bigbench_simple_arithmetic_json_subtasks_generate_until
# Generated by utils.py
dataset_name: simple_arithmetic_multiple_targets_json_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_simple_arithmetic_multiple_targets_json_greedy_until
include: ../generate_until_template_yaml
task: bigbench_simple_arithmetic_multiple_targets_json_generate_until
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment