Commit f77a3a27 authored by lintangsutawika's avatar lintangsutawika
Browse files

Merge branch 'big-refactor' of...

Merge branch 'big-refactor' of https://github.com/EleutherAI/lm-evaluation-harness into mmlu_subgroups
parents 109ed1c7 f8342178
# Generated by utils.py
dataset_name: codenames_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_codenames_greedy_until
include: ../generate_until_template_yaml
task: bigbench_codenames_generate_until
# Generated by utils.py
dataset_name: color_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_color_greedy_until
include: ../generate_until_template_yaml
task: bigbench_color_generate_until
# Generated by utils.py
dataset_name: common_morpheme_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_common_morpheme_greedy_until
include: ../generate_until_template_yaml
task: bigbench_common_morpheme_generate_until
# Generated by utils.py
dataset_name: conceptual_combinations_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_conceptual_combinations_greedy_until
include: ../generate_until_template_yaml
task: bigbench_conceptual_combinations_generate_until
# Generated by utils.py
dataset_name: conlang_translation_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_conlang_translation_greedy_until
include: ../generate_until_template_yaml
task: bigbench_conlang_translation_generate_until
# Generated by utils.py
dataset_name: contextual_parametric_knowledge_conflicts_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_contextual_parametric_knowledge_conflicts_greedy_until
include: ../generate_until_template_yaml
task: bigbench_contextual_parametric_knowledge_conflicts_generate_until
# Generated by utils.py
dataset_name: crash_blossom_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_crash_blossom_greedy_until
include: ../generate_until_template_yaml
task: bigbench_crash_blossom_generate_until
# Generated by utils.py
dataset_name: crass_ai_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_crass_ai_greedy_until
include: ../generate_until_template_yaml
task: bigbench_crass_ai_generate_until
# Generated by utils.py
dataset_name: cryobiology_spanish_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_cryobiology_spanish_greedy_until
include: ../generate_until_template_yaml
task: bigbench_cryobiology_spanish_generate_until
# Generated by utils.py
dataset_name: cryptonite_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_cryptonite_greedy_until
include: ../generate_until_template_yaml
task: bigbench_cryptonite_generate_until
# Generated by utils.py
dataset_name: cs_algorithms_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_cs_algorithms_greedy_until
include: ../generate_until_template_yaml
task: bigbench_cs_algorithms_generate_until
# Generated by utils.py
dataset_name: dark_humor_detection_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_dark_humor_detection_greedy_until
include: ../generate_until_template_yaml
task: bigbench_dark_humor_detection_generate_until
# Generated by utils.py
dataset_name: date_understanding_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_date_understanding_greedy_until
include: ../generate_until_template_yaml
task: bigbench_date_understanding_generate_until
# Generated by utils.py
dataset_name: disambiguation_qa_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_disambiguation_qa_greedy_until
include: ../generate_until_template_yaml
task: bigbench_disambiguation_qa_generate_until
# Generated by utils.py
dataset_name: discourse_marker_prediction_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_discourse_marker_prediction_greedy_until
include: ../generate_until_template_yaml
task: bigbench_discourse_marker_prediction_generate_until
# Generated by utils.py
dataset_name: disfl_qa_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_disfl_qa_greedy_until
include: ../generate_until_template_yaml
task: bigbench_disfl_qa_generate_until
# Generated by utils.py
dataset_name: dyck_languages_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_dyck_languages_greedy_until
include: ../generate_until_template_yaml
task: bigbench_dyck_languages_generate_until
# Generated by utils.py
dataset_name: elementary_math_qa_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_elementary_math_qa_greedy_until
include: ../generate_until_template_yaml
task: bigbench_elementary_math_qa_generate_until
# Generated by utils.py
dataset_name: emoji_movie_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_emoji_movie_greedy_until
include: ../generate_until_template_yaml
task: bigbench_emoji_movie_generate_until
# Generated by utils.py
dataset_name: emojis_emotion_prediction_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_emojis_emotion_prediction_greedy_until
include: ../generate_until_template_yaml
task: bigbench_emojis_emotion_prediction_generate_until
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment