Commit f77a3a27 authored by lintangsutawika
Browse files

Merge branch 'big-refactor' of...

Merge branch 'big-refactor' of https://github.com/EleutherAI/lm-evaluation-harness into mmlu_subgroups
parents 109ed1c7 f8342178
# Generated by utils.py
dataset_name: empirical_judgments_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_empirical_judgments_greedy_until
include: ../generate_until_template_yaml
task: bigbench_empirical_judgments_generate_until
# Generated by utils.py
dataset_name: english_proverbs_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_english_proverbs_greedy_until
include: ../generate_until_template_yaml
task: bigbench_english_proverbs_generate_until
# Generated by utils.py
dataset_name: english_russian_proverbs_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_english_russian_proverbs_greedy_until
include: ../generate_until_template_yaml
task: bigbench_english_russian_proverbs_generate_until
# Generated by utils.py
dataset_name: entailed_polarity_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_entailed_polarity_greedy_until
include: ../generate_until_template_yaml
task: bigbench_entailed_polarity_generate_until
# Generated by utils.py
dataset_name: entailed_polarity_hindi_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_entailed_polarity_hindi_greedy_until
include: ../generate_until_template_yaml
task: bigbench_entailed_polarity_hindi_generate_until
# Generated by utils.py
dataset_name: epistemic_reasoning_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_epistemic_reasoning_greedy_until
include: ../generate_until_template_yaml
task: bigbench_epistemic_reasoning_generate_until
# Generated by utils.py
dataset_name: evaluating_information_essentiality_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_evaluating_information_essentiality_greedy_until
include: ../generate_until_template_yaml
task: bigbench_evaluating_information_essentiality_generate_until
# Generated by utils.py
dataset_name: fact_checker_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_fact_checker_greedy_until
include: ../generate_until_template_yaml
task: bigbench_fact_checker_generate_until
# Generated by utils.py
dataset_name: fantasy_reasoning_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_fantasy_reasoning_greedy_until
include: ../generate_until_template_yaml
task: bigbench_fantasy_reasoning_generate_until
# Generated by utils.py
dataset_name: few_shot_nlg_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_few_shot_nlg_greedy_until
include: ../generate_until_template_yaml
task: bigbench_few_shot_nlg_generate_until
# Generated by utils.py
dataset_name: figure_of_speech_detection_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_figure_of_speech_detection_greedy_until
include: ../generate_until_template_yaml
task: bigbench_figure_of_speech_detection_generate_until
# Generated by utils.py
dataset_name: formal_fallacies_syllogisms_negation_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_formal_fallacies_syllogisms_negation_greedy_until
include: ../generate_until_template_yaml
task: bigbench_formal_fallacies_syllogisms_negation_generate_until
# Generated by utils.py
dataset_name: gem_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_gem_greedy_until
include: ../generate_until_template_yaml
task: bigbench_gem_generate_until
# Generated by utils.py
dataset_name: gender_inclusive_sentences_german_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_gender_inclusive_sentences_german_greedy_until
include: ../generate_until_template_yaml
task: bigbench_gender_inclusive_sentences_german_generate_until
# Generated by utils.py
dataset_name: general_knowledge_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_general_knowledge_greedy_until
include: ../generate_until_template_yaml
task: bigbench_general_knowledge_generate_until
# Generated by utils.py
dataset_name: geometric_shapes_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_geometric_shapes_greedy_until
include: ../generate_until_template_yaml
task: bigbench_geometric_shapes_generate_until
# Generated by utils.py
dataset_name: goal_step_wikihow_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_goal_step_wikihow_greedy_until
include: ../generate_until_template_yaml
task: bigbench_goal_step_wikihow_generate_until
# Generated by utils.py
dataset_name: gre_reading_comprehension_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_gre_reading_comprehension_greedy_until
include: ../generate_until_template_yaml
task: bigbench_gre_reading_comprehension_generate_until
# Generated by utils.py
dataset_name: hhh_alignment_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_hhh_alignment_greedy_until
include: ../generate_until_template_yaml
task: bigbench_hhh_alignment_generate_until
# Generated by utils.py
dataset_name: hindi_question_answering_zero_shot
include: ../greedy_until_template_yaml
task: bigbench_hindi_question_answering_greedy_until
include: ../generate_until_template_yaml
task: bigbench_hindi_question_answering_generate_until
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment