Commit f77a3a27 authored by lintangsutawika's avatar lintangsutawika
Browse files

Merge branch 'big-refactor' of...

Merge branch 'big-refactor' of https://github.com/EleutherAI/lm-evaluation-harness into mmlu_subgroups
parents 109ed1c7 f8342178
# Generated by utils.py # Generated by utils.py
dataset_name: linguistics_puzzles_zero_shot dataset_name: linguistics_puzzles_zero_shot
include: ../greedy_until_template_yaml include: ../generate_until_template_yaml
task: bigbench_linguistics_puzzles_greedy_until task: bigbench_linguistics_puzzles_generate_until
# Generated by utils.py # Generated by utils.py
dataset_name: list_functions_zero_shot dataset_name: list_functions_zero_shot
include: ../greedy_until_template_yaml include: ../generate_until_template_yaml
task: bigbench_list_functions_greedy_until task: bigbench_list_functions_generate_until
# Generated by utils.py # Generated by utils.py
dataset_name: logic_grid_puzzle_zero_shot dataset_name: logic_grid_puzzle_zero_shot
include: ../greedy_until_template_yaml include: ../generate_until_template_yaml
task: bigbench_logic_grid_puzzle_greedy_until task: bigbench_logic_grid_puzzle_generate_until
# Generated by utils.py # Generated by utils.py
dataset_name: logical_args_zero_shot dataset_name: logical_args_zero_shot
include: ../greedy_until_template_yaml include: ../generate_until_template_yaml
task: bigbench_logical_args_greedy_until task: bigbench_logical_args_generate_until
# Generated by utils.py # Generated by utils.py
dataset_name: logical_deduction_zero_shot dataset_name: logical_deduction_zero_shot
include: ../greedy_until_template_yaml include: ../generate_until_template_yaml
task: bigbench_logical_deduction_greedy_until task: bigbench_logical_deduction_generate_until
# Generated by utils.py # Generated by utils.py
dataset_name: logical_fallacy_detection_zero_shot dataset_name: logical_fallacy_detection_zero_shot
include: ../greedy_until_template_yaml include: ../generate_until_template_yaml
task: bigbench_logical_fallacy_detection_greedy_until task: bigbench_logical_fallacy_detection_generate_until
# Generated by utils.py # Generated by utils.py
dataset_name: logical_sequence_zero_shot dataset_name: logical_sequence_zero_shot
include: ../greedy_until_template_yaml include: ../generate_until_template_yaml
task: bigbench_logical_sequence_greedy_until task: bigbench_logical_sequence_generate_until
# Generated by utils.py # Generated by utils.py
dataset_name: mathematical_induction_zero_shot dataset_name: mathematical_induction_zero_shot
include: ../greedy_until_template_yaml include: ../generate_until_template_yaml
task: bigbench_mathematical_induction_greedy_until task: bigbench_mathematical_induction_generate_until
# Generated by utils.py # Generated by utils.py
dataset_name: matrixshapes_zero_shot dataset_name: matrixshapes_zero_shot
include: ../greedy_until_template_yaml include: ../generate_until_template_yaml
task: bigbench_matrixshapes_greedy_until task: bigbench_matrixshapes_generate_until
# Generated by utils.py # Generated by utils.py
dataset_name: metaphor_boolean_zero_shot dataset_name: metaphor_boolean_zero_shot
include: ../greedy_until_template_yaml include: ../generate_until_template_yaml
task: bigbench_metaphor_boolean_greedy_until task: bigbench_metaphor_boolean_generate_until
# Generated by utils.py # Generated by utils.py
dataset_name: metaphor_understanding_zero_shot dataset_name: metaphor_understanding_zero_shot
include: ../greedy_until_template_yaml include: ../generate_until_template_yaml
task: bigbench_metaphor_understanding_greedy_until task: bigbench_metaphor_understanding_generate_until
# Generated by utils.py # Generated by utils.py
dataset_name: minute_mysteries_qa_zero_shot dataset_name: minute_mysteries_qa_zero_shot
include: ../greedy_until_template_yaml include: ../generate_until_template_yaml
task: bigbench_minute_mysteries_qa_greedy_until task: bigbench_minute_mysteries_qa_generate_until
# Generated by utils.py # Generated by utils.py
dataset_name: misconceptions_zero_shot dataset_name: misconceptions_zero_shot
include: ../greedy_until_template_yaml include: ../generate_until_template_yaml
task: bigbench_misconceptions_greedy_until task: bigbench_misconceptions_generate_until
# Generated by utils.py # Generated by utils.py
dataset_name: misconceptions_russian_zero_shot dataset_name: misconceptions_russian_zero_shot
include: ../greedy_until_template_yaml include: ../generate_until_template_yaml
task: bigbench_misconceptions_russian_greedy_until task: bigbench_misconceptions_russian_generate_until
# Generated by utils.py # Generated by utils.py
dataset_name: mnist_ascii_zero_shot dataset_name: mnist_ascii_zero_shot
include: ../greedy_until_template_yaml include: ../generate_until_template_yaml
task: bigbench_mnist_ascii_greedy_until task: bigbench_mnist_ascii_generate_until
# Generated by utils.py # Generated by utils.py
dataset_name: modified_arithmetic_zero_shot dataset_name: modified_arithmetic_zero_shot
include: ../greedy_until_template_yaml include: ../generate_until_template_yaml
task: bigbench_modified_arithmetic_greedy_until task: bigbench_modified_arithmetic_generate_until
# Generated by utils.py # Generated by utils.py
dataset_name: moral_permissibility_zero_shot dataset_name: moral_permissibility_zero_shot
include: ../greedy_until_template_yaml include: ../generate_until_template_yaml
task: bigbench_moral_permissibility_greedy_until task: bigbench_moral_permissibility_generate_until
# Generated by utils.py # Generated by utils.py
dataset_name: movie_dialog_same_or_different_zero_shot dataset_name: movie_dialog_same_or_different_zero_shot
include: ../greedy_until_template_yaml include: ../generate_until_template_yaml
task: bigbench_movie_dialog_same_or_different_greedy_until task: bigbench_movie_dialog_same_or_different_generate_until
# Generated by utils.py # Generated by utils.py
dataset_name: movie_recommendation_zero_shot dataset_name: movie_recommendation_zero_shot
include: ../greedy_until_template_yaml include: ../generate_until_template_yaml
task: bigbench_movie_recommendation_greedy_until task: bigbench_movie_recommendation_generate_until
# Generated by utils.py # Generated by utils.py
dataset_name: mult_data_wrangling_zero_shot dataset_name: mult_data_wrangling_zero_shot
include: ../greedy_until_template_yaml include: ../generate_until_template_yaml
task: bigbench_mult_data_wrangling_greedy_until task: bigbench_mult_data_wrangling_generate_until
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment