Commit a5a9017b authored by lintangsutawika
Browse files

Merge branch 'big-refactor' of https://github.com/EleutherAI/lm-evaluation-harness into xstorycloze

parents a04a600a 7634a6ec
# Generated by utils.py
# Pairs dataset_name `npi_present_2` with the task name `blimp_npi_present_2`.
# All other settings are presumably inherited from template_yaml via
# `include` -- confirm against the config loader.
dataset_name: npi_present_2
include: template_yaml
task: blimp_npi_present_2
# Generated by utils.py
# Pairs dataset_name `only_npi_licensor_present` with the task name
# `blimp_only_npi_licensor_present`.
# All other settings are presumably inherited from template_yaml via
# `include` -- confirm against the config loader.
dataset_name: only_npi_licensor_present
include: template_yaml
task: blimp_only_npi_licensor_present
# Generated by utils.py
# Pairs dataset_name `only_npi_scope` with the task name `blimp_only_npi_scope`.
# All other settings are presumably inherited from template_yaml via
# `include` -- confirm against the config loader.
dataset_name: only_npi_scope
include: template_yaml
task: blimp_only_npi_scope
# Generated by utils.py
# Pairs dataset_name `passive_1` with the task name `blimp_passive_1`.
# All other settings are presumably inherited from template_yaml via
# `include` -- confirm against the config loader.
dataset_name: passive_1
include: template_yaml
task: blimp_passive_1
# Generated by utils.py
# Pairs dataset_name `passive_2` with the task name `blimp_passive_2`.
# All other settings are presumably inherited from template_yaml via
# `include` -- confirm against the config loader.
dataset_name: passive_2
include: template_yaml
task: blimp_passive_2
# Generated by utils.py
# Pairs dataset_name `principle_A_c_command` with the task name
# `blimp_principle_A_c_command`.
# All other settings are presumably inherited from template_yaml via
# `include` -- confirm against the config loader.
dataset_name: principle_A_c_command
include: template_yaml
task: blimp_principle_A_c_command
# Generated by utils.py
# Pairs dataset_name `principle_A_case_1` with the task name
# `blimp_principle_A_case_1`.
# All other settings are presumably inherited from template_yaml via
# `include` -- confirm against the config loader.
dataset_name: principle_A_case_1
include: template_yaml
task: blimp_principle_A_case_1
# Generated by utils.py
# Pairs dataset_name `principle_A_case_2` with the task name
# `blimp_principle_A_case_2`.
# All other settings are presumably inherited from template_yaml via
# `include` -- confirm against the config loader.
dataset_name: principle_A_case_2
include: template_yaml
task: blimp_principle_A_case_2
# Generated by utils.py
# Pairs dataset_name `principle_A_domain_1` with the task name
# `blimp_principle_A_domain_1`.
# All other settings are presumably inherited from template_yaml via
# `include` -- confirm against the config loader.
dataset_name: principle_A_domain_1
include: template_yaml
task: blimp_principle_A_domain_1
# Generated by utils.py
# Pairs dataset_name `principle_A_domain_2` with the task name
# `blimp_principle_A_domain_2`.
# All other settings are presumably inherited from template_yaml via
# `include` -- confirm against the config loader.
dataset_name: principle_A_domain_2
include: template_yaml
task: blimp_principle_A_domain_2
# Generated by utils.py
# Pairs dataset_name `principle_A_domain_3` with the task name
# `blimp_principle_A_domain_3`.
# All other settings are presumably inherited from template_yaml via
# `include` -- confirm against the config loader.
dataset_name: principle_A_domain_3
include: template_yaml
task: blimp_principle_A_domain_3
# Generated by utils.py
# Pairs dataset_name `principle_A_reconstruction` with the task name
# `blimp_principle_A_reconstruction`.
# All other settings are presumably inherited from template_yaml via
# `include` -- confirm against the config loader.
dataset_name: principle_A_reconstruction
include: template_yaml
task: blimp_principle_A_reconstruction
# Generated by utils.py
# Pairs dataset_name `regular_plural_subject_verb_agreement_1` with the task
# name `blimp_regular_plural_subject_verb_agreement_1`.
# All other settings are presumably inherited from template_yaml via
# `include` -- confirm against the config loader.
dataset_name: regular_plural_subject_verb_agreement_1
include: template_yaml
task: blimp_regular_plural_subject_verb_agreement_1
# Generated by utils.py
# Pairs dataset_name `regular_plural_subject_verb_agreement_2` with the task
# name `blimp_regular_plural_subject_verb_agreement_2`.
# All other settings are presumably inherited from template_yaml via
# `include` -- confirm against the config loader.
dataset_name: regular_plural_subject_verb_agreement_2
include: template_yaml
task: blimp_regular_plural_subject_verb_agreement_2
# Generated by utils.py
# Pairs dataset_name `sentential_negation_npi_licensor_present` with the task
# name `blimp_sentential_negation_npi_licensor_present`.
# All other settings are presumably inherited from template_yaml via
# `include` -- confirm against the config loader.
dataset_name: sentential_negation_npi_licensor_present
include: template_yaml
task: blimp_sentential_negation_npi_licensor_present
# Generated by utils.py
# Pairs dataset_name `sentential_negation_npi_scope` with the task name
# `blimp_sentential_negation_npi_scope`.
# All other settings are presumably inherited from template_yaml via
# `include` -- confirm against the config loader.
dataset_name: sentential_negation_npi_scope
include: template_yaml
task: blimp_sentential_negation_npi_scope
# Generated by utils.py
# Pairs dataset_name `sentential_subject_island` with the task name
# `blimp_sentential_subject_island`.
# All other settings are presumably inherited from template_yaml via
# `include` -- confirm against the config loader.
dataset_name: sentential_subject_island
include: template_yaml
task: blimp_sentential_subject_island
# Generated by utils.py
# Pairs dataset_name `superlative_quantifiers_1` with the task name
# `blimp_superlative_quantifiers_1`.
# All other settings are presumably inherited from template_yaml via
# `include` -- confirm against the config loader.
dataset_name: superlative_quantifiers_1
include: template_yaml
task: blimp_superlative_quantifiers_1
# Generated by utils.py
# Pairs dataset_name `superlative_quantifiers_2` with the task name
# `blimp_superlative_quantifiers_2`.
# All other settings are presumably inherited from template_yaml via
# `include` -- confirm against the config loader.
dataset_name: superlative_quantifiers_2
include: template_yaml
task: blimp_superlative_quantifiers_2
# Settings shared by the BLiMP tasks.
# NOTE(review): presumably this is the `template_yaml` that the per-subtask
# configs pull in through `include` -- confirm.
group: blimp
dataset_path: blimp
output_type: multiple_choice
# The Hugging Face BLiMP dataset publishes only a `train` split; there is no
# `validation` split to load, so evaluation has to read from `train`.
validation_split: train
# Empty context: no prompt text is placed before the candidate sentences.
doc_to_text: ""
# Presumably an index into doc_to_choice; index 0 there is `sentence_good`.
doc_to_target: 0
doc_to_choice: "{{[sentence_good, sentence_bad]}}"
should_decontaminate: true
# Both sentences of the minimal pair form the decontamination query.
doc_to_decontamination_query: "{{sentence_good}} {{sentence_bad}}"
metric_list:
- metric: acc
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment