Commit e160a9f9 authored by Baber
Browse files

add mc tasks

parent c0fc7172
from pathlib import Path
import datasets
if __name__ == "__main__":
    # Generate one task config per dataset config of the benchmark; configs
    # whose name starts with "dev" are skipped.
    subsets = [
        x
        for x in datasets.get_dataset_config_names(
            "mrlbenchmarks/global-piqa-nonparallel"
        )
        if not x.startswith("dev")
    ]

    # The YAML files are written next to this script.
    PARENT = Path(__file__).parent

    for s in subsets:
        # Explicit UTF-8 keeps the output independent of the locale's
        # default encoding. Each file only points at the shared template
        # and names its own task and dataset config.
        with open(PARENT / f"{s}.yaml", "w", encoding="utf-8") as f:
            f.write(
                "include: '_template_mc'\n"
                f"task: mrl_{s}\n"
                f"dataset_name: {s}\n"
            )
# Shared multiple-choice task settings. The per-subset configs pull a file in
# via `include: '_template_mc'` (presumably this one -- confirm the file name)
# and add only their own `task` and `dataset_name`.
dataset_path: mrlbenchmarks/global-piqa-nonparallel
output_type: multiple_choice
test_split: test
doc_to_text: prompt
doc_to_target: label
# The two candidate answers are taken from the solution0 / solution1 fields.
doc_to_choice: "{{[solution0, solution1]}}"
metric_list:
  - metric: acc
    aggregation: mean
    higher_is_better: true
metadata:
  version: 1.0
# Per-subset task configs. Each three-line stanza (include / task /
# dataset_name) has the shape the generator script writes to its own
# `<subset>.yaml` file; they appear concatenated in this view.
include: '_template_mc'
task: mrl_acq_arab
dataset_name: acq_arab
include: '_template_mc'
task: mrl_aeb_arab
dataset_name: aeb_arab
include: '_template_mc'
task: mrl_afb_arab
dataset_name: afb_arab
include: '_template_mc'
task: mrl_als_latn
dataset_name: als_latn
include: '_template_mc'
task: mrl_amh_ethi
dataset_name: amh_ethi
include: '_template_mc'
task: mrl_apc_arab_jord
dataset_name: apc_arab_jord
include: '_template_mc'
task: mrl_apc_arab_leba
dataset_name: apc_arab_leba
include: '_template_mc'
task: mrl_apc_arab_pale
dataset_name: apc_arab_pale
include: '_template_mc'
task: mrl_apc_arab_syri
dataset_name: apc_arab_syri
include: '_template_mc'
task: mrl_arb_arab
dataset_name: arb_arab
include: '_template_mc'
task: mrl_arq_arab
dataset_name: arq_arab
include: '_template_mc'
task: mrl_ars_arab
dataset_name: ars_arab
include: '_template_mc'
task: mrl_ary_arab
dataset_name: ary_arab
include: '_template_mc'
task: mrl_arz_arab
dataset_name: arz_arab
include: '_template_mc'
task: mrl_azj_latn
dataset_name: azj_latn
include: '_template_mc'
task: mrl_bam_latn
dataset_name: bam_latn
include: '_template_mc'
task: mrl_bel_cyrl
dataset_name: bel_cyrl
include: '_template_mc'
task: mrl_ben_latn
dataset_name: ben_latn
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment