# Shared task settings for the `multiblimp` tag.
# Each document is scored as a two-way multiple choice between the `sen`
# and `wrong_sen` fields, with no few-shot examples.

# Dataset identifier and grouping tag.
dataset_path: jumelet/multiblimp
tag: multiblimp

output_type: multiple_choice
# NOTE(review): the split named `train` is used as the test split —
# presumably the dataset ships only that split; confirm.
test_split: train

# Empty context and delimiter: nothing is prepended to the choices.
doc_to_text: ""
target_delimiter: ""

# Target index 0 selects the first entry of `doc_to_choice`, i.e. `sen`.
doc_to_target: 0
# Quoted so YAML does not parse the leading `{{` as a flow mapping.
doc_to_choice: "{{[sen,wrong_sen]}}"

num_fewshot: 0

# Both metrics are averaged over documents; higher values are better.
metric_list:
  - metric: acc
    aggregation: mean
    higher_is_better: true
  - metric: acc_norm
    aggregation: mean
    higher_is_better: true

metadata:
  version: 0