# Task configuration for `swag` (multiple-choice output type).
# NOTE(review): key names match the lm-evaluation-harness task schema —
# confirm against the consuming tool before changing any key.
task: swag

# Dataset source and configuration name.
dataset_path: swag
dataset_name: regular

output_type: multiple_choice

# Splits: no test split is configured.
training_split: train
validation_split: validation
test_split: null

# Prompt, gold label and answer choices.
# NOTE(review): `startphrase`, `label` and `ending0..3` are presumably
# dataset column names — verify against the dataset schema.
doc_to_text: startphrase
doc_to_target: label
# Quoted so YAML does not parse the leading `{{` as a flow mapping.
doc_to_choice: "{{[ending0, ending1, ending2, ending3]}}"

# Reported metrics; both are mean-aggregated and higher is better.
metric_list:
  - metric: acc
    aggregation: mean
    higher_is_better: true
  - metric: acc_norm
    aggregation: mean
    higher_is_better: true

metadata:
  # Left unquoted on purpose: this keeps the value a float, as in the original.
  version: 1.0