# Multiple-choice evaluation task over the "abstract_algebra" configuration of
# the amias-mx/mmlu-redux-2.0-spanish dataset, scored by mean accuracy.
# NOTE(review): the key names match the lm-evaluation-harness task schema;
# confirm that is the consumer of this file.
task: "mmlu_redux_spanish"

# Dataset location, configuration name, and the split used for evaluation.
dataset_path: amias-mx/mmlu-redux-2.0-spanish
dataset_name: abstract_algebra
test_split: test

output_type: multiple_choice

# Prompt template: the stripped question, the four options labelled A-D (one
# per line), then the "Answer:" cue. Double quotes are required so that each
# "\n" is interpreted as a real newline.
doc_to_text: "{{question.strip()}}\nA. {{choices[0]}}\nB. {{choices[1]}}\nC. {{choices[2]}}\nD. {{choices[3]}}\nAnswer:"

# Answer labels, in the same order as choices[0..3] in the prompt above.
doc_to_choice: ["A", "B", "C", "D"]

# Name of the document field that holds the gold answer.
# NOTE(review): presumably an index into doc_to_choice; verify against the
# dataset schema.
doc_to_target: answer

metric_list:
  - metric: acc
    aggregation: mean
    higher_is_better: true

metadata:
  version: 1.0

dataset_kwargs:
  # SECURITY: with Hugging Face `datasets`, this flag permits running the
  # loading script shipped in the dataset repository. Keep it only if that
  # repository is trusted (ideally pinned to a known revision).
  trust_remote_code: true