# Task configuration for the MMLU portion of the HCAI/metabench dataset,
# scored as a four-way multiple-choice task.
# NOTE(review): the key set (task, doc_to_text, metric_list, ...) looks like an
# lm-evaluation-harness task file - confirm against the consuming loader.
task: metabench_mmlu
tag:
  - metabench_mmlu_subset
dataset_path: HCAI/metabench
dataset_name: MMLU
# `!function` is a custom tag, so the consuming loader must define it; a plain
# safe loader will reject it. Presumably it resolves to `process_mmlu` in a
# sibling `process_docs` module - verify.
process_docs: !function process_docs.process_mmlu
output_type: multiple_choice
# Only a test split is configured; it is named `primary`.
training_split: null
validation_split: null
test_split: primary
# NOTE(review): no few-shot examples are requested here, yet the prompt below
# begins with the `five_shot_preprompt` field - presumably the shots are
# already baked into each document. Confirm against the dataset.
num_fewshot: 0
# Double-quoted on purpose: `\n` must be interpreted as a real newline.
doc_to_text: "{{five_shot_preprompt}}{{question.strip()}}\nA. {{choices[0]}}\nB. {{choices[1]}}\nC. {{choices[2]}}\nD. {{choices[3]}}\nAnswer:"
doc_to_choice: ["A", "B", "C", "D"]
doc_to_target: answer
metric_list:
  - metric: acc
    aggregation: mean
    higher_is_better: true
metadata:
  # Left as an unquoted float so the loaded type stays what it was.
  version: 0.0