# Shared multiple-choice settings for the `mmlu_style_02_lo` group.
# NOTE(review): no `task:` or `dataset_name:` key is set here — presumably this
# file is a template included by per-subject configs; confirm.
group: mmlu_style_02_lo
dataset_path: cais/mmlu

# Splits: `test` for evaluation, `dev` as the few-shot example pool.
test_split: test
fewshot_split: dev

output_type: multiple_choice

# Prompt template: the stripped question, the four options lettered A-D, then
# an "A: " answer cue. Double quotes are required so `\n` becomes a newline.
# NOTE(review): the prompt ends with a trailing space; if the consumer also
# inserts a delimiter before the target, the result is a double space — verify
# this is intended for this prompt style.
doc_to_text: "Q: {{question.strip()}}\nA. {{choices[0]}}\nB. {{choices[1]}}\nC. {{choices[2]}}\nD. {{choices[3]}}\nA: "

# Candidate answer strings, listed in the same order as the lettered options
# in the prompt above.
doc_to_choice:
  - 'A.'
  - 'B.'
  - 'C.'
  - 'D.'

# Document field holding the gold answer.
# NOTE(review): presumably an index into `doc_to_choice` — confirm against the
# dataset schema.
doc_to_target: answer
# Metrics reported for this task. Every entry states its aggregation and
# direction explicitly instead of relying on the metric registry's defaults.
metric_list:
  - metric: acc
    aggregation: mean
    higher_is_better: true
  # Brier score is a loss-style metric, so lower values are better.
  # NOTE(review): `brier_score` is assumed to be the aggregation registered
  # for this metric in the harness version in use — confirm.
  - metric: brier_score
    aggregation: brier_score
    higher_is_better: false
