# Multiple-choice evaluation config for the `mmlu_style_04_lo` group.
# Each question is rendered as "Q: ..." followed by four options labelled
# "A," through "D," and a final "A: " answer cue.
# NOTE(review): no `task` or `dataset_name` key is set here -- presumably this
# file is a shared template that per-subject configs include; confirm.
group: mmlu_style_04_lo
dataset_path: cais/mmlu
test_split: test
fewshot_split: dev
output_type: multiple_choice
# Double quotes are required so that each `\n` is parsed as a real newline.
# NOTE(review): the prompt ends with a trailing space ("A: "); confirm this is
# intended given whatever delimiter the harness puts before the target.
doc_to_text: "Q: {{question.strip()}}\nA, {{choices[0]}}\nB, {{choices[1]}}\nC, {{choices[2]}}\nD, {{choices[3]}}\nA: "
# The candidate continuations keep the trailing comma so they match the option
# labels used in the prompt above.
doc_to_choice: ['A,', 'B,', 'C,', 'D,']
# Presumably `answer` holds the index of the correct choice -- verify against
# the dataset schema.
doc_to_target: answer
metric_list:
  - metric: acc
    aggregation: mean
    higher_is_better: true
  # Spelled out explicitly (instead of relying on registry defaults) so this
  # entry is as self-describing as `acc`; a Brier score is an error measure,
  # so lower is better.
  - metric: brier_score
    aggregation: brier_score
    higher_is_better: false
