# lm-evaluation-harness settings for an MMLU prompt-style variant: a
# "Q: ... A:" frame with the four options lettered (A) through (D).
# NOTE(review): neither `task` nor `dataset_name` is set here, so this is
# presumably a shared template included by per-subject configs - confirm.
group: mmlu_style_01_lo
dataset_path: cais/mmlu
test_split: test
fewshot_split: dev
output_type: multiple_choice
# The prompt must not end in whitespace: the harness inserts
# `target_delimiter` (a single space by default, per the task guide) between
# this text and each choice, so a trailing space here would render as
# "A:  (A)" with a double space. `|-` keeps the line breaks and adds no
# trailing newline.
doc_to_text: |-
  Q: {{question.strip()}}
  (A) {{choices[0]}}
  (B) {{choices[1]}}
  (C) {{choices[2]}}
  (D) {{choices[3]}}
  A:
# Candidate continuations, in the same order as the options in the prompt.
doc_to_choice: ['(A)', '(B)', '(C)', '(D)']
# NOTE(review): `answer` is presumably the dataset's integer label column,
# used as an index into `doc_to_choice` - verify against the dataset schema.
doc_to_target: answer
metric_list:
  - metric: acc
    aggregation: mean
    higher_is_better: true
  # Spelled out like `acc` above instead of relying on registry defaults;
  # a Brier score is an error measure, so lower is better.
  - metric: brier_score
    aggregation: brier_score
    higher_is_better: false
