# Task definition for the tinyMMLU benchmark.
# NOTE(review): key names follow the lm-evaluation-harness task schema;
# confirm against the harness version in use.
task: tinyMMLU

# Dataset location and the configuration ("all") to load.
dataset_path: tinyBenchmarks/tinyMMLU
dataset_name: all

# Evaluate on `test`; few-shot examples, when requested, come from `dev`
# using the `first_n` sampler.
test_split: test
fewshot_split: dev
fewshot_config:
  sampler: first_n

# Multiple-choice prompt: the prompt is taken from the `input_formatted`
# field, the candidate answers are the four letters, and the target is
# read from the `answer` field.
output_type: multiple_choice
doc_to_text: "{{input_formatted}}"
doc_to_choice: ["A", "B", "C", "D"]
doc_to_target: answer

# Zero-shot by default.
num_fewshot: 0

# Report accuracy, averaged over documents.
metric_list:
  - metric: acc
    aggregation: mean
    higher_is_better: true

# Kept as an unquoted number so the loaded type is unchanged.
# NOTE(review): presumably the harness expects a numeric version; confirm.
metadata:
  version: 0.0