# Evaluation task configuration: generation-style task scored by accuracy.
# NOTE(review): the key names match the lm-evaluation-harness task schema;
# confirm against the loader that actually consumes this file.

# Dataset identifier and the split that is evaluated.
# NOTE(review): presumably a Hugging Face Hub dataset path - confirm.
dataset_path: MMMU/MMMU
validation_split: validation

# Free-form generation; decoding stops on the `until` strings listed below.
output_type: generate_until

# `!function` is a custom (non-core) YAML tag, so the consuming loader must
# define it. Each value names an attribute of a `utils` module.
# NOTE(review): presumably a utils.py resolved relative to this file - confirm.
doc_to_image: !function utils.doc_to_image
doc_to_text: !function utils.doc_to_text
# Plain string, not a `!function` reference.
# NOTE(review): presumably the name of the dataset field holding the gold
# answer - confirm.
doc_to_target: "answer"
process_results: !function utils.process_results

# Decoding settings: sampling disabled with temperature 0.0, and at most
# 512 generated tokens per request.
generation_kwargs:
  until:
    - "<|endoftext|>"
  temperature: 0.0
  do_sample: false
  max_gen_toks: 512

# A single metric, `acc`, averaged over documents; larger values are better.
metric_list:
  - metric: acc
    aggregation: mean
    higher_is_better: true

metadata:
  # Left unquoted so it stays a float, exactly as in the original value.
  version: 0.0