# Task settings for a generation-style evaluation on the
# RMT-team/babilong-1k-samples dataset.
# NOTE(review): this looks like a shared template that per-task files include;
# confirm against the files that reference it.

# Dataset identifier (presumably a Hugging Face Hub repo id; verify).
dataset_path: RMT-team/babilong-1k-samples
output_type: generate_until

# Template rendering the reference answer; quoted so the leading "{" is not
# parsed as a YAML flow mapping.
doc_to_target: "{{target}}"
# A single space; quoted because a bare space would parse as an empty value.
target_delimiter: " "
num_fewshot: 2

# Custom `!function` tag: must be resolved by the consuming tool's YAML loader
# (a generic safe loader will reject it).
process_results: !function common_utils.process_results

metric_list:
  - metric: acc
    aggregation: mean
    higher_is_better: true

generation_kwargs:
  # Sampling disabled with temperature 0.0 (presumably greedy decoding).
  do_sample: false
  temperature: 0.0
  max_gen_toks: 16
  # Explicit empty list rather than a bare `until:` (which would be null).
  until: []

metadata:
  # NOTE(review): parsed as the float 0.0, not a string; kept as in the original.
  version: 0.0