# Task configuration for `coqcat`: generative conversational question
# answering over the `projecte-aina/CoQCat` dataset.
# NOTE(review): the key names match the lm-evaluation-harness task schema;
# confirm against the harness version in use.
task: coqcat
dataset_path: projecte-aina/CoQCat
output_type: generate_until

# Dataset split names.
training_split: train
validation_split: validation
test_split: test

# Prompt layout: the story, then every question/answer turn except the last,
# then the last question followed by an open "A:" for the model to complete.
# Single-quoted on purpose: YAML leaves `\n` untouched so that Jinja, not
# YAML, interprets the escape inside its own string literals.
doc_to_text: '{{story+"\n\n"}}{% for i in range(questions|length-1) %}{{"Q: "+questions[i]+"\n\n"+"A: "+answers["input_text"][i]+"\n\n"}}{% endfor %}{{"Q: "+questions[-1]+"\n\n"+"A:"}}'

# Gold target: the answer text stored at the index of the last question.
doc_to_target: '{{ answers["input_text"][questions|length - 1] }}'

# Scoring is delegated to `process_results_coqcat` in the `utils` module,
# which is not visible from this file.
process_results: !function utils.process_results_coqcat

# Decontamination query: the story followed by all questions, one per line.
# `questions` is indexed as a list of plain strings in `doc_to_text`, so it
# is joined directly; there is no `question` field referenced anywhere else.
should_decontaminate: true
doc_to_decontamination_query: "{{story}} {{questions|join('\n')}}"

# Stop generating as soon as the model starts a new "Q:" turn.
# Double-quoted so that `\n` is a real newline character.
generation_kwargs:
  until:
    - "\nQ:"

# Both metrics are averaged with `mean`; higher values are better.
metric_list:
  - metric: "em"
    aggregation: mean
    higher_is_better: true
  - metric: "f1"
    aggregation: mean
    higher_is_better: true

metadata:
  version: 1.0