# Task configuration for `squadv2`.
# Settings not listed here come from the included `_template_yaml` file
# (not visible from this file; resolved by the consuming loader).
include: _template_yaml
task: squadv2
output_type: generate_until
generation_kwargs:
  # Double quotes are required so that \n is read as a newline character
  # rather than a literal backslash followed by "n".
  # NOTE(review): presumably these are the stop sequences for generation;
  # confirm against the consumer's schema.
  until:
    - "\n"
# `!function` is a custom tag, not core YAML: the loader that reads this
# file must define it. NOTE(review): presumably it resolves `utils.exact`
# and `utils.f1` to callables in a sibling `utils` module; confirm.
metric_list:
  - metric: !function utils.exact
    aggregation: mean
    higher_is_better: true
  - metric: !function utils.f1
    aggregation: mean
    higher_is_better: true