# Task configuration for `squadv2`.
# NOTE(review): `include` presumably pulls shared defaults from a file named
# `_template_yaml` -- confirm against the consuming loader.
include: _template_yaml
task: squadv2
output_type: greedy_until
generation_kwargs:
  until:
    # Double quotes are required here: only double-quoted scalars process
    # the \n escape into a newline character.
    - "\n"
metric_list:
  # `!function` is a custom (application-defined) tag, so the consuming
  # loader must register a constructor for it.
  # NOTE(review): `utils.exact` / `utils.f1` presumably name callables in a
  # sibling `utils` module -- confirm.
  - metric: !function utils.exact
    aggregation: mean
    higher_is_better: true
  - metric: !function utils.f1
    aggregation: mean
    higher_is_better: true