_longbench2_structured.yaml 216 Bytes
Newer Older
Janna's avatar
Janna committed
1
2
3
4
5
6
7
8
9
10
# Group definition that bundles the graph and table tasks under one name.
group: longbench2_structured
# Human-readable label for the group.
# NOTE(review): presumably shown in place of `group` in reports — confirm.
group_alias: "Long Structured Data Understanding"
# Member tasks that belong to this group.
task:
  - longbench2_graph
  - longbench2_table
# Metrics that are aggregated across the member tasks.
aggregate_metric_list:
  - metric: acc
    # Canonical lowercase boolean: resolves to a bool under YAML 1.1 and
    # every YAML 1.2 schema, unlike the capitalised `True` spelling.
    # NOTE(review): presumably weights each task by its sample count
    # when averaging — confirm against the consumer.
    weight_by_size: true
metadata:
  # NOTE(review): this is parsed as a float, not a string. Left unquoted
  # because the consumer may expect a number — confirm before changing.
  version: 0.0