# longbench.py - LongBench summarizer configuration
# Summarizer configuration for the LongBench datasets.
#
# `dataset_abbrs` lists the dataset abbreviations in a fixed order. Entries
# tagged `# category` are heading strings that introduce each task family
# rather than dataset names (presumably rendered as separator rows by the
# summarizer -- confirm against the consumer of this config).
summarizer = dict(
    dataset_abbrs=[
        '--------- LongBench Single-Document QA ---------',  # category
        'LongBench_narrativeqa',
        'LongBench_qasper',
        'LongBench_multifieldqa_en',
        'LongBench_multifieldqa_zh',
        '--------- LongBench Multi-Document QA ---------',  # category
        'LongBench_hotpotqa',
        'LongBench_2wikimqa',
        'LongBench_musique',
        'LongBench_dureader',
        '--------- LongBench Summarization ---------',  # category
        'LongBench_gov_report',
        'LongBench_qmsum',
        'LongBench_multi_news',
        'LongBench_vcsum',
        '--------- LongBench Few-shot Learning ---------',  # category
        'LongBench_trec',
        'LongBench_triviaqa',
        'LongBench_samsum',
        'LongBench_lsht',
        '--------- LongBench Synthetic Tasks ---------',  # category
        'LongBench_passage_count',
        'LongBench_passage_retrieval_en',
        'LongBench_passage_retrieval_zh',
        '--------- LongBench Code Completion ---------',  # category
        'LongBench_lcc',
        'LongBench_repobench-p',
    ],
    # Concatenate every list bound to a name ending in `_summary_groups` that
    # is in scope when this statement runs; with no such names the result is
    # an empty list.
    summary_groups=sum(
        [v for k, v in locals().items() if k.endswith("_summary_groups")],
        [],
    ),
    prompt_db=dict(
        database_path='configs/datasets/log.json',
        config_dir='configs/datasets',
        blacklist='.promptignore',
    ),
)