xiezhi_gen_b86cf5.py 1.73 KB
Newer Older
1
2
3
4
5
6
7
8
from opencompass.openicl.icl_prompt_template import PromptTemplate
from opencompass.openicl.icl_inferencer import GenInferencer
from opencompass.openicl.icl_evaluator import AccEvaluator
from opencompass.datasets import XiezhiDataset, XiezhiRetriever
from opencompass.utils.text_postprocessors import first_capital_postprocess

xiezhi_datasets = []

9
for split in ['spec_eng', 'spec_chn', 'inter_eng', 'inter_chn']:
10
    if 'chn' in split:
11
        q_hint, a_hint = '题目', '答案'
12
    else:
13
        q_hint, a_hint = 'Question', 'Answer'
14
15

    xiezhi_reader_cfg = dict(
16
17
18
        input_columns=['question', 'A', 'B', 'C', 'D', 'labels'],
        output_column='answer',
        train_split='train',
19
20
21
22
23
24
        test_split='test',
    )
    xiezhi_infer_cfg = dict(
        ice_template=dict(
            type=PromptTemplate,
            template=dict(
25
                begin='</E>',
26
                round=[
27
28
                    dict(role='HUMAN', prompt=f'{q_hint}: {{question}}\nA. {{A}}\nB. {{B}}\nC. {{C}}\nD. {{D}}\n{a_hint}: '),
                    dict(role='BOT', prompt='{answer}'),
29
30
                ]
            ),
31
            ice_token='</E>',
32
33
34
35
36
37
        ),
        retriever=dict(type=XiezhiRetriever, ice_num=3),
        inferencer=dict(type=GenInferencer),
    )

    xiezhi_eval_cfg = dict(evaluator=dict(type=AccEvaluator),
38
                           pred_role='BOT',
39
40
41
42
43
                           pred_postprocessor=dict(type=first_capital_postprocess))

    xiezhi_datasets.append(
        dict(
            type=XiezhiDataset,
44
45
46
            abbr=f'xiezhi-{split}',
            path='./data/xiezhi/',
            name='xiezhi_' + split,
47
48
49
50
            reader_cfg=xiezhi_reader_cfg,
            infer_cfg=xiezhi_infer_cfg,
            eval_cfg=xiezhi_eval_cfg,
        ))