# ChemBench_gen.py: OpenCompass generation-style evaluation config for ChemBench.
from opencompass.openicl.icl_prompt_template import PromptTemplate
from opencompass.openicl.icl_retriever import FixKRetriever
from opencompass.openicl.icl_inferencer import GenInferencer
from opencompass.openicl.icl_evaluator import AccEvaluator
from opencompass.datasets import ChemBenchDataset
from opencompass.utils.text_postprocessors import first_capital_postprocess


# Reader configuration shared by every ChemBench subset.
#   input_columns: dataset fields made available to the prompt (the question
#                  text plus the four answer options).
#   output_column: field holding the reference answer.
#   train_split:   presumably the split in-context examples are taken from;
#                  confirm against the OpenCompass dataset-reader docs.
chembench_reader_cfg = dict(
    input_columns=['input', 'A', 'B', 'C', 'D'],
    output_column='target',
    train_split='dev')

# Names of the ChemBench subsets covered by this config. Order matters only in
# that it determines the order of the generated dataset entries.
chembench_all_sets = [
    'Name_Conversion', 'Property_Prediction',
    'Mol2caption', 'Caption2mol',
    'Product_Prediction', 'Retrosynthesis',
    'Yield_Prediction', 'Temperature_Prediction', 'Solvent_Prediction',
]


# Build one dataset config per ChemBench subset and collect them here.
chembench_datasets = []
for _name in chembench_all_sets:
    # The instruction is the same generic text for every subset; it does not
    # mention `_name`. It stays inside the loop so the trailing `del` below
    # always has a `_hint` to remove.
    _hint = ('There is a single choice question about chemistry. '
             'Answer the question by replying A, B, C or D.')

    chembench_infer_cfg = dict(
        # Template for one in-context example: the question with its four
        # options (HUMAN turn) followed by the reference answer (BOT turn).
        # Doubled braces in the f-string yield literal `{input}`, `{A}`, ...
        # placeholders that are left for the template to fill in later.
        ice_template=dict(
            type=PromptTemplate,
            template=dict(round=[
                dict(
                    role='HUMAN',
                    prompt=
                    f'{_hint}\nQuestion: {{input}}\nA. {{A}}\nB. {{B}}\nC. {{C}}\nD. {{D}}\nAnswer: '
                ),
                dict(role='BOT', prompt='{target}\n')
            ]),
        ),
        # Template for the actual test question: same HUMAN turn, no BOT turn.
        # `begin` holds the `ice_token` marker; presumably the rendered
        # in-context examples are substituted there (confirm against the
        # OpenCompass prompt-template docs).
        prompt_template=dict(
            type=PromptTemplate,
            template=dict(
                begin='</E>',
                round=[
                    dict(
                        role='HUMAN',
                        prompt=
                        f'{_hint}\nQuestion: {{input}}\nA. {{A}}\nB. {{B}}\nC. {{C}}\nD. {{D}}\nAnswer: '
                    ),
                ],
            ),
            ice_token='</E>',
        ),
        # Presumably selects the examples at indices 0-4 of the train split as
        # fixed few-shot demonstrations (verify against FixKRetriever).
        retriever=dict(type=FixKRetriever, fix_id_list=[0, 1, 2, 3, 4]),
        inferencer=dict(type=GenInferencer),
    )

    # Predictions pass through `first_capital_postprocess` before being scored
    # by `AccEvaluator`.
    chembench_eval_cfg = dict(
        evaluator=dict(type=AccEvaluator),
        pred_postprocessor=dict(type=first_capital_postprocess))

    chembench_datasets.append(
        dict(
            abbr=f'ChemBench_{_name}',
            type=ChemBenchDataset,
            path='./data/ChemBench/',
            name=_name,
            reader_cfg=chembench_reader_cfg,
            infer_cfg=chembench_infer_cfg,
            eval_cfg=chembench_eval_cfg,
        ))

# Remove the loop temporaries so they do not linger as module-level names.
del _name, _hint