obqa_ppl_2b5b12.py 1.92 KB
Newer Older
Ezra-Yu's avatar
Ezra-Yu committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
from opencompass.openicl.icl_prompt_template import PromptTemplate
from opencompass.openicl.icl_retriever import ZeroRetriever
from opencompass.openicl.icl_inferencer import PPLInferencer
from opencompass.openicl.icl_evaluator import AccEvaluator
from opencompass.datasets import OBQADataset

# Reader input columns for the two dataset variants handled in this file.
# Index 0 reads only the question and its four options; index 1 additionally
# reads the 'fact1' column.
_input_columns = [
    ['question_stem', 'A', 'B', 'C', 'D', *extra_columns]
    for extra_columns in ([], ['fact1'])
]

# Prompt templates, index-aligned with _input_columns. Each template maps a
# candidate answer letter to a two-turn dialogue: the HUMAN turn holds the
# question and options (prefixed by the fact for the second variant), and the
# BOT turn holds that candidate letter.
_template = [
    {
        option: {
            "round": [
                {"role": "HUMAN", "prompt": human_prompt},
                {"role": "BOT", "prompt": option},
            ],
        }
        for option in ('A', 'B', 'C', 'D')
    }
    for human_prompt in (
        "Question: {question_stem}\nA. {A}\nB. {B}\nC. {C}\nD. {D}\nAnswer:",
        "Given the fact: {fact1}\nQuestion: {question_stem}\nA. {A}\nB. {B}\nC. {C}\nD. {D}\nAnswer:",
    )
]

# Two OpenBookQA test-split dataset entries. The loop below attaches the
# reader, inference and evaluation settings to each entry by index.
obqa_datasets = [
    {
        # NOTE(review): no explicit 'abbr' here, unlike the second entry;
        # presumably the framework derives one from the other fields. Confirm.
        "type": OBQADataset,
        "path": 'openbookqa',
        "split": 'test',
    },
    {
        "abbr": 'openbookqa_fact',
        "type": OBQADataset,
        "path": 'openbookqa',
        "name": 'additional',
        "split": 'test',
    },
]
# Entry i is paired with _input_columns[i] and _template[i].
for _i in range(2):
    # The reference answer is read from the "answerKey" column.
    obqa_reader_cfg = {
        "input_columns": _input_columns[_i],
        "output_column": "answerKey",
    }
    obqa_infer_cfg = {
        "prompt_template": {
            "type": PromptTemplate,
            "template": _template[_i],
        },
        "retriever": {"type": ZeroRetriever},
        "inferencer": {"type": PPLInferencer},
    }
    obqa_eval_cfg = {"evaluator": {"type": AccEvaluator}}

    # Keyword order fixes the insertion order of the three added keys.
    obqa_datasets[_i].update(
        reader_cfg=obqa_reader_cfg,
        infer_cfg=obqa_infer_cfg,
        eval_cfg=obqa_eval_cfg,
    )