# obqa_gen_9069e4.py -- OpenBookQA dataset config using generation-based inference.
from opencompass.openicl.icl_prompt_template import PromptTemplate
from opencompass.openicl.icl_retriever import ZeroRetriever
from opencompass.openicl.icl_inferencer import GenInferencer
from opencompass.openicl.icl_evaluator import AccEvaluator
from opencompass.datasets import OBQADataset
# Used as the pred_postprocessor in the evaluation config below.
from opencompass.utils.text_postprocessors import first_capital_postprocess
# Each list below has two parallel entries: [0] the plain question prompt,
# [1] the prompt that is additionally given "fact1".

# Reader input columns per dataset variant: every variant reads the question
# stem and the four options; the second variant also reads "fact1".
_input_columns = [
    ["question_stem", "A", "B", "C", "D", *_extra]
    for _extra in ([], ["fact1"])
]
# Prompt templates per dataset variant. Each template is a single HUMAN turn
# ending in "Answer:"; the second one prepends the "fact1" field to the
# question.
_template = [
    {"round": [{"role": "HUMAN", "prompt": _prompt}]}
    for _prompt in (
        "Question: {question_stem}\nA. {A}\nB. {B}\nC. {C}\nD. {D}\nAnswer:",
        "Given the fact: {fact1}\nQuestion: {question_stem}\nA. {A}\nB. {B}\nC. {C}\nD. {D}\nAnswer:",
    )
]

# Dataset entries for the two variants: the plain "openbookqa" test split and
# the "additional" configuration (abbr "openbookqa_fact"). The reader, infer
# and eval configs are attached to these dicts further down in the file.
obqa_datasets = [
    {
        "abbr": "openbookqa",
        "type": OBQADataset,
        "path": "openbookqa",
        "split": "test",
    },
    {
        "abbr": "openbookqa_fact",
        "type": OBQADataset,
        "path": "openbookqa",
        "name": "additional",
        "split": "test",
    },
]

# Attach the reader, inference and evaluation configs to every dataset entry.
# `_input_columns` and `_template` are indexed in parallel with
# `obqa_datasets`. Iterating over the datasets themselves (rather than a
# hard-coded count) keeps the loop correct if a variant is added, and a
# missing column list or template fails loudly with IndexError.
for _i, _dataset in enumerate(obqa_datasets):
    obqa_reader_cfg = dict(
        input_columns=_input_columns[_i],
        output_column="answerKey",
    )
    obqa_infer_cfg = dict(
        prompt_template=dict(
            type=PromptTemplate,
            template=_template[_i],
        ),
        retriever=dict(type=ZeroRetriever),
        inferencer=dict(type=GenInferencer),
    )
    obqa_eval_cfg = dict(
        evaluator=dict(type=AccEvaluator),
        pred_role="BOT",
        # NOTE(review): presumably reduces the generated text to its first
        # capital letter (the option label) before scoring -- confirm against
        # first_capital_postprocess.
        pred_postprocessor=dict(type=first_capital_postprocess),
    )

    _dataset["reader_cfg"] = obqa_reader_cfg
    _dataset["infer_cfg"] = obqa_infer_cfg
    _dataset["eval_cfg"] = obqa_eval_cfg