# commonsenseqa_ppl_5545e2.py
# (Repository blame-view residue removed; the last commit shown there was by gaotongxiao.)
from opencompass.openicl.icl_prompt_template import PromptTemplate
from opencompass.openicl.icl_retriever import MDLRetriever
from opencompass.openicl.icl_inferencer import PPLInferencer
from opencompass.openicl.icl_evaluator import AccEvaluator
from opencompass.datasets import commonsenseqaDataset

# Reader settings: the columns used as prompt inputs, the column used as the
# reference output, and the split named as the test split.
commonsenseqa_reader_cfg = {
    'input_columns': ['question', 'A', 'B', 'C', 'D', 'E'],
    'output_column': 'answerKey',
    'test_split': 'validation',
}

# Prompt template with one entry per answer label ('A' .. 'E').
# Every entry has the same HUMAN turn (the question) and differs only in the
# BOT turn, which is the '{A}' .. '{E}' placeholder for that label.
# NOTE(review): '</E>' is given both as each entry's `begin` and as
# `ice_token`; presumably it marks where in-context examples are spliced in --
# confirm against PromptTemplate.
_ice_template = dict(
    type=PromptTemplate,
    template={
        ans: dict(
            begin='</E>',
            round=[
                dict(role='HUMAN', prompt='Question: {question}\nAnswer: '),
                dict(role='BOT', prompt=ans_token),
            ])
        for ans, ans_token in [['A', '{A}'], ['B', '{B}'],
                               ['C', '{C}'], ['D', '{D}'],
                               ['E', '{E}']]
    },
    ice_token='</E>')

# Inference settings: the prompt template, the retriever and the inferencer.
# The same `_ice_template` object is passed both at the top level and to the
# retriever.
commonsenseqa_infer_cfg = {
    'ice_template': _ice_template,
    'retriever': {
        'type': MDLRetriever,
        'ice_num': 8,
        'candidate_num': 30,
        'select_time': 10,
        'seed': 1,
        'batch_size': 12,
        'ice_template': _ice_template,
    },
    'inferencer': {'type': PPLInferencer},
}

# Evaluation settings: a single evaluator entry of type AccEvaluator.
commonsenseqa_eval_cfg = {'evaluator': {'type': AccEvaluator}}

# Dataset entries exported by this config: a single CommonsenseQA entry that
# ties together the reader, inference and evaluation settings defined above.
commonsenseqa_datasets = [
    dict(
        abbr='commonsense_qa',
        type=commonsenseqaDataset,
        path='./data/commonsenseqa',
        reader_cfg=commonsenseqa_reader_cfg,
        infer_cfg=commonsenseqa_infer_cfg,
        eval_cfg=commonsenseqa_eval_cfg)
]