# ARC_c_clean_ppl.py
from opencompass.openicl.icl_prompt_template import PromptTemplate
from opencompass.openicl.icl_retriever import ZeroRetriever
from opencompass.openicl.icl_inferencer import PPLInferencer
from opencompass.openicl.icl_evaluator import AccContaminationEvaluator
from opencompass.datasets import ARCDatasetClean as ARCDataset

# Reader settings: the question plus the four option-text columns are the
# inputs, and 'answerKey' is the column holding the reference answer.
ARC_c_reader_cfg = {
    'input_columns': [
        'question',
        'textA',
        'textB',
        'textC',
        'textD',
    ],
    'output_column': 'answerKey',
}

# Inference settings: a zero-retrieval setup (ZeroRetriever) run through
# PPLInferencer, with one prompt variant per answer label.
ARC_c_infer_cfg = dict(
    prompt_template=dict(
        type=PromptTemplate,
        # Keys are the candidate labels 'A'-'D'. Every variant shares the same
        # HUMAN turn and differs only in the BOT turn, which is filled with the
        # matching option text ({textA} ... {textD}).
        # NOTE(review): presumably the labels must match the values found in
        # the 'answerKey' column, and the inferencer selects the label whose
        # variant scores best -- confirm against the OpenCompass docs.
        template={
            'A':
            dict(
                round=[
                    dict(role='HUMAN', prompt='Question: {question}\nAnswer: '),
                    dict(role='BOT', prompt='{textA}')
                ], ),
            'B':
            dict(
                round=[
                    dict(role='HUMAN', prompt='Question: {question}\nAnswer: '),
                    dict(role='BOT', prompt='{textB}')
                ], ),
            'C':
            dict(
                round=[
                    dict(role='HUMAN', prompt='Question: {question}\nAnswer: '),
                    dict(role='BOT', prompt='{textC}')
                ], ),
            'D':
            dict(
                round=[
                    dict(role='HUMAN', prompt='Question: {question}\nAnswer: '),
                    dict(role='BOT', prompt='{textD}')
                ], ),
        }),
    retriever=dict(type=ZeroRetriever),
    inferencer=dict(type=PPLInferencer))

# Evaluation settings: score with AccContaminationEvaluator and switch on the
# 'analyze_contamination' flag.
ARC_c_eval_cfg = {
    'evaluator': {
        'type': AccContaminationEvaluator,
    },
    'analyze_contamination': True,
}

# Dataset entries defined by this config: a single entry, abbreviated
# 'ARC-c-test', that ties the JSONL file to the reader, inference and
# evaluation settings defined in this file.
ARC_c_datasets = [
    {
        'type': ARCDataset,
        'abbr': 'ARC-c-test',
        'path': './data/ARC/ARC-c/ARC-Challenge-Test.jsonl',
        'reader_cfg': ARC_c_reader_cfg,
        'infer_cfg': ARC_c_infer_cfg,
        'eval_cfg': ARC_c_eval_cfg,
    },
]