winogrande_ppl_55a66e.py 1.19 KB
Newer Older
cky's avatar
cky committed
1
2
3
4
5
6
from opencompass.openicl.icl_prompt_template import PromptTemplate
from opencompass.openicl.icl_retriever import ZeroRetriever
from opencompass.openicl.icl_inferencer import PPLInferencer
from opencompass.openicl.icl_evaluator import AccEvaluator
from opencompass.datasets import winograndeDataset

Hubert's avatar
Hubert committed
7
8
# WARNING: This config cannot reproduce the results reported in the paper,
# e.g. LLAMA2-7B Winogrande: 69.2 (paper) -> 62.27 (this config).
# Please use winogrande_ll_c5cf57 instead.
Hubert's avatar
Hubert committed
10

cky's avatar
cky committed
11
12
13
# Reader configuration: names the dataset columns that feed the prompt
# template ('opt1', 'opt2') and the column holding the reference label
# ('answer').
winogrande_reader_cfg = dict(
    input_columns=['opt1', 'opt2'],
    output_column='answer',
)
cky's avatar
cky committed
15
16
17
18
19
20

# Inference configuration.
#
# The prompt template is a mapping with one entry per candidate, keyed by
# the integers 1 and 2. Entry ``i`` is a single-turn HUMAN prompt whose text
# is 'Good sentence: {opt<i>}'; the doubled braces in the f-string leave a
# literal '{opt1}' / '{opt2}' placeholder in the resulting prompt string.
# NOTE(review): the keys presumably correspond to the values of the
# 'answer' column and the placeholders are filled from the 'opt1'/'opt2'
# columns -- confirm against winograndeDataset.
winogrande_infer_cfg = dict(
    prompt_template=dict(
        type=PromptTemplate,
        template={
            i: dict(round=[
                dict(role='HUMAN', prompt=f'Good sentence: {{opt{i}}}'),
            ])
            for i in range(1, 3)
        }),
    retriever=dict(type=ZeroRetriever),
    inferencer=dict(type=PPLInferencer))

# Evaluation configuration: predictions are scored with AccEvaluator.
winogrande_eval_cfg = dict(
    evaluator=dict(
        type=AccEvaluator,
    ),
)

# Dataset entries exported by this config. The single entry bundles the
# dataset class, its data path, and the reader / inference / evaluation
# configurations defined above under the abbreviation 'winogrande'.
winogrande_datasets = [
    dict(
        abbr='winogrande',
        type=winograndeDataset,
        path='./data/winogrande',
        reader_cfg=winogrande_reader_cfg,
        infer_cfg=winogrande_infer_cfg,
        eval_cfg=winogrande_eval_cfg)
]