# ceval_contamination_ppl_810ec6.py
from opencompass.openicl.icl_prompt_template import PromptTemplate
from opencompass.openicl.icl_retriever import ZeroRetriever
from opencompass.openicl.icl_inferencer import PPLOnlyInferencer
from opencompass.openicl.icl_evaluator import AveragePPLEvaluator
from opencompass.datasets import JsonlDataset

# Collected dataset configs; each section of this file appends one entry.
ceval_datasets = []

# Inference setup for the 'ceval-val-ppl' entry: the prompt template emits
# the record's `text` field verbatim, using ZeroRetriever and
# PPLOnlyInferencer.
ceval_infer_cfg = dict(
    prompt_template=dict(type=PromptTemplate, template='{text}'),
    retriever=dict(type=ZeroRetriever),
    inferencer=dict(type=PPLOnlyInferencer),
)

# Results are scored with AveragePPLEvaluator.
ceval_eval_cfg = dict(evaluator=dict(type=AveragePPLEvaluator))

# Only the `text` column is read; no output column is configured.
ceval_reader_cfg = dict(
    input_columns=['text'],
    output_column=None,
)

ceval_datasets.append(
    dict(
        abbr='ceval-val-ppl',
        type=JsonlDataset,
        # NOTE(review): absolute, user-specific path; presumably only
        # resolvable on the original author's cluster -- confirm before reuse.
        path='/mnt/petrelfs/zhoufengzhe/repos/cscripts/mock-datas/ceval_val_content.jsonl',
        reader_cfg=ceval_reader_cfg,
        infer_cfg=ceval_infer_cfg,
        eval_cfg=ceval_eval_cfg,
    )
)

# Inference setup for the 'ceval-ref-ppl' entry: identical to the setup
# above except that the template emits the record's `rephrase` field.
# The module-level names are rebound to fresh dicts here; the entry already
# appended to `ceval_datasets` keeps its references to the earlier dicts.
ceval_infer_cfg = dict(
    prompt_template=dict(type=PromptTemplate, template='{rephrase}'),
    retriever=dict(type=ZeroRetriever),
    inferencer=dict(type=PPLOnlyInferencer),
)

# Results are scored with AveragePPLEvaluator.
ceval_eval_cfg = dict(evaluator=dict(type=AveragePPLEvaluator))

# Only the `rephrase` column is read; no output column is configured.
ceval_reader_cfg = dict(
    input_columns=['rephrase'],
    output_column=None,
)

ceval_datasets.append(
    dict(
        abbr='ceval-ref-ppl',
        type=JsonlDataset,
        # Same JSONL file as the 'ceval-val-ppl' entry; only the column read
        # from each record differs.
        # NOTE(review): absolute, user-specific path; presumably only
        # resolvable on the original author's cluster -- confirm before reuse.
        path='/mnt/petrelfs/zhoufengzhe/repos/cscripts/mock-datas/ceval_val_content.jsonl',
        reader_cfg=ceval_reader_cfg,
        infer_cfg=ceval_infer_cfg,
        eval_cfg=ceval_eval_cfg,
    )
)