repobench-p.yaml 451 Bytes
Newer Older
Baber's avatar
Baber committed
1
2
3
4
5
6
7
8
9
10
11
12

# Task definition for the `repobench-p` subset of the THUDM/LongBench dataset,
# registered as `longbench_repobench-p` under the `longbench` tag.
tag:
  - longbench
task: longbench_repobench-p
dataset_path: THUDM/LongBench
test_split: test
dataset_name: repobench-p
# Prompt template. Double-quoted on purpose: inside single quotes YAML keeps
# `\n` as a literal backslash followed by `n`, so the prompt would contain
# those two characters instead of a line break.
# `{{context}}` and `{{input}}` are template placeholders — presumably filled
# from the dataset record's fields of the same name; verify against the loader.
doc_to_text: "Please complete the code given below. \n{{context}}{{input}}Next line of code:\n"
doc_to_target: '{{answers}}'
generation_kwargs:
  # Upper bound on generated tokens; the prompt asks for one line of code.
  max_gen_toks: 64
  temperature: 1
  # NOTE(review): sampling is enabled, so scores may vary between runs —
  # confirm this is intended rather than greedy decoding.
  do_sample: true
metric_list:
  # `!function` is a custom tag; it is expected to be resolved by the
  # consuming loader to `code_sim_score` in a sibling `metrics` module.
  - metric: !function metrics.code_sim_score
    aggregation: mean
    higher_is_better: true
metadata:
  # NOTE(review): left unchanged; consider bumping if the prompt newline fix
  # alters reported scores.
  version: 1.0