# trec.yaml
# Task configuration for the `trec` subset of THUDM/LongBench: the model is
# shown example questions (`context`) followed by a new question (`input`)
# and asked to determine the question's type.

tag:
  - longbench
task: longbench_trec
dataset_path: THUDM/LongBench
test_split: test
dataset_name: trec

# Double-quoted so that `\n` is parsed as a real line break. In a
# single-quoted YAML scalar the backslash is literal, which would put the
# two characters `\` and `n` into the rendered prompt.
doc_to_text: "Please determine the type of the question below. Here are some examples of questions.\n\n{{context}}\n{{input}}"

# The first entry of the `answers` field is used as the reference target.
doc_to_target: '{{answers[0]}}'

# Custom tag resolved by the consuming loader; presumably points at
# `classification_score` in a sibling `metrics` module — verify it exists.
process_results: !function metrics.classification_score

generation_kwargs:
  max_gen_toks: 64
  # NOTE(review): sampling is enabled at temperature 1, so outputs are not
  # deterministic across runs — confirm this is intended for this benchmark.
  temperature: 1
  do_sample: true
  # Stop at the first real newline. This must be double-quoted: '\n' in
  # single quotes is a literal backslash followed by `n`, which would not
  # match a line break in the generated text.
  until:
    - "\n"

metric_list:
  - metric: "classification_score"
    aggregation: mean
    higher_is_better: true

metadata:
  # NOTE(review): the prompt and stop sequence now contain real newlines;
  # bump this if the project versions tasks on behavior changes.
  version: 2.0