# gsm8k-cot-self-consistency.yaml
# Self-consistency variant of the GSM8K chain-of-thought task. The keys below
# are declared alongside the included base config.
# NOTE(review): how `include` merges/overrides keys is decided by the consuming
# tool and is not visible in this file — confirm.
include: gsm8k-cot.yaml
group:
  - chain_of_thought
  - self_consistency
task: gsm8k_cot_self_consistency
generation_kwargs:
  # Presumably stop sequences: the start of the next question ("Q:") or a
  # blank line (two newlines; double quotes are needed for the \n escapes).
  until:
    - "Q:"
    - "\n\n"
  # Sampling is switched on with temperature 0.2.
  do_sample: true
  temperature: 0.2
# Presumably the number of responses generated per example; it matches the
# "maj@64" filter name used in filter_list — confirm against the consumer.
repeats: 64
# Every pipeline uses the same regex, which captures the number following
# "The answer is": an optional minus sign, then digits that may contain "."
# or "," separators, ending in a digit.
filter_list:
  # Pick only the first response, and report metrics on that.
  - name: "score-first"
    filter:
      - function: "regex"
        regex_pattern: "The answer is (\\-?[0-9\\.\\,]*[0-9]+)"
      - function: "take_first"
  # Extract an answer from each response, then majority-vote over them.
  # NOTE(review): "64" in the name presumably corresponds to `repeats: 64`.
  - name: "maj@64"
    filter:
      - function: "regex"
        regex_pattern: "The answer is (\\-?[0-9\\.\\,]*[0-9]+)"
      - function: "majority_vote"
      - function: "take_first"
  # Get Maj@8 via selecting the first 8 responses.
  # Using a better estimator would be optimal.
  - name: "maj@8"
    filter:
      - function: "take_first_k"
        k: 8
      - function: "regex"
        regex_pattern: "The answer is (\\-?[0-9\\.\\,]*[0-9]+)"
      - function: "majority_vote"
      - function: "take_first"
metadata:
  # Left as the unquoted number 0.0, exactly as authored.
  # NOTE(review): quote it only if the consumer expects a string version.
  version: 0.0