o.json 1.37 KB
Newer Older
lintangsutawika's avatar
lintangsutawika committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
{
  "results": {
    "boolq-seq2seq": {
      "exact_match,none": 0.0,
      "exact_match_stderr,none": 0.0
    }
  },
  "configs": {
    "boolq-seq2seq": {
      "task": "boolq-seq2seq",
      "group": [
        "super-glue-lm-eval-v1-seq2seq"
      ],
      "dataset_path": "super_glue",
      "dataset_name": "boolq",
      "training_split": "train",
      "validation_split": "validation",
      "doc_to_text": "{{passage}}\nQuestion: {{question}}\nAnswer:",
      "doc_to_target": "{{['no', 'yes'][label]}}",
      "description": "",
      "target_delimiter": " ",
      "fewshot_delimiter": "\n\n",
      "num_fewshot": 4,
      "metric_list": [
        {
          "metric": "exact_match",
          "aggregation": "mean",
          "higher_is_better": true,
          "ignore_case": true,
          "ignore_punctuation": true
        }
      ],
      "output_type": "greedy_until",
      "generation_kwargs": {
        "until": [
          "\n\n",
          "\n"
        ],
        "do_sample": false,
        "temperature": 0.0
      },
      "repeats": 1,
      "should_decontaminate": false
    }
  },
  "versions": {
    "boolq-seq2seq": "Yaml"
  },
  "config": {
    "model": "hf",
    "model_args": "",
    "num_fewshot": 4,
    "batch_size": 1,
    "batch_sizes": [],
    "device": "cuda",
    "use_cache": null,
    "limit": 16.0,
    "bootstrap_iters": 100000
  },
  "git_hash": "ae41f67"
}