cb.json 1.25 KB
Newer Older
lintangsutawika's avatar
lintangsutawika committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
{
  "results": {
    "cb": {
      "acc,none": 0.5,
      "acc_stderr,none": 0.5,
      "f1,none": 0.2222222222222222
    }
  },
  "configs": {
    "cb": {
      "task": "cb",
      "group": [
        "super-glue-lm-eval-v1"
      ],
      "dataset_path": "super_glue",
      "dataset_name": "cb",
      "training_split": "train",
      "validation_split": "validation",
      "doc_to_text": "{{premise}}\nQuestion: {{hypothesis}}. True, False, or Neither?\nAnswer:",
      "doc_to_target": "label",
      "doc_to_choice": [
        "True",
        "False",
        "Neither"
      ],
      "description": "",
      "target_delimiter": " ",
      "fewshot_delimiter": "\n\n",
      "num_fewshot": 4,
      "metric_list": [
        {
          "metric": "acc"
        },
        {
          "metric": "f1",
          "aggregation": "<function cb_multi_fi at 0x7f3212743d30>"
        }
      ],
      "output_type": "multiple_choice",
      "repeats": 1,
      "should_decontaminate": false
    }
  },
  "versions": {
    "cb": "Yaml"
  },
  "config": {
    "model": "hf",
    "model_args": "",
    "num_fewshot": 4,
    "batch_size": 1,
    "batch_sizes": [],
    "device": null,
    "use_cache": null,
    "limit": 2.0,
    "bootstrap_iters": 100000
  },
  "git_hash": "656c310"
}