{ "results": { "cb": { "acc,none": 0.5, "acc_stderr,none": 0.5, "f1,none": 0.2222222222222222 } }, "configs": { "cb": { "task": "cb", "group": [ "super-glue-lm-eval-v1" ], "dataset_path": "super_glue", "dataset_name": "cb", "training_split": "train", "validation_split": "validation", "doc_to_text": "{{premise}}\nQuestion: {{hypothesis}}. True, False, or Neither?\nAnswer:", "doc_to_target": "label", "doc_to_choice": [ "True", "False", "Neither" ], "description": "", "target_delimiter": " ", "fewshot_delimiter": "\n\n", "num_fewshot": 4, "metric_list": [ { "metric": "acc" }, { "metric": "f1", "aggregation": "" } ], "output_type": "multiple_choice", "repeats": 1, "should_decontaminate": false } }, "versions": { "cb": "Yaml" }, "config": { "model": "hf", "model_args": "", "num_fewshot": 4, "batch_size": 1, "batch_sizes": [], "device": null, "use_cache": null, "limit": 2.0, "bootstrap_iters": 100000 }, "git_hash": "656c310" }