{ "results": { "boolq-seq2seq": { "exact_match,none": 0.0, "exact_match_stderr,none": 0.0 } }, "configs": { "boolq-seq2seq": { "task": "boolq-seq2seq", "group": [ "super-glue-lm-eval-v1-seq2seq" ], "dataset_path": "super_glue", "dataset_name": "boolq", "training_split": "train", "validation_split": "validation", "doc_to_text": "{{passage}}\nQuestion: {{question}}\nAnswer:", "doc_to_target": "{{['no', 'yes'][label]}}", "description": "", "target_delimiter": " ", "fewshot_delimiter": "\n\n", "num_fewshot": 4, "metric_list": [ { "metric": "exact_match", "aggregation": "mean", "higher_is_better": true, "ignore_case": true, "ignore_punctuation": true } ], "output_type": "greedy_until", "generation_kwargs": { "until": [ "\n\n", "\n" ], "do_sample": false, "temperature": 0.0 }, "repeats": 1, "should_decontaminate": false } }, "versions": { "boolq-seq2seq": "Yaml" }, "config": { "model": "hf", "model_args": "", "num_fewshot": 4, "batch_size": 1, "batch_sizes": [], "device": "cuda", "use_cache": null, "limit": 16.0, "bootstrap_iters": 100000 }, "git_hash": "ae41f67" }