{ "results": { "xwinograd_en": { "acc": 0.6589247311827957, "acc_stderr": 0.009833881195698878 }, "xwinograd_pt": { "acc": 0.6007604562737643, "acc_stderr": 0.03025636835693898 }, "xwinograd_ru": { "acc": 0.49206349206349204, "acc_stderr": 0.028213077547815057 }, "xwinograd_fr": { "acc": 0.6024096385542169, "acc_stderr": 0.054045178247868114 }, "xwinograd_jp": { "acc": 0.529718456725756, "acc_stderr": 0.01612570703179889 }, "xwinograd_zh": { "acc": 0.6765873015873016, "acc_stderr": 0.020857221952855685 } }, "versions": { "xwinograd_en": 0, "xwinograd_pt": 0, "xwinograd_ru": 0, "xwinograd_fr": 0, "xwinograd_jp": 0, "xwinograd_zh": 0 }, "config": { "model": "hf-causal-experimental", "model_args": "pretrained=bigscience/bloom-560m", "num_fewshot": 0, "batch_size": "auto", "device": "cuda", "no_cache": true, "limit": null, "bootstrap_iters": 100000, "description_dict": {} } }