Unverified Commit a6c640d3 authored by Lintang Sutawika's avatar Lintang Sutawika Committed by GitHub
Browse files

Merge branch 'big-refactor' into seq2seq-refactor

parents 55eccc29 24e3e3fa
{
"results": {
"math_algebra": {
"acc": 0.0,
"acc_stderr": 0.0
},
"math_geometry": {
"acc": 0.0,
"acc_stderr": 0.0
},
"math_prealgebra": {
"acc": 0.002296211251435132,
"acc_stderr": 0.001622733136934626
},
"math_precalc": {
"acc": 0.0,
"acc_stderr": 0.0
},
"math_num_theory": {
"acc": 0.007407407407407408,
"acc_stderr": 0.003693382168437264
},
"gsm8k": {
"acc": 0.0,
"acc_stderr": 0.0
},
"math_counting_and_prob": {
"acc": 0.0,
"acc_stderr": 0.0
},
"math_intermediate_algebra": {
"acc": 0.0,
"acc_stderr": 0.0
},
"drop": {
"em": 0.014890939597315436,
"em_stderr": 0.0012403460245602655,
"f1": 0.043118708053691356,
"f1_stderr": 0.0015424950823374804
},
"mathqa": {
"acc": 0.24288107202680068,
"acc_stderr": 0.00785017752394654,
"acc_norm": 0.24623115577889448,
"acc_norm_stderr": 0.007886624866001843
}
},
"versions": {
"math_algebra": 1,
"math_geometry": 1,
"math_prealgebra": 1,
"math_precalc": 1,
"math_num_theory": 1,
"gsm8k": 0,
"math_counting_and_prob": 1,
"mathqa": 0,
"math_intermediate_algebra": 1,
"drop": 1
},
"config": {
"model": "hf-causal-experimental",
"model_args": "pretrained=bigscience/bloom-1b7,use_accelerate=True",
"num_fewshot": 5,
"batch_size": "auto",
"device": "cuda:0",
"no_cache": true,
"limit": null,
"bootstrap_iters": 100000,
"description_dict": {}
}
}
{
"results": {
"pawsx_ja": {
"acc": 0.447,
"acc_stderr": 0.011120131683767737
},
"pawsx_es": {
"acc": 0.513,
"acc_stderr": 0.011179355482070377
},
"pawsx_fr": {
"acc": 0.462,
"acc_stderr": 0.01115079235234166
},
"pawsx_de": {
"acc": 0.4875,
"acc_stderr": 0.011179640744835734
},
"pawsx_ko": {
"acc": 0.458,
"acc_stderr": 0.011143612073516636
},
"pawsx_zh": {
"acc": 0.454,
"acc_stderr": 0.0111357084193598
},
"pawsx_en": {
"acc": 0.489,
"acc_stderr": 0.011180429374603775
}
},
"versions": {
"pawsx_ja": 0,
"pawsx_es": 0,
"pawsx_fr": 0,
"pawsx_de": 0,
"pawsx_ko": 0,
"pawsx_zh": 0,
"pawsx_en": 0
},
"config": {
"model": "hf-causal-experimental",
"model_args": "pretrained=bigscience/bloom-1b7",
"num_fewshot": 0,
"batch_size": "auto",
"device": "cuda",
"no_cache": true,
"limit": null,
"bootstrap_iters": 100000,
"description_dict": {}
}
}
This diff is collapsed.
This diff is collapsed.
This diff is collapsed.
This diff is collapsed.
This diff is collapsed.
This diff is collapsed.
This diff is collapsed.
This diff is collapsed.
This diff is collapsed.
This diff is collapsed.
This diff is collapsed.
This diff is collapsed.
This diff is collapsed.
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment