File size: 1,121 Bytes
3970485 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 |
{
"results": {
"boolq": {
"acc": 0.5859327217125382,
"acc_stderr": 0.008614932353134947
},
"hellaswag": {
"acc": 0.40689105755825533,
"acc_stderr": 0.004902502514738602,
"acc_norm": 0.5210117506472814,
"acc_norm_stderr": 0.0049853735507751065
},
"arc_challenge": {
"acc": 0.26535836177474403,
"acc_stderr": 0.012902554762313967,
"acc_norm": 0.295221843003413,
"acc_norm_stderr": 0.013329750293382316
},
"arc_easy": {
"acc": 0.5896464646464646,
"acc_stderr": 0.010093531255765457,
"acc_norm": 0.5404040404040404,
"acc_norm_stderr": 0.010226230740889027
},
"sciq": {
"acc": 0.851,
"acc_stderr": 0.011266140684632175,
"acc_norm": 0.795,
"acc_norm_stderr": 0.012772554096113132
}
},
"versions": {
"boolq": 1,
"hellaswag": 0,
"arc_challenge": 0,
"arc_easy": 0,
"sciq": 0
}
} |