lm1-4b2-84b-c4-repetitions
/
4b284b12bc4
/evaluation
/4b284b12bc4_5_lm-eval_global_step80108_2023-01-30-11-26-32_5shots_backup.json
{ | |
"results": { | |
"anli_r1": { | |
"acc": 0.332, | |
"acc_stderr": 0.014899597242811487 | |
}, | |
"anli_r2": { | |
"acc": 0.329, | |
"acc_stderr": 0.014865395385928357 | |
}, | |
"anli_r3": { | |
"acc": 0.3541666666666667, | |
"acc_stderr": 0.013811933499570954 | |
}, | |
"cb": { | |
"acc": 0.5535714285714286, | |
"acc_stderr": 0.06703189227942395, | |
"f1": 0.38376730002345766 | |
}, | |
"copa": { | |
"acc": 0.81, | |
"acc_stderr": 0.03942772444036623 | |
}, | |
"hellaswag": { | |
"acc": 0.47400916152160927, | |
"acc_stderr": 0.004983035420235716, | |
"acc_norm": 0.619896434973113, | |
"acc_norm_stderr": 0.004844199910173026 | |
}, | |
"rte": { | |
"acc": 0.516245487364621, | |
"acc_stderr": 0.030080573208738064 | |
}, | |
"winogrande": { | |
"acc": 0.5722178374112076, | |
"acc_stderr": 0.013905134013839944 | |
}, | |
"storycloze_2016": { | |
"acc": 0.7177979690005345, | |
"acc_stderr": 0.010407834479647675 | |
}, | |
"boolq": { | |
"acc": 0.5648318042813456, | |
"acc_stderr": 0.008671229580582118 | |
}, | |
"arc_easy": { | |
"acc": 0.5997474747474747, | |
"acc_stderr": 0.010053550119896127, | |
"acc_norm": 0.569023569023569, | |
"acc_norm_stderr": 0.010161552863493746 | |
} | |
}, | |
"versions": { | |
"anli_r1": 0, | |
"anli_r2": 0, | |
"anli_r3": 0, | |
"cb": 1, | |
"copa": 0, | |
"hellaswag": 0, | |
"rte": 0, | |
"winogrande": 0, | |
"storycloze_2016": 0, | |
"boolq": 1, | |
"arc_easy": 0 | |
} | |
} |