|
{ |
|
"results": { |
|
"anli_r1": { |
|
"acc": 0.351, |
|
"acc_stderr": 0.015100563798316405 |
|
}, |
|
"anli_r2": { |
|
"acc": 0.345, |
|
"acc_stderr": 0.015039986742055237 |
|
}, |
|
"anli_r3": { |
|
"acc": 0.345, |
|
"acc_stderr": 0.013728421539454878 |
|
}, |
|
"cb": { |
|
"acc": 0.5714285714285714, |
|
"acc_stderr": 0.06672848092813058, |
|
"f1": 0.37671957671957673 |
|
}, |
|
"copa": { |
|
"acc": 0.78, |
|
"acc_stderr": 0.04163331998932261 |
|
}, |
|
"hellaswag": { |
|
"acc": 0.4827723561043617, |
|
"acc_stderr": 0.004986818680313444, |
|
"acc_norm": 0.6446922923720374, |
|
"acc_norm_stderr": 0.004776283203468094 |
|
}, |
|
"rte": { |
|
"acc": 0.5776173285198556, |
|
"acc_stderr": 0.02973162264649588 |
|
}, |
|
"winogrande": { |
|
"acc": 0.595895816890292, |
|
"acc_stderr": 0.013791610664670845 |
|
}, |
|
"storycloze_2016": { |
|
"acc": 0.7252805986103688, |
|
"acc_stderr": 0.010322309878339507 |
|
}, |
|
"boolq": { |
|
"acc": 0.6146788990825688, |
|
"acc_stderr": 0.008511930879680652 |
|
}, |
|
"arc_easy": { |
|
"acc": 0.6300505050505051, |
|
"acc_stderr": 0.009906656266021155, |
|
"acc_norm": 0.6111111111111112, |
|
"acc_norm_stderr": 0.01000324833531377 |
|
}, |
|
"arc_challenge": { |
|
"acc": 0.30716723549488056, |
|
"acc_stderr": 0.013481034054980945, |
|
"acc_norm": 0.32337883959044367, |
|
"acc_norm_stderr": 0.013669421630012122 |
|
}, |
|
"sciq": { |
|
"acc": 0.919, |
|
"acc_stderr": 0.008632121032139978, |
|
"acc_norm": 0.907, |
|
"acc_norm_stderr": 0.009188875634996669 |
|
}, |
|
"piqa": { |
|
"acc": 0.7529923830250272, |
|
"acc_stderr": 0.010062268140772625, |
|
"acc_norm": 0.7671381936887922, |
|
"acc_norm_stderr": 0.009861236071080753 |
|
} |
|
}, |
|
"versions": { |
|
"anli_r1": 0, |
|
"anli_r2": 0, |
|
"anli_r3": 0, |
|
"cb": 1, |
|
"copa": 0, |
|
"hellaswag": 0, |
|
"rte": 0, |
|
"winogrande": 0, |
|
"storycloze_2016": 0, |
|
"boolq": 1, |
|
"arc_easy": 0, |
|
"arc_challenge": 0, |
|
"sciq": 0, |
|
"piqa": 0 |
|
} |
|
} |