|
{ |
|
"results": { |
|
"anli_r1": { |
|
"acc": 0.293, |
|
"acc_stderr": 0.014399942998441271 |
|
}, |
|
"anli_r2": { |
|
"acc": 0.327, |
|
"acc_stderr": 0.01484221315341124 |
|
}, |
|
"anli_r3": { |
|
"acc": 0.3383333333333333, |
|
"acc_stderr": 0.013664144006618275 |
|
}, |
|
"cb": { |
|
"acc": 0.32142857142857145, |
|
"acc_stderr": 0.06297362289056341, |
|
"f1": 0.2706949089557785 |
|
}, |
|
"copa": { |
|
"acc": 0.77, |
|
"acc_stderr": 0.042295258468165065 |
|
}, |
|
"hellaswag": { |
|
"acc": 0.5265883290181239, |
|
"acc_stderr": 0.0049827214724073405, |
|
"acc_norm": 0.7029476199960167, |
|
"acc_norm_stderr": 0.00456025908319738 |
|
}, |
|
"rte": { |
|
"acc": 0.5595667870036101, |
|
"acc_stderr": 0.029882123363118723 |
|
}, |
|
"winogrande": { |
|
"acc": 0.6243093922651933, |
|
"acc_stderr": 0.013611257508380444 |
|
}, |
|
"storycloze_2016": { |
|
"acc": 0.7413148049171566, |
|
"acc_stderr": 0.010126662138021714 |
|
}, |
|
"boolq": { |
|
"acc": 0.6669724770642201, |
|
"acc_stderr": 0.00824302391268888 |
|
}, |
|
"arc_easy": { |
|
"acc": 0.6759259259259259, |
|
"acc_stderr": 0.009603728850095394, |
|
"acc_norm": 0.640993265993266, |
|
"acc_norm_stderr": 0.009843424713072176 |
|
}, |
|
"arc_challenge": { |
|
"acc": 0.33447098976109213, |
|
"acc_stderr": 0.013787460322441384, |
|
"acc_norm": 0.3438566552901024, |
|
"acc_norm_stderr": 0.01388064457015621 |
|
}, |
|
"sciq": { |
|
"acc": 0.928, |
|
"acc_stderr": 0.008178195576218681, |
|
"acc_norm": 0.911, |
|
"acc_norm_stderr": 0.009008893392651523 |
|
}, |
|
"piqa": { |
|
"acc": 0.7763873775843307, |
|
"acc_stderr": 0.009721489519176294, |
|
"acc_norm": 0.7883569096844396, |
|
"acc_norm_stderr": 0.009530351270479392 |
|
} |
|
}, |
|
"versions": { |
|
"anli_r1": 0, |
|
"anli_r2": 0, |
|
"anli_r3": 0, |
|
"cb": 1, |
|
"copa": 0, |
|
"hellaswag": 0, |
|
"rte": 0, |
|
"winogrande": 0, |
|
"storycloze_2016": 0, |
|
"boolq": 1, |
|
"arc_easy": 0, |
|
"arc_challenge": 0, |
|
"sciq": 0, |
|
"piqa": 0 |
|
} |
|
} |