|
{ |
|
"results": { |
|
"anli_r1": { |
|
"acc": 0.319, |
|
"acc_stderr": 0.014746404865473486 |
|
}, |
|
"anli_r2": { |
|
"acc": 0.33, |
|
"acc_stderr": 0.01487687202745673 |
|
}, |
|
"anli_r3": { |
|
"acc": 0.32, |
|
"acc_stderr": 0.013471620929769142 |
|
}, |
|
"cb": { |
|
"acc": 0.42857142857142855, |
|
"acc_stderr": 0.06672848092813058, |
|
"f1": 0.3049446887911502 |
|
}, |
|
"copa": { |
|
"acc": 0.82, |
|
"acc_stderr": 0.038612291966536955 |
|
}, |
|
"hellaswag": { |
|
"acc": 0.5259908384783908, |
|
"acc_stderr": 0.004983035420235712, |
|
"acc_norm": 0.7002589125672177, |
|
"acc_norm_stderr": 0.004572081656965643 |
|
}, |
|
"rte": { |
|
"acc": 0.5812274368231047, |
|
"acc_stderr": 0.02969666108123484 |
|
}, |
|
"winogrande": { |
|
"acc": 0.6266771902131019, |
|
"acc_stderr": 0.013594002763035516 |
|
}, |
|
"storycloze_2016": { |
|
"acc": 0.7616247995724211, |
|
"acc_stderr": 0.009853267441685421 |
|
}, |
|
"boolq": { |
|
"acc": 0.6590214067278287, |
|
"acc_stderr": 0.00829097981816109 |
|
}, |
|
"arc_easy": { |
|
"acc": 0.6784511784511784, |
|
"acc_stderr": 0.00958409157564062, |
|
"acc_norm": 0.6607744107744108, |
|
"acc_norm_stderr": 0.00971491720776585 |
|
}, |
|
"arc_challenge": { |
|
"acc": 0.33276450511945393, |
|
"acc_stderr": 0.01376986304619231, |
|
"acc_norm": 0.3643344709897611, |
|
"acc_norm_stderr": 0.014063260279882415 |
|
}, |
|
"sciq": { |
|
"acc": 0.93, |
|
"acc_stderr": 0.008072494358323499, |
|
"acc_norm": 0.91, |
|
"acc_norm_stderr": 0.009054390204866442 |
|
}, |
|
"piqa": { |
|
"acc": 0.7780195865070729, |
|
"acc_stderr": 0.009696120744662019, |
|
"acc_norm": 0.7872687704026116, |
|
"acc_norm_stderr": 0.009548223123047352 |
|
} |
|
}, |
|
"versions": { |
|
"anli_r1": 0, |
|
"anli_r2": 0, |
|
"anli_r3": 0, |
|
"cb": 1, |
|
"copa": 0, |
|
"hellaswag": 0, |
|
"rte": 0, |
|
"winogrande": 0, |
|
"storycloze_2016": 0, |
|
"boolq": 1, |
|
"arc_easy": 0, |
|
"arc_challenge": 0, |
|
"sciq": 0, |
|
"piqa": 0 |
|
} |
|
} |