{ "results": { "anli_r1": { "acc": 0.324, "acc_stderr": 0.01480686473373886 }, "anli_r2": { "acc": 0.33, "acc_stderr": 0.014876872027456732 }, "anli_r3": { "acc": 0.3258333333333333, "acc_stderr": 0.013535422043417454 }, "cb": { "acc": 0.4107142857142857, "acc_stderr": 0.0663363415035954, "f1": 0.27708333333333335 }, "copa": { "acc": 0.82, "acc_stderr": 0.038612291966536955 }, "hellaswag": { "acc": 0.5340569607647879, "acc_stderr": 0.0049781928934062745, "acc_norm": 0.716391157140012, "acc_norm_stderr": 0.0044982802444945074 }, "rte": { "acc": 0.5703971119133574, "acc_stderr": 0.02979666882912467 }, "winogrande": { "acc": 0.6345698500394633, "acc_stderr": 0.013533965097638788 }, "storycloze_2016": { "acc": 0.7594869053981828, "acc_stderr": 0.009883453084862687 }, "boolq": { "acc": 0.6629969418960244, "acc_stderr": 0.008267329046329363 }, "arc_easy": { "acc": 0.6957070707070707, "acc_stderr": 0.009441202922359185, "acc_norm": 0.6712962962962963, "acc_norm_stderr": 0.009638903167022168 }, "arc_challenge": { "acc": 0.3455631399317406, "acc_stderr": 0.013896938461145687, "acc_norm": 0.3643344709897611, "acc_norm_stderr": 0.014063260279882413 }, "sciq": { "acc": 0.946, "acc_stderr": 0.007150883521295435, "acc_norm": 0.942, "acc_norm_stderr": 0.007395315455792937 }, "piqa": { "acc": 0.7758433079434167, "acc_stderr": 0.00972989795641006, "acc_norm": 0.7861806311207835, "acc_norm_stderr": 0.009565994206915607 } }, "versions": { "anli_r1": 0, "anli_r2": 0, "anli_r3": 0, "cb": 1, "copa": 0, "hellaswag": 0, "rte": 0, "winogrande": 0, "storycloze_2016": 0, "boolq": 1, "arc_easy": 0, "arc_challenge": 0, "sciq": 0, "piqa": 0 } }