{ "results": { "anli_r1": { "acc": 0.334, "acc_stderr": 0.014922019523732954 }, "anli_r2": { "acc": 0.314, "acc_stderr": 0.014683991951087974 }, "anli_r3": { "acc": 0.3416666666666667, "acc_stderr": 0.013696658778002514 }, "cb": { "acc": 0.4107142857142857, "acc_stderr": 0.06633634150359541, "f1": 0.2859744990892532 }, "copa": { "acc": 0.84, "acc_stderr": 0.0368452949177471 }, "hellaswag": { "acc": 0.5349531965743876, "acc_stderr": 0.004977574188421318, "acc_norm": 0.7157936666002789, "acc_norm_stderr": 0.004501137895230712 }, "rte": { "acc": 0.5740072202166066, "acc_stderr": 0.029764956741777652 }, "winogrande": { "acc": 0.6385161799526441, "acc_stderr": 0.013502479670791292 }, "storycloze_2016": { "acc": 0.760555852485302, "acc_stderr": 0.009868402764412846 }, "boolq": { "acc": 0.6681957186544343, "acc_stderr": 0.008235412870849404 }, "arc_easy": { "acc": 0.6877104377104377, "acc_stderr": 0.009509325983631455, "acc_norm": 0.6683501683501684, "acc_norm_stderr": 0.009660733780923952 }, "arc_challenge": { "acc": 0.3464163822525597, "acc_stderr": 0.013905011180063253, "acc_norm": 0.36006825938566556, "acc_norm_stderr": 0.014027516814585186 }, "sciq": { "acc": 0.942, "acc_stderr": 0.007395315455792948, "acc_norm": 0.935, "acc_norm_stderr": 0.007799733061832016 }, "piqa": { "acc": 0.7834602829162133, "acc_stderr": 0.009609984714384612, "acc_norm": 0.7867247007616975, "acc_norm_stderr": 0.00955712122586134 } }, "versions": { "anli_r1": 0, "anli_r2": 0, "anli_r3": 0, "cb": 1, "copa": 0, "hellaswag": 0, "rte": 0, "winogrande": 0, "storycloze_2016": 0, "boolq": 1, "arc_easy": 0, "arc_challenge": 0, "sciq": 0, "piqa": 0 } }