|
{ |
|
"results": { |
|
"anli_r1": { |
|
"acc": 0.357, |
|
"acc_stderr": 0.015158521721486774 |
|
}, |
|
"anli_r2": { |
|
"acc": 0.334, |
|
"acc_stderr": 0.014922019523732967 |
|
}, |
|
"anli_r3": { |
|
"acc": 0.37416666666666665, |
|
"acc_stderr": 0.01397501560175897 |
|
}, |
|
"cb": { |
|
"acc": 0.39285714285714285, |
|
"acc_stderr": 0.0658538889806635, |
|
"f1": 0.26788664379209554 |
|
}, |
|
"copa": { |
|
"acc": 0.75, |
|
"acc_stderr": 0.04351941398892446 |
|
}, |
|
"hellaswag": { |
|
"acc": 0.45339573790081655, |
|
"acc_stderr": 0.004968058944472161, |
|
"acc_norm": 0.5857398924517029, |
|
"acc_norm_stderr": 0.004915870966174404 |
|
}, |
|
"rte": { |
|
"acc": 0.4657039711191336, |
|
"acc_stderr": 0.030025579819366422 |
|
}, |
|
"winogrande": { |
|
"acc": 0.5509076558800315, |
|
"acc_stderr": 0.01397945938914086 |
|
}, |
|
"storycloze_2016": { |
|
"acc": 0.6878674505611972, |
|
"acc_stderr": 0.010715220346279681 |
|
}, |
|
"boolq": { |
|
"acc": 0.517125382262997, |
|
"acc_stderr": 0.008739923994130054 |
|
}, |
|
"arc_easy": { |
|
"acc": 0.5307239057239057, |
|
"acc_stderr": 0.010240395584815237, |
|
"acc_norm": 0.5084175084175084, |
|
"acc_norm_stderr": 0.010258329515226462 |
|
}, |
|
"arc_challenge": { |
|
"acc": 0.2568259385665529, |
|
"acc_stderr": 0.0127669237941168, |
|
"acc_norm": 0.31399317406143346, |
|
"acc_norm_stderr": 0.013562691224726297 |
|
}, |
|
"sciq": { |
|
"acc": 0.799, |
|
"acc_stderr": 0.012679107214617328, |
|
"acc_norm": 0.751, |
|
"acc_norm_stderr": 0.0136816002787023 |
|
}, |
|
"piqa": { |
|
"acc": 0.7399347116430903, |
|
"acc_stderr": 0.010234893249061303, |
|
"acc_norm": 0.7328618063112078, |
|
"acc_norm_stderr": 0.01032344049261243 |
|
} |
|
}, |
|
"versions": { |
|
"anli_r1": 0, |
|
"anli_r2": 0, |
|
"anli_r3": 0, |
|
"cb": 1, |
|
"copa": 0, |
|
"hellaswag": 0, |
|
"rte": 0, |
|
"winogrande": 0, |
|
"storycloze_2016": 0, |
|
"boolq": 1, |
|
"arc_easy": 0, |
|
"arc_challenge": 0, |
|
"sciq": 0, |
|
"piqa": 0 |
|
} |
|
} |