{ "results": { "anli_r1": { "acc": 0.333, "acc_stderr": 0.014910846164229873 }, "anli_r2": { "acc": 0.351, "acc_stderr": 0.015100563798316403 }, "anli_r3": { "acc": 0.335, "acc_stderr": 0.01363087184382148 }, "cb": { "acc": 0.39285714285714285, "acc_stderr": 0.0658538889806635, "f1": 0.27474323062558353 }, "copa": { "acc": 0.59, "acc_stderr": 0.04943110704237102 }, "hellaswag": { "acc": 0.28281218880701053, "acc_stderr": 0.004494454911844635, "acc_norm": 0.2951603266281617, "acc_norm_stderr": 0.004551826272978058 }, "rte": { "acc": 0.48375451263537905, "acc_stderr": 0.030080573208738064 }, "winogrande": { "acc": 0.49013417521704816, "acc_stderr": 0.014049749833367592 }, "storycloze_2016": { "acc": 0.564404061998931, "acc_stderr": 0.011466111817562836 }, "boolq": { "acc": 0.4938837920489297, "acc_stderr": 0.00874440068189348 }, "arc_easy": { "acc": 0.3918350168350168, "acc_stderr": 0.010016835016834962, "acc_norm": 0.3653198653198653, "acc_norm_stderr": 0.009880576614806928 }, "arc_challenge": { "acc": 0.18771331058020477, "acc_stderr": 0.01141100131415512, "acc_norm": 0.2158703071672355, "acc_norm_stderr": 0.01202297536003066 }, "sciq": { "acc": 0.692, "acc_stderr": 0.014606483127342761, "acc_norm": 0.64, "acc_norm_stderr": 0.01518652793204012 }, "piqa": { "acc": 0.6381936887921654, "acc_stderr": 0.011211397313020366, "acc_norm": 0.6207834602829162, "acc_norm_stderr": 0.011320331012905074 } }, "versions": { "anli_r1": 0, "anli_r2": 0, "anli_r3": 0, "cb": 1, "copa": 0, "hellaswag": 0, "rte": 0, "winogrande": 0, "storycloze_2016": 0, "boolq": 1, "arc_easy": 0, "arc_challenge": 0, "sciq": 0, "piqa": 0 } }