Muennighoff's picture
Add
9bae13a
{
"results": {
"anli_r1": {
"acc": 0.333,
"acc_stderr": 0.014910846164229873
},
"anli_r2": {
"acc": 0.351,
"acc_stderr": 0.015100563798316403
},
"anli_r3": {
"acc": 0.335,
"acc_stderr": 0.01363087184382148
},
"cb": {
"acc": 0.39285714285714285,
"acc_stderr": 0.0658538889806635,
"f1": 0.27474323062558353
},
"copa": {
"acc": 0.59,
"acc_stderr": 0.04943110704237102
},
"hellaswag": {
"acc": 0.28281218880701053,
"acc_stderr": 0.004494454911844635,
"acc_norm": 0.2951603266281617,
"acc_norm_stderr": 0.004551826272978058
},
"rte": {
"acc": 0.48375451263537905,
"acc_stderr": 0.030080573208738064
},
"winogrande": {
"acc": 0.49013417521704816,
"acc_stderr": 0.014049749833367592
},
"storycloze_2016": {
"acc": 0.564404061998931,
"acc_stderr": 0.011466111817562836
},
"boolq": {
"acc": 0.4938837920489297,
"acc_stderr": 0.00874440068189348
},
"arc_easy": {
"acc": 0.3918350168350168,
"acc_stderr": 0.010016835016834962,
"acc_norm": 0.3653198653198653,
"acc_norm_stderr": 0.009880576614806928
},
"arc_challenge": {
"acc": 0.18771331058020477,
"acc_stderr": 0.01141100131415512,
"acc_norm": 0.2158703071672355,
"acc_norm_stderr": 0.01202297536003066
},
"sciq": {
"acc": 0.692,
"acc_stderr": 0.014606483127342761,
"acc_norm": 0.64,
"acc_norm_stderr": 0.01518652793204012
},
"piqa": {
"acc": 0.6381936887921654,
"acc_stderr": 0.011211397313020366,
"acc_norm": 0.6207834602829162,
"acc_norm_stderr": 0.011320331012905074
}
},
"versions": {
"anli_r1": 0,
"anli_r2": 0,
"anli_r3": 0,
"cb": 1,
"copa": 0,
"hellaswag": 0,
"rte": 0,
"winogrande": 0,
"storycloze_2016": 0,
"boolq": 1,
"arc_easy": 0,
"arc_challenge": 0,
"sciq": 0,
"piqa": 0
}
}