Muennighoff's picture
Add eval
990f338
task,metric,value,err,version
anli_r1,acc,0.35,0.015090650341444233,0
anli_r2,acc,0.34,0.014987482264363937,0
anli_r3,acc,0.33166666666666667,0.013596836729485163,0
arc_challenge,acc,0.2636518771331058,0.012875929151297061,0
arc_challenge,acc_norm,0.2790102389078498,0.013106784883601345,0
arc_easy,acc,0.5656565656565656,0.010170943451269425,0
arc_easy,acc_norm,0.5404040404040404,0.010226230740889027,0
boolq,acc,0.5951070336391437,0.008585393347962315,1
cb,acc,0.44642857142857145,0.06703189227942398,1
cb,f1,0.3011143410852713,,1
copa,acc,0.75,0.04351941398892446,0
hellaswag,acc,0.4255128460466043,0.004934100774481221,0
hellaswag,acc_norm,0.5439155546703844,0.004970497804772303,0
piqa,acc,0.7295973884657236,0.010363167031620803,0
piqa,acc_norm,0.7323177366702938,0.010330111189370415,0
rte,acc,0.5487364620938628,0.029953149241808946,0
sciq,acc,0.873,0.010534798620855748,0
sciq,acc_norm,0.855,0.01113997751789013,0
storycloze_2016,acc,0.6787814003206841,0.010798029402794913,0
winogrande,acc,0.5295974743488555,0.014027843827840083,0