Muennighoff's picture
A
eb2a9c4
task,metric,value,err,version
anli_r1,acc,0.337,0.014955087918653605,0
anli_r2,acc,0.339,0.014976758771620344,0
anli_r3,acc,0.3308333333333333,0.013588208070708986,0
arc_challenge,acc,0.2645051194539249,0.012889272949313366,0
arc_challenge,acc_norm,0.29180887372013653,0.013284525292403501,0
arc_easy,acc,0.5963804713804713,0.010067368960348226,0
arc_easy,acc_norm,0.5340909090909091,0.010235908103438687,0
boolq,acc,0.6125382262996942,0.00852066653613694,1
cb,acc,0.4107142857142857,0.0663363415035954,1
cb,f1,0.1940928270042194,,1
copa,acc,0.73,0.0446196043338474,0
hellaswag,acc,0.43706432981477794,0.00495009555596467,0
hellaswag,acc_norm,0.5617406891057558,0.004951594063272048,0
piqa,acc,0.719804134929271,0.010478122015577082,0
piqa,acc_norm,0.720892274211099,0.010465657948498233,0
rte,acc,0.5126353790613718,0.030086851767188564,0
sciq,acc,0.827,0.011967214137559933,0
sciq,acc_norm,0.751,0.013681600278702301,0
storycloze_2016,acc,0.7076429716729022,0.010518239729787741,0
winogrande,acc,0.5808997632202052,0.013867325192210117,0