{ "results": { "anli_r1": { "acc": 0.328, "acc_stderr": 0.014853842487270333 }, "anli_r2": { "acc": 0.325, "acc_stderr": 0.014818724459095527 }, "anli_r3": { "acc": 0.34, "acc_stderr": 0.013680495725767789 }, "cb": { "acc": 0.42857142857142855, "acc_stderr": 0.06672848092813058, "f1": 0.30414746543778803 }, "copa": { "acc": 0.66, "acc_stderr": 0.04760952285695237 }, "hellaswag": { "acc": 0.28141804421429994, "acc_stderr": 0.00448771884333028, "acc_norm": 0.29934276040629354, "acc_norm_stderr": 0.004570342034463229 }, "rte": { "acc": 0.5487364620938628, "acc_stderr": 0.029953149241808943 }, "winogrande": { "acc": 0.4988161010260458, "acc_stderr": 0.014052446290529019 }, "storycloze_2016": { "acc": 0.5831106360235169, "acc_stderr": 0.011401581234266751 }, "boolq": { "acc": 0.5541284403669725, "acc_stderr": 0.008693659886486843 }, "arc_easy": { "acc": 0.4065656565656566, "acc_stderr": 0.010079056419223503, "acc_norm": 0.36952861952861954, "acc_norm_stderr": 0.009904325878447317 }, "arc_challenge": { "acc": 0.18430034129692832, "acc_stderr": 0.011330517933037411, "acc_norm": 0.23122866894197952, "acc_norm_stderr": 0.012320858834772278 }, "sciq": { "acc": 0.685, "acc_stderr": 0.014696631960792496, "acc_norm": 0.595, "acc_norm_stderr": 0.015531136990453047 }, "piqa": { "acc": 0.6376496191512514, "acc_stderr": 0.011215040215104565, "acc_norm": 0.6289445048966268, "acc_norm_stderr": 0.011271222398600525 } }, "versions": { "anli_r1": 0, "anli_r2": 0, "anli_r3": 0, "cb": 1, "copa": 0, "hellaswag": 0, "rte": 0, "winogrande": 0, "storycloze_2016": 0, "boolq": 1, "arc_easy": 0, "arc_challenge": 0, "sciq": 0, "piqa": 0 } }