|
{ |
|
"results": { |
|
"anli_r1": { |
|
"acc": 0.355, |
|
"acc_stderr": 0.01513949154378053 |
|
}, |
|
"anli_r2": { |
|
"acc": 0.359, |
|
"acc_stderr": 0.015177264224798601 |
|
}, |
|
"anli_r3": { |
|
"acc": 0.3308333333333333, |
|
"acc_stderr": 0.013588208070708992 |
|
}, |
|
"cb": { |
|
"acc": 0.48214285714285715, |
|
"acc_stderr": 0.0673769750864465, |
|
"f1": 0.3403298350824588 |
|
}, |
|
"copa": { |
|
"acc": 0.7, |
|
"acc_stderr": 0.046056618647183814 |
|
}, |
|
"hellaswag": { |
|
"acc": 0.4303923521210914, |
|
"acc_stderr": 0.004941191607317909, |
|
"acc_norm": 0.5592511451902011, |
|
"acc_norm_stderr": 0.004954622308739016 |
|
}, |
|
"rte": { |
|
"acc": 0.5451263537906137, |
|
"acc_stderr": 0.029973636495415252 |
|
}, |
|
"winogrande": { |
|
"acc": 0.5422257300710339, |
|
"acc_stderr": 0.014002284504422442 |
|
}, |
|
"storycloze_2016": { |
|
"acc": 0.689470871191876, |
|
"acc_stderr": 0.010700112173178448 |
|
}, |
|
"boolq": { |
|
"acc": 0.5856269113149847, |
|
"acc_stderr": 0.00861586377642113 |
|
}, |
|
"arc_easy": { |
|
"acc": 0.5648148148148148, |
|
"acc_stderr": 0.010173216430370927, |
|
"acc_norm": 0.5340909090909091, |
|
"acc_norm_stderr": 0.010235908103438688 |
|
}, |
|
"arc_challenge": { |
|
"acc": 0.2551194539249147, |
|
"acc_stderr": 0.012739038695202098, |
|
"acc_norm": 0.2858361774744027, |
|
"acc_norm_stderr": 0.013203196088537369 |
|
}, |
|
"sciq": { |
|
"acc": 0.862, |
|
"acc_stderr": 0.010912152632504411, |
|
"acc_norm": 0.796, |
|
"acc_norm_stderr": 0.012749374359024391 |
|
}, |
|
"piqa": { |
|
"acc": 0.7328618063112078, |
|
"acc_stderr": 0.010323440492612426, |
|
"acc_norm": 0.73449401523395, |
|
"acc_norm_stderr": 0.010303308653024432 |
|
} |
|
}, |
|
"versions": { |
|
"anli_r1": 0, |
|
"anli_r2": 0, |
|
"anli_r3": 0, |
|
"cb": 1, |
|
"copa": 0, |
|
"hellaswag": 0, |
|
"rte": 0, |
|
"winogrande": 0, |
|
"storycloze_2016": 0, |
|
"boolq": 1, |
|
"arc_easy": 0, |
|
"arc_challenge": 0, |
|
"sciq": 0, |
|
"piqa": 0 |
|
} |
|
} |