ChatSKKU5.8B / eval /chatskku_0_shot.json
jojo0217's picture
Upload 3 files
ed40acb
raw
history blame
No virus
1.2 kB
{
"results": {
"kobest_boolq": {
"acc": 0.5256410256410257,
"acc_stderr": 0.013331203323083502,
"macro_f1": 0.3992444490131579,
"macro_f1_stderr": 0.010971221905948464
},
"kobest_copa": {
"acc": 0.785,
"acc_stderr": 0.012997843819031832,
"macro_f1": 0.7847052615029975,
"macro_f1_stderr": 0.012967330755596378
},
"kobest_hellaswag": {
"acc": 0.466,
"acc_stderr": 0.02233126442325838,
"acc_norm": 0.592,
"acc_norm_stderr": 0.022000910893877193,
"macro_f1": 0.46440112486053614,
"macro_f1_stderr": 0.022343780241897912
},
"kobest_sentineg": {
"acc": 0.5062972292191436,
"acc_stderr": 0.02512395255890725,
"macro_f1": 0.34501683501683506,
"macro_f1_stderr": 0.01352473866949455
}
},
"versions": {
"kobest_boolq": 0,
"kobest_copa": 0,
"kobest_hellaswag": 0,
"kobest_sentineg": 0
},
"config": {
"model": "gpt2",
"model_args": "pretrained=jojo0217/ChatSKKU5.8B",
"num_fewshot": 0,
"batch_size": "4",
"device": "cuda:0",
"no_cache": true,
"limit": null,
"bootstrap_iters": 100000,
"description_dict": {}
}
}