ChatSKKU5.8B / eval /kullm_0_shot.json
jojo0217's picture
Upload 3 files
ed40acb
raw
history blame
No virus
1.21 kB
{
"results": {
"kobest_boolq": {
"acc": 0.5028490028490028,
"acc_stderr": 0.013348550797680814,
"macro_f1": 0.3371320037986705,
"macro_f1_stderr": 0.006306119104194062
},
"kobest_copa": {
"acc": 0.766,
"acc_stderr": 0.013394902889660007,
"macro_f1": 0.7652638674884438,
"macro_f1_stderr": 0.01339434219317699
},
"kobest_hellaswag": {
"acc": 0.444,
"acc_stderr": 0.02224224437573102,
"acc_norm": 0.552,
"acc_norm_stderr": 0.02226169729227013,
"macro_f1": 0.4425279610634302,
"macro_f1_stderr": 0.02226671964725493
},
"kobest_sentineg": {
"acc": 0.5037783375314862,
"acc_stderr": 0.025125227983562776,
"macro_f1": 0.33500837520938026,
"macro_f1_stderr": 0.011139659523368081
}
},
"versions": {
"kobest_boolq": 0,
"kobest_copa": 0,
"kobest_hellaswag": 0,
"kobest_sentineg": 0
},
"config": {
"model": "gpt2",
"model_args": "pretrained=nlpai-lab/kullm-polyglot-5.8b-v2",
"num_fewshot": 0,
"batch_size": "2",
"device": "cuda:0",
"no_cache": true,
"limit": null,
"bootstrap_iters": 100000,
"description_dict": {}
}
}