ChatSKKU5.8B / eval /koalpaca_0_shot.json
jojo0217's picture
Upload 3 files
ed40acb
raw
history blame
1.21 kB
{
"results": {
"kobest_boolq": {
"acc": 0.5626780626780626,
"acc_stderr": 0.013243469872682661,
"macro_f1": 0.5053421868652208,
"macro_f1_stderr": 0.013395027664000827
},
"kobest_copa": {
"acc": 0.698,
"acc_stderr": 0.014526080235459544,
"macro_f1": 0.6977279551596436,
"macro_f1_stderr": 0.014458551946793323
},
"kobest_hellaswag": {
"acc": 0.384,
"acc_stderr": 0.021772369465547194,
"acc_norm": 0.462,
"acc_norm_stderr": 0.022318338119870537,
"macro_f1": 0.3834926136948366,
"macro_f1_stderr": 0.02180403516376896
},
"kobest_sentineg": {
"acc": 0.3879093198992443,
"acc_stderr": 0.024486425812624234,
"macro_f1": 0.38484935437589674,
"macro_f1_stderr": 0.024320271236487046
}
},
"versions": {
"kobest_boolq": 0,
"kobest_copa": 0,
"kobest_hellaswag": 0,
"kobest_sentineg": 0
},
"config": {
"model": "gpt2",
"model_args": "pretrained=beomi/KoAlpaca-Polyglot-5.8B",
"num_fewshot": 0,
"batch_size": "4",
"device": "cuda:0",
"no_cache": true,
"limit": null,
"bootstrap_iters": 100000,
"description_dict": {}
}
}