|
{ |
|
"best_metric": 0.9592657342657342, |
|
"best_model_checkpoint": "output-no-git/EN-OUTPUT/ON_FS_OUT/XLNetFalseTrue-0-1/FalseTrue-0/train_from_dev_and_test.csv/0/checkpoint-81", |
|
"epoch": 9.0, |
|
"global_step": 81, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.8583691120147705, |
|
"eval_f1": 0.8558168316831684, |
|
"eval_f1_binary": 0.8750000000000001, |
|
"eval_f1_weighted": 0.8600157226023032, |
|
"eval_loss": 0.336619108915329, |
|
"eval_runtime": 1.8593, |
|
"eval_samples_per_second": 250.638, |
|
"eval_steps_per_second": 31.733, |
|
"step": 9 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.8712446093559265, |
|
"eval_f1": 0.8563619924379419, |
|
"eval_f1_binary": 0.9025974025974026, |
|
"eval_f1_weighted": 0.8664821895114718, |
|
"eval_loss": 0.28895148634910583, |
|
"eval_runtime": 1.8336, |
|
"eval_samples_per_second": 254.149, |
|
"eval_steps_per_second": 32.178, |
|
"step": 18 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.946351945400238, |
|
"eval_f1": 0.9442250149611011, |
|
"eval_f1_binary": 0.9551166965888689, |
|
"eval_f1_weighted": 0.946609031111385, |
|
"eval_loss": 0.17678162455558777, |
|
"eval_runtime": 1.8406, |
|
"eval_samples_per_second": 253.179, |
|
"eval_steps_per_second": 32.055, |
|
"step": 27 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.9484978318214417, |
|
"eval_f1": 0.9456876456876457, |
|
"eval_f1_binary": 0.9580419580419581, |
|
"eval_f1_weighted": 0.9483918084776456, |
|
"eval_loss": 0.18410657346248627, |
|
"eval_runtime": 1.8296, |
|
"eval_samples_per_second": 254.697, |
|
"eval_steps_per_second": 32.247, |
|
"step": 36 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.9399141669273376, |
|
"eval_f1": 0.9357975122028027, |
|
"eval_f1_binary": 0.952054794520548, |
|
"eval_f1_weighted": 0.9393559731393049, |
|
"eval_loss": 0.23064567148685455, |
|
"eval_runtime": 1.9476, |
|
"eval_samples_per_second": 239.272, |
|
"eval_steps_per_second": 30.294, |
|
"step": 45 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.959227442741394, |
|
"eval_f1": 0.9571332432811903, |
|
"eval_f1_binary": 0.9666080843585237, |
|
"eval_f1_weighted": 0.9592071355341688, |
|
"eval_loss": 0.1858169287443161, |
|
"eval_runtime": 1.8406, |
|
"eval_samples_per_second": 253.182, |
|
"eval_steps_per_second": 32.055, |
|
"step": 54 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_accuracy": 0.9570815563201904, |
|
"eval_f1": 0.9550097511054471, |
|
"eval_f1_binary": 0.9646643109540636, |
|
"eval_f1_weighted": 0.9571229809435562, |
|
"eval_loss": 0.19335472583770752, |
|
"eval_runtime": 1.8323, |
|
"eval_samples_per_second": 254.327, |
|
"eval_steps_per_second": 32.2, |
|
"step": 63 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.954935610294342, |
|
"eval_f1": 0.9527143581938102, |
|
"eval_f1_binary": 0.962962962962963, |
|
"eval_f1_weighted": 0.9549576150316936, |
|
"eval_loss": 0.20666901767253876, |
|
"eval_runtime": 1.8259, |
|
"eval_samples_per_second": 255.216, |
|
"eval_steps_per_second": 32.313, |
|
"step": 72 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_accuracy": 0.9613733887672424, |
|
"eval_f1": 0.9592657342657342, |
|
"eval_f1_binary": 0.9685314685314687, |
|
"eval_f1_weighted": 0.9612938563582343, |
|
"eval_loss": 0.21665425598621368, |
|
"eval_runtime": 1.8426, |
|
"eval_samples_per_second": 252.897, |
|
"eval_steps_per_second": 32.019, |
|
"step": 81 |
|
} |
|
], |
|
"max_steps": 81, |
|
"num_train_epochs": 9, |
|
"total_flos": 180756537375744.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|