cv_parser / trainer_state.json
nhanv
update
904bd0a
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 10.0,
"global_step": 910,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_accuracy": 0.9533894011551323,
"eval_f1": 0.6969990319457888,
"eval_loss": 0.20486080646514893,
"eval_precision": 0.6617647058823529,
"eval_recall": 0.7361963190184049,
"eval_runtime": 1.2373,
"eval_samples_per_second": 130.123,
"eval_steps_per_second": 33.137,
"step": 91
},
{
"epoch": 1.1,
"learning_rate": 4.4505494505494504e-05,
"loss": 0.5036,
"step": 100
},
{
"epoch": 2.0,
"eval_accuracy": 0.9722362954706657,
"eval_f1": 0.8234146341463414,
"eval_loss": 0.11564752459526062,
"eval_precision": 0.7873134328358209,
"eval_recall": 0.8629856850715747,
"eval_runtime": 1.2367,
"eval_samples_per_second": 130.181,
"eval_steps_per_second": 33.152,
"step": 182
},
{
"epoch": 2.2,
"learning_rate": 3.901098901098901e-05,
"loss": 0.1442,
"step": 200
},
{
"epoch": 3.0,
"eval_accuracy": 0.9771000101327388,
"eval_f1": 0.8632812499999999,
"eval_loss": 0.10779214650392532,
"eval_precision": 0.8261682242990654,
"eval_recall": 0.9038854805725971,
"eval_runtime": 1.2508,
"eval_samples_per_second": 128.715,
"eval_steps_per_second": 32.778,
"step": 273
},
{
"epoch": 3.3,
"learning_rate": 3.3516483516483513e-05,
"loss": 0.0757,
"step": 300
},
{
"epoch": 4.0,
"eval_accuracy": 0.9780119566318776,
"eval_f1": 0.8851148851148851,
"eval_loss": 0.1178947389125824,
"eval_precision": 0.865234375,
"eval_recall": 0.9059304703476483,
"eval_runtime": 1.2453,
"eval_samples_per_second": 129.288,
"eval_steps_per_second": 32.924,
"step": 364
},
{
"epoch": 4.4,
"learning_rate": 2.8021978021978025e-05,
"loss": 0.0526,
"step": 400
},
{
"epoch": 5.0,
"eval_accuracy": 0.9836862904042962,
"eval_f1": 0.897876643073812,
"eval_loss": 0.0906740128993988,
"eval_precision": 0.888,
"eval_recall": 0.9079754601226994,
"eval_runtime": 1.2584,
"eval_samples_per_second": 127.94,
"eval_steps_per_second": 32.581,
"step": 455
},
{
"epoch": 5.49,
"learning_rate": 2.252747252747253e-05,
"loss": 0.0342,
"step": 500
},
{
"epoch": 6.0,
"eval_accuracy": 0.9831796534603303,
"eval_f1": 0.9130869130869131,
"eval_loss": 0.0972292423248291,
"eval_precision": 0.892578125,
"eval_recall": 0.934560327198364,
"eval_runtime": 1.2748,
"eval_samples_per_second": 126.296,
"eval_steps_per_second": 32.162,
"step": 546
},
{
"epoch": 6.59,
"learning_rate": 1.7032967032967035e-05,
"loss": 0.0245,
"step": 600
},
{
"epoch": 7.0,
"eval_accuracy": 0.9833823082379167,
"eval_f1": 0.9107321965897693,
"eval_loss": 0.10643576085567474,
"eval_precision": 0.8937007874015748,
"eval_recall": 0.9284253578732107,
"eval_runtime": 1.2478,
"eval_samples_per_second": 129.031,
"eval_steps_per_second": 32.859,
"step": 637
},
{
"epoch": 7.69,
"learning_rate": 1.153846153846154e-05,
"loss": 0.0188,
"step": 700
},
{
"epoch": 8.0,
"eval_accuracy": 0.9850035464586078,
"eval_f1": 0.9169169169169169,
"eval_loss": 0.09653466939926147,
"eval_precision": 0.8980392156862745,
"eval_recall": 0.9366053169734151,
"eval_runtime": 1.2451,
"eval_samples_per_second": 129.306,
"eval_steps_per_second": 32.929,
"step": 728
},
{
"epoch": 8.79,
"learning_rate": 6.043956043956044e-06,
"loss": 0.0159,
"step": 800
},
{
"epoch": 9.0,
"eval_accuracy": 0.984598236903435,
"eval_f1": 0.9201213346814965,
"eval_loss": 0.09986742585897446,
"eval_precision": 0.91,
"eval_recall": 0.9304703476482618,
"eval_runtime": 1.2461,
"eval_samples_per_second": 129.208,
"eval_steps_per_second": 32.904,
"step": 819
},
{
"epoch": 9.89,
"learning_rate": 5.494505494505495e-07,
"loss": 0.0141,
"step": 900
},
{
"epoch": 10.0,
"eval_accuracy": 0.985104873847401,
"eval_f1": 0.911088911088911,
"eval_loss": 0.09563781321048737,
"eval_precision": 0.890625,
"eval_recall": 0.9325153374233128,
"eval_runtime": 1.2493,
"eval_samples_per_second": 128.877,
"eval_steps_per_second": 32.819,
"step": 910
},
{
"epoch": 10.0,
"step": 910,
"total_flos": 1883034567828480.0,
"train_loss": 0.09724931471295409,
"train_runtime": 322.9196,
"train_samples_per_second": 44.624,
"train_steps_per_second": 2.818
}
],
"max_steps": 910,
"num_train_epochs": 10,
"total_flos": 1883034567828480.0,
"trial_name": null,
"trial_params": null
}