SecBERT-CyNER / trainer_state.json
Anonymous
Upload folder using huggingface_hub
3566be9
{
"best_metric": 0.12117183208465576,
"best_model_checkpoint": "/content/cyner_secbert/checkpoint-500",
"epoch": 10.0,
"eval_steps": 500,
"global_step": 3520,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.42,
"learning_rate": 1.715909090909091e-05,
"loss": 0.165,
"step": 500
},
{
"epoch": 1.42,
"eval_accuracy": 0.9723376956633307,
"eval_f1": 0.6189111747851002,
"eval_loss": 0.12117183208465576,
"eval_precision": 0.7047308319738989,
"eval_recall": 0.5517241379310345,
"eval_runtime": 2.5587,
"eval_samples_per_second": 317.348,
"eval_steps_per_second": 39.864,
"step": 500
},
{
"epoch": 2.84,
"learning_rate": 1.431818181818182e-05,
"loss": 0.04,
"step": 1000
},
{
"epoch": 2.84,
"eval_accuracy": 0.970490120605594,
"eval_f1": 0.5904761904761905,
"eval_loss": 0.16471919417381287,
"eval_precision": 0.6924398625429553,
"eval_recall": 0.5146871008939975,
"eval_runtime": 1.9792,
"eval_samples_per_second": 410.273,
"eval_steps_per_second": 51.537,
"step": 1000
},
{
"epoch": 4.26,
"learning_rate": 1.1477272727272729e-05,
"loss": 0.0156,
"step": 1500
},
{
"epoch": 4.26,
"eval_accuracy": 0.9713625866050808,
"eval_f1": 0.5977175463623395,
"eval_loss": 0.18028192222118378,
"eval_precision": 0.6768982229402262,
"eval_recall": 0.5351213282247765,
"eval_runtime": 2.4993,
"eval_samples_per_second": 324.895,
"eval_steps_per_second": 40.812,
"step": 1500
},
{
"epoch": 5.68,
"learning_rate": 8.636363636363637e-06,
"loss": 0.0087,
"step": 2000
},
{
"epoch": 5.68,
"eval_accuracy": 0.9713112650756992,
"eval_f1": 0.5938375350140056,
"eval_loss": 0.1866268515586853,
"eval_precision": 0.6573643410852713,
"eval_recall": 0.541507024265645,
"eval_runtime": 2.0145,
"eval_samples_per_second": 403.074,
"eval_steps_per_second": 50.632,
"step": 2000
},
{
"epoch": 7.1,
"learning_rate": 5.795454545454546e-06,
"loss": 0.0036,
"step": 2500
},
{
"epoch": 7.1,
"eval_accuracy": 0.9719271234282781,
"eval_f1": 0.6052076002814919,
"eval_loss": 0.20198111236095428,
"eval_precision": 0.6739811912225705,
"eval_recall": 0.5491698595146871,
"eval_runtime": 2.4675,
"eval_samples_per_second": 329.073,
"eval_steps_per_second": 41.337,
"step": 2500
},
{
"epoch": 8.52,
"learning_rate": 2.954545454545455e-06,
"loss": 0.0024,
"step": 3000
},
{
"epoch": 8.52,
"eval_accuracy": 0.9720297664870413,
"eval_f1": 0.6080892608089261,
"eval_loss": 0.20356133580207825,
"eval_precision": 0.6697388632872504,
"eval_recall": 0.5568326947637292,
"eval_runtime": 2.5877,
"eval_samples_per_second": 313.797,
"eval_steps_per_second": 39.418,
"step": 3000
},
{
"epoch": 9.94,
"learning_rate": 1.1363636363636364e-07,
"loss": 0.0018,
"step": 3500
},
{
"epoch": 9.94,
"eval_accuracy": 0.971465229663844,
"eval_f1": 0.6036414565826329,
"eval_loss": 0.20842024683952332,
"eval_precision": 0.6682170542635659,
"eval_recall": 0.5504469987228607,
"eval_runtime": 1.9903,
"eval_samples_per_second": 407.98,
"eval_steps_per_second": 51.249,
"step": 3500
},
{
"epoch": 10.0,
"step": 3520,
"total_flos": 507181396306572.0,
"train_loss": 0.03371541356159882,
"train_runtime": 327.9315,
"train_samples_per_second": 85.689,
"train_steps_per_second": 10.734
}
],
"logging_steps": 500,
"max_steps": 3520,
"num_train_epochs": 10,
"save_steps": 500,
"total_flos": 507181396306572.0,
"trial_name": null,
"trial_params": null
}