|
{ |
|
"best_metric": 0.2942464351654053, |
|
"best_model_checkpoint": "deberta-v3-small-Tweet_About_Disaster_Or_Not/checkpoint-286", |
|
"epoch": 5.0, |
|
"global_step": 715, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.01, |
|
"learning_rate": 1.9972027972027975e-05, |
|
"loss": 0.6828, |
|
"step": 1 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"learning_rate": 1.6000000000000003e-05, |
|
"loss": 0.4167, |
|
"step": 143 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_F1": 0.7164179104477612, |
|
"eval_Precision": 0.6536964980544747, |
|
"eval_Recall": 0.7924528301886793, |
|
"eval_accuracy": 0.8830255057167986, |
|
"eval_loss": 0.31481608748435974, |
|
"eval_runtime": 112.0574, |
|
"eval_samples_per_second": 10.147, |
|
"eval_steps_per_second": 0.161, |
|
"step": 143 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"learning_rate": 1.2e-05, |
|
"loss": 0.255, |
|
"step": 286 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_F1": 0.7452830188679244, |
|
"eval_Precision": 0.7452830188679245, |
|
"eval_Recall": 0.7452830188679245, |
|
"eval_accuracy": 0.9050131926121372, |
|
"eval_loss": 0.2942464351654053, |
|
"eval_runtime": 107.0503, |
|
"eval_samples_per_second": 10.621, |
|
"eval_steps_per_second": 0.168, |
|
"step": 286 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"learning_rate": 8.000000000000001e-06, |
|
"loss": 0.1935, |
|
"step": 429 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_F1": 0.7288135593220341, |
|
"eval_Precision": 0.6615384615384615, |
|
"eval_Recall": 0.8113207547169812, |
|
"eval_accuracy": 0.8874230430958663, |
|
"eval_loss": 0.30222010612487793, |
|
"eval_runtime": 97.6108, |
|
"eval_samples_per_second": 11.648, |
|
"eval_steps_per_second": 0.184, |
|
"step": 429 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"learning_rate": 4.000000000000001e-06, |
|
"loss": 0.1512, |
|
"step": 572 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_F1": 0.7172131147540985, |
|
"eval_Precision": 0.6340579710144928, |
|
"eval_Recall": 0.8254716981132075, |
|
"eval_accuracy": 0.8786279683377308, |
|
"eval_loss": 0.34052926301956177, |
|
"eval_runtime": 109.9221, |
|
"eval_samples_per_second": 10.344, |
|
"eval_steps_per_second": 0.164, |
|
"step": 572 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"learning_rate": 0.0, |
|
"loss": 0.1192, |
|
"step": 715 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_F1": 0.7372881355932203, |
|
"eval_Precision": 0.6692307692307692, |
|
"eval_Recall": 0.8207547169811321, |
|
"eval_accuracy": 0.8909410729991205, |
|
"eval_loss": 0.36176347732543945, |
|
"eval_runtime": 106.1779, |
|
"eval_samples_per_second": 10.708, |
|
"eval_steps_per_second": 0.17, |
|
"step": 715 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"step": 715, |
|
"total_flos": 1565044222059360.0, |
|
"train_loss": 0.2275060863761635, |
|
"train_runtime": 26600.6068, |
|
"train_samples_per_second": 1.71, |
|
"train_steps_per_second": 0.027 |
|
} |
|
], |
|
"max_steps": 715, |
|
"num_train_epochs": 5, |
|
"total_flos": 1565044222059360.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|