|
{ |
|
"best_metric": 0.2557324171066284, |
|
"best_model_checkpoint": "distilbert-base-uncased-Tweet_About_Disaster_Or_Not/checkpoint-429", |
|
"epoch": 5.0, |
|
"global_step": 715, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.01, |
|
"learning_rate": 1.9972027972027975e-05, |
|
"loss": 0.6649, |
|
"step": 1 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"learning_rate": 1.6000000000000003e-05, |
|
"loss": 0.3734, |
|
"step": 143 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_F1": 0.7404063205417606, |
|
"eval_Precision": 0.6919831223628692, |
|
"eval_Recall": 0.7961165048543689, |
|
"eval_accuracy": 0.8988566402814424, |
|
"eval_loss": 0.2855009436607361, |
|
"eval_runtime": 32.5504, |
|
"eval_samples_per_second": 34.93, |
|
"eval_steps_per_second": 0.553, |
|
"step": 143 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"learning_rate": 1.2e-05, |
|
"loss": 0.2466, |
|
"step": 286 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_F1": 0.7381974248927039, |
|
"eval_Precision": 0.6615384615384615, |
|
"eval_Recall": 0.8349514563106796, |
|
"eval_accuracy": 0.8927000879507476, |
|
"eval_loss": 0.255790650844574, |
|
"eval_runtime": 32.1564, |
|
"eval_samples_per_second": 35.358, |
|
"eval_steps_per_second": 0.56, |
|
"step": 286 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"learning_rate": 8.000000000000001e-06, |
|
"loss": 0.1723, |
|
"step": 429 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_F1": 0.7752293577981653, |
|
"eval_Precision": 0.7347826086956522, |
|
"eval_Recall": 0.8203883495145631, |
|
"eval_accuracy": 0.9138082673702727, |
|
"eval_loss": 0.2557324171066284, |
|
"eval_runtime": 32.7041, |
|
"eval_samples_per_second": 34.766, |
|
"eval_steps_per_second": 0.55, |
|
"step": 429 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"learning_rate": 4.000000000000001e-06, |
|
"loss": 0.1292, |
|
"step": 572 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_F1": 0.7741935483870966, |
|
"eval_Precision": 0.7368421052631579, |
|
"eval_Recall": 0.8155339805825242, |
|
"eval_accuracy": 0.9138082673702727, |
|
"eval_loss": 0.27726978063583374, |
|
"eval_runtime": 31.6616, |
|
"eval_samples_per_second": 35.911, |
|
"eval_steps_per_second": 0.569, |
|
"step": 572 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"learning_rate": 0.0, |
|
"loss": 0.0913, |
|
"step": 715 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_F1": 0.7759815242494226, |
|
"eval_Precision": 0.7400881057268722, |
|
"eval_Recall": 0.8155339805825242, |
|
"eval_accuracy": 0.9146877748460862, |
|
"eval_loss": 0.300839364528656, |
|
"eval_runtime": 62.0482, |
|
"eval_samples_per_second": 18.324, |
|
"eval_steps_per_second": 0.29, |
|
"step": 715 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"step": 715, |
|
"total_flos": 494206887142080.0, |
|
"train_loss": 0.20296044624768772, |
|
"train_runtime": 4241.2382, |
|
"train_samples_per_second": 10.723, |
|
"train_steps_per_second": 0.169 |
|
} |
|
], |
|
"max_steps": 715, |
|
"num_train_epochs": 5, |
|
"total_flos": 494206887142080.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|