|
{ |
|
"best_metric": 0.6578601002693176, |
|
"best_model_checkpoint": "hBERTv2_new_no_pretrain_qqp/checkpoint-14215", |
|
"epoch": 10.0, |
|
"global_step": 28430, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"learning_rate": 0.0004900105522335561, |
|
"loss": 0.6669, |
|
"step": 2843 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.6318327974276527, |
|
"eval_combined_score": 0.3159163987138264, |
|
"eval_f1": 0.0, |
|
"eval_loss": 0.6595353484153748, |
|
"eval_runtime": 67.7356, |
|
"eval_samples_per_second": 596.88, |
|
"eval_steps_per_second": 4.665, |
|
"step": 2843 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"learning_rate": 0.0004800105522335561, |
|
"loss": 0.6591, |
|
"step": 5686 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.6318327974276527, |
|
"eval_combined_score": 0.3159163987138264, |
|
"eval_f1": 0.0, |
|
"eval_loss": 0.6586501598358154, |
|
"eval_runtime": 67.7263, |
|
"eval_samples_per_second": 596.962, |
|
"eval_steps_per_second": 4.666, |
|
"step": 5686 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"learning_rate": 0.0004700105522335561, |
|
"loss": 0.6589, |
|
"step": 8529 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.6318327974276527, |
|
"eval_combined_score": 0.3159163987138264, |
|
"eval_f1": 0.0, |
|
"eval_loss": 0.6581756472587585, |
|
"eval_runtime": 67.7959, |
|
"eval_samples_per_second": 596.348, |
|
"eval_steps_per_second": 4.661, |
|
"step": 8529 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"learning_rate": 0.0004600140696447415, |
|
"loss": 0.6587, |
|
"step": 11372 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.6318327974276527, |
|
"eval_combined_score": 0.3159163987138264, |
|
"eval_f1": 0.0, |
|
"eval_loss": 0.6579899787902832, |
|
"eval_runtime": 67.7187, |
|
"eval_samples_per_second": 597.028, |
|
"eval_steps_per_second": 4.666, |
|
"step": 11372 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"learning_rate": 0.0004500175870559268, |
|
"loss": 0.6586, |
|
"step": 14215 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.6318327974276527, |
|
"eval_combined_score": 0.3159163987138264, |
|
"eval_f1": 0.0, |
|
"eval_loss": 0.6578601002693176, |
|
"eval_runtime": 67.6584, |
|
"eval_samples_per_second": 597.561, |
|
"eval_steps_per_second": 4.671, |
|
"step": 14215 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"learning_rate": 0.0004400211044671122, |
|
"loss": 0.6586, |
|
"step": 17058 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.6318327974276527, |
|
"eval_combined_score": 0.3159163987138264, |
|
"eval_f1": 0.0, |
|
"eval_loss": 0.6580154895782471, |
|
"eval_runtime": 67.6879, |
|
"eval_samples_per_second": 597.3, |
|
"eval_steps_per_second": 4.668, |
|
"step": 17058 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"learning_rate": 0.00043002110446711226, |
|
"loss": 0.6586, |
|
"step": 19901 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_accuracy": 0.6318327974276527, |
|
"eval_combined_score": 0.3159163987138264, |
|
"eval_f1": 0.0, |
|
"eval_loss": 0.6579923629760742, |
|
"eval_runtime": 67.6844, |
|
"eval_samples_per_second": 597.331, |
|
"eval_steps_per_second": 4.669, |
|
"step": 19901 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"learning_rate": 0.00042002813928948297, |
|
"loss": 0.6586, |
|
"step": 22744 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.6318327974276527, |
|
"eval_combined_score": 0.3159163987138264, |
|
"eval_f1": 0.0, |
|
"eval_loss": 0.6579098701477051, |
|
"eval_runtime": 67.6644, |
|
"eval_samples_per_second": 597.508, |
|
"eval_steps_per_second": 4.67, |
|
"step": 22744 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"learning_rate": 0.00041003165670066834, |
|
"loss": 0.6586, |
|
"step": 25587 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_accuracy": 0.6318327974276527, |
|
"eval_combined_score": 0.3159163987138264, |
|
"eval_f1": 0.0, |
|
"eval_loss": 0.6579644680023193, |
|
"eval_runtime": 67.7204, |
|
"eval_samples_per_second": 597.014, |
|
"eval_steps_per_second": 4.666, |
|
"step": 25587 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"learning_rate": 0.0004000351741118537, |
|
"loss": 0.6586, |
|
"step": 28430 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_accuracy": 0.6318327974276527, |
|
"eval_combined_score": 0.3159163987138264, |
|
"eval_f1": 0.0, |
|
"eval_loss": 0.6579644680023193, |
|
"eval_runtime": 67.7641, |
|
"eval_samples_per_second": 596.629, |
|
"eval_steps_per_second": 4.663, |
|
"step": 28430 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"step": 28430, |
|
"total_flos": 5.3244920021909504e+17, |
|
"train_loss": 0.6595250953891686, |
|
"train_runtime": 18380.3319, |
|
"train_samples_per_second": 989.77, |
|
"train_steps_per_second": 7.734 |
|
} |
|
], |
|
"max_steps": 142150, |
|
"num_train_epochs": 50, |
|
"total_flos": 5.3244920021909504e+17, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|