|
{ |
|
"best_metric": 0.27679798007011414, |
|
"best_model_checkpoint": "spa_en_mBERT/checkpoint-4480", |
|
"epoch": 6.0, |
|
"global_step": 5376, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.56, |
|
"learning_rate": 1.988839285714286e-05, |
|
"loss": 1.015, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.8975234842015372, |
|
"eval_f1": 0.7030225599300675, |
|
"eval_loss": 0.40301570296287537, |
|
"eval_precision": 0.7149695684879983, |
|
"eval_recall": 0.691468253968254, |
|
"eval_runtime": 5.8245, |
|
"eval_samples_per_second": 283.973, |
|
"eval_steps_per_second": 17.856, |
|
"step": 896 |
|
}, |
|
{ |
|
"epoch": 1.12, |
|
"learning_rate": 1.9776785714285716e-05, |
|
"loss": 0.466, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 1.67, |
|
"learning_rate": 1.9665178571428575e-05, |
|
"loss": 0.3444, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.9197465890810875, |
|
"eval_f1": 0.772121694173792, |
|
"eval_loss": 0.30006563663482666, |
|
"eval_precision": 0.7738142686329215, |
|
"eval_recall": 0.770436507936508, |
|
"eval_runtime": 5.9225, |
|
"eval_samples_per_second": 279.276, |
|
"eval_steps_per_second": 17.56, |
|
"step": 1792 |
|
}, |
|
{ |
|
"epoch": 2.23, |
|
"learning_rate": 1.955357142857143e-05, |
|
"loss": 0.2916, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 2.79, |
|
"learning_rate": 1.944196428571429e-05, |
|
"loss": 0.2491, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.9214545310110619, |
|
"eval_f1": 0.7768938768773725, |
|
"eval_loss": 0.2882336974143982, |
|
"eval_precision": 0.7754859967051071, |
|
"eval_recall": 0.7783068783068783, |
|
"eval_runtime": 5.8599, |
|
"eval_samples_per_second": 282.259, |
|
"eval_steps_per_second": 17.748, |
|
"step": 2688 |
|
}, |
|
{ |
|
"epoch": 3.35, |
|
"learning_rate": 1.9330357142857144e-05, |
|
"loss": 0.2111, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 3.91, |
|
"learning_rate": 1.9218750000000003e-05, |
|
"loss": 0.1889, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.9311659682640557, |
|
"eval_f1": 0.8087478559176673, |
|
"eval_loss": 0.279913067817688, |
|
"eval_precision": 0.8067254540668597, |
|
"eval_recall": 0.8107804232804233, |
|
"eval_runtime": 5.8665, |
|
"eval_samples_per_second": 281.939, |
|
"eval_steps_per_second": 17.728, |
|
"step": 3584 |
|
}, |
|
{ |
|
"epoch": 4.46, |
|
"learning_rate": 1.910714285714286e-05, |
|
"loss": 0.1683, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.9332115266220483, |
|
"eval_f1": 0.8155864706270193, |
|
"eval_loss": 0.27679798007011414, |
|
"eval_precision": 0.8130669120546865, |
|
"eval_recall": 0.8181216931216931, |
|
"eval_runtime": 6.0326, |
|
"eval_samples_per_second": 274.178, |
|
"eval_steps_per_second": 17.24, |
|
"step": 4480 |
|
}, |
|
{ |
|
"epoch": 5.02, |
|
"learning_rate": 1.8995535714285717e-05, |
|
"loss": 0.1568, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 5.58, |
|
"learning_rate": 1.8883928571428573e-05, |
|
"loss": 0.1313, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.9282068595714257, |
|
"eval_f1": 0.7986634908032288, |
|
"eval_loss": 0.30244389176368713, |
|
"eval_precision": 0.7989806724913953, |
|
"eval_recall": 0.7983465608465609, |
|
"eval_runtime": 5.8739, |
|
"eval_samples_per_second": 281.583, |
|
"eval_steps_per_second": 17.705, |
|
"step": 5376 |
|
} |
|
], |
|
"max_steps": 89600, |
|
"num_train_epochs": 100, |
|
"total_flos": 3919265715030336.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|