DunnBC22's picture
All Dunn!!!
83db6c2
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 5.0,
"global_step": 665,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.01,
"learning_rate": 1.9969924812030075e-05,
"loss": 1.4231,
"step": 1
},
{
"epoch": 1.0,
"learning_rate": 1.6000000000000003e-05,
"loss": 0.8756,
"step": 133
},
{
"epoch": 1.0,
"eval_Macro F1": 0.6559577437042121,
"eval_Macro Precision": 0.6414383471396911,
"eval_Macro Recall": 0.6726779588705305,
"eval_Micro F1": 0.869914853358562,
"eval_Micro Precision": 0.869914853358562,
"eval_Micro Recall": 0.869914853358562,
"eval_Weighted F1": 0.8557169411489111,
"eval_Weighted Precision": 0.8436710960059746,
"eval_Weighted Recall": 0.869914853358562,
"eval_accuracy": 0.869914853358562,
"eval_loss": 0.452942818403244,
"eval_runtime": 45.2965,
"eval_samples_per_second": 46.67,
"eval_steps_per_second": 0.751,
"step": 133
},
{
"epoch": 2.0,
"learning_rate": 1.2e-05,
"loss": 0.4097,
"step": 266
},
{
"epoch": 2.0,
"eval_Macro F1": 0.7826498896982309,
"eval_Macro Precision": 0.8743465956410477,
"eval_Macro Recall": 0.763545504951241,
"eval_Micro F1": 0.902554399243141,
"eval_Micro Precision": 0.902554399243141,
"eval_Micro Recall": 0.902554399243141,
"eval_Weighted F1": 0.8981990872046596,
"eval_Weighted Precision": 0.9058995948483624,
"eval_Weighted Recall": 0.902554399243141,
"eval_accuracy": 0.902554399243141,
"eval_loss": 0.31955790519714355,
"eval_runtime": 46.2695,
"eval_samples_per_second": 45.689,
"eval_steps_per_second": 0.735,
"step": 266
},
{
"epoch": 3.0,
"learning_rate": 8.000000000000001e-06,
"loss": 0.3147,
"step": 399
},
{
"epoch": 3.0,
"eval_Macro F1": 0.8469888698710597,
"eval_Macro Precision": 0.8751072643902021,
"eval_Macro Recall": 0.8318917244382616,
"eval_Micro F1": 0.9115421002838221,
"eval_Micro Precision": 0.9115421002838221,
"eval_Micro Recall": 0.9115421002838221,
"eval_Weighted F1": 0.9110995447372147,
"eval_Weighted Precision": 0.9138453932389957,
"eval_Weighted Recall": 0.9115421002838221,
"eval_accuracy": 0.9115421002838221,
"eval_loss": 0.2824004292488098,
"eval_runtime": 44.6739,
"eval_samples_per_second": 47.321,
"eval_steps_per_second": 0.761,
"step": 399
},
{
"epoch": 4.0,
"learning_rate": 4.000000000000001e-06,
"loss": 0.2685,
"step": 532
},
{
"epoch": 4.0,
"eval_Macro F1": 0.8681032986279441,
"eval_Macro Precision": 0.8797074213841205,
"eval_Macro Recall": 0.8601906345542645,
"eval_Micro F1": 0.9186376537369915,
"eval_Micro Precision": 0.9186376537369915,
"eval_Micro Recall": 0.9186376537369915,
"eval_Weighted F1": 0.918722301523608,
"eval_Weighted Precision": 0.9202617437649651,
"eval_Weighted Recall": 0.9186376537369915,
"eval_accuracy": 0.9186376537369915,
"eval_loss": 0.26486265659332275,
"eval_runtime": 44.116,
"eval_samples_per_second": 47.919,
"eval_steps_per_second": 0.771,
"step": 532
},
{
"epoch": 5.0,
"learning_rate": 0.0,
"loss": 0.2479,
"step": 665
},
{
"epoch": 5.0,
"eval_Macro F1": 0.8749369503373983,
"eval_Macro Precision": 0.8821869512033577,
"eval_Macro Recall": 0.8684302125750863,
"eval_Micro F1": 0.9167455061494797,
"eval_Micro Precision": 0.9167455061494797,
"eval_Micro Recall": 0.9167455061494797,
"eval_Weighted F1": 0.9165697427628363,
"eval_Weighted Precision": 0.9168439952197603,
"eval_Weighted Recall": 0.9167455061494797,
"eval_accuracy": 0.9167455061494797,
"eval_loss": 0.26428648829460144,
"eval_runtime": 44.094,
"eval_samples_per_second": 47.943,
"eval_steps_per_second": 0.771,
"step": 665
},
{
"epoch": 5.0,
"step": 665,
"total_flos": 283497743040960.0,
"train_loss": 0.42408741363009117,
"train_runtime": 3111.9997,
"train_samples_per_second": 13.586,
"train_steps_per_second": 0.214
}
],
"max_steps": 665,
"num_train_epochs": 5,
"total_flos": 283497743040960.0,
"trial_name": null,
"trial_params": null
}