{ "best_metric": null, "best_model_checkpoint": null, "epoch": 5.0, "global_step": 665, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.01, "learning_rate": 1.9969924812030075e-05, "loss": 1.4231, "step": 1 }, { "epoch": 1.0, "learning_rate": 1.6000000000000003e-05, "loss": 0.8756, "step": 133 }, { "epoch": 1.0, "eval_Macro F1": 0.6559577437042121, "eval_Macro Precision": 0.6414383471396911, "eval_Macro Recall": 0.6726779588705305, "eval_Micro F1": 0.869914853358562, "eval_Micro Precision": 0.869914853358562, "eval_Micro Recall": 0.869914853358562, "eval_Weighted F1": 0.8557169411489111, "eval_Weighted Precision": 0.8436710960059746, "eval_Weighted Recall": 0.869914853358562, "eval_accuracy": 0.869914853358562, "eval_loss": 0.452942818403244, "eval_runtime": 45.2965, "eval_samples_per_second": 46.67, "eval_steps_per_second": 0.751, "step": 133 }, { "epoch": 2.0, "learning_rate": 1.2e-05, "loss": 0.4097, "step": 266 }, { "epoch": 2.0, "eval_Macro F1": 0.7826498896982309, "eval_Macro Precision": 0.8743465956410477, "eval_Macro Recall": 0.763545504951241, "eval_Micro F1": 0.902554399243141, "eval_Micro Precision": 0.902554399243141, "eval_Micro Recall": 0.902554399243141, "eval_Weighted F1": 0.8981990872046596, "eval_Weighted Precision": 0.9058995948483624, "eval_Weighted Recall": 0.902554399243141, "eval_accuracy": 0.902554399243141, "eval_loss": 0.31955790519714355, "eval_runtime": 46.2695, "eval_samples_per_second": 45.689, "eval_steps_per_second": 0.735, "step": 266 }, { "epoch": 3.0, "learning_rate": 8.000000000000001e-06, "loss": 0.3147, "step": 399 }, { "epoch": 3.0, "eval_Macro F1": 0.8469888698710597, "eval_Macro Precision": 0.8751072643902021, "eval_Macro Recall": 0.8318917244382616, "eval_Micro F1": 0.9115421002838221, "eval_Micro Precision": 0.9115421002838221, "eval_Micro Recall": 0.9115421002838221, "eval_Weighted F1": 0.9110995447372147, "eval_Weighted Precision": 0.9138453932389957, "eval_Weighted Recall": 0.9115421002838221, "eval_accuracy": 0.9115421002838221, "eval_loss": 0.2824004292488098, "eval_runtime": 44.6739, "eval_samples_per_second": 47.321, "eval_steps_per_second": 0.761, "step": 399 }, { "epoch": 4.0, "learning_rate": 4.000000000000001e-06, "loss": 0.2685, "step": 532 }, { "epoch": 4.0, "eval_Macro F1": 0.8681032986279441, "eval_Macro Precision": 0.8797074213841205, "eval_Macro Recall": 0.8601906345542645, "eval_Micro F1": 0.9186376537369915, "eval_Micro Precision": 0.9186376537369915, "eval_Micro Recall": 0.9186376537369915, "eval_Weighted F1": 0.918722301523608, "eval_Weighted Precision": 0.9202617437649651, "eval_Weighted Recall": 0.9186376537369915, "eval_accuracy": 0.9186376537369915, "eval_loss": 0.26486265659332275, "eval_runtime": 44.116, "eval_samples_per_second": 47.919, "eval_steps_per_second": 0.771, "step": 532 }, { "epoch": 5.0, "learning_rate": 0.0, "loss": 0.2479, "step": 665 }, { "epoch": 5.0, "eval_Macro F1": 0.8749369503373983, "eval_Macro Precision": 0.8821869512033577, "eval_Macro Recall": 0.8684302125750863, "eval_Micro F1": 0.9167455061494797, "eval_Micro Precision": 0.9167455061494797, "eval_Micro Recall": 0.9167455061494797, "eval_Weighted F1": 0.9165697427628363, "eval_Weighted Precision": 0.9168439952197603, "eval_Weighted Recall": 0.9167455061494797, "eval_accuracy": 0.9167455061494797, "eval_loss": 0.26428648829460144, "eval_runtime": 44.094, "eval_samples_per_second": 47.943, "eval_steps_per_second": 0.771, "step": 665 }, { "epoch": 5.0, "step": 665, "total_flos": 283497743040960.0, "train_loss": 0.42408741363009117, "train_runtime": 3111.9997, "train_samples_per_second": 13.586, "train_steps_per_second": 0.214 } ], "max_steps": 665, "num_train_epochs": 5, "total_flos": 283497743040960.0, "trial_name": null, "trial_params": null }