{ "best_metric": null, "best_model_checkpoint": null, "epoch": 26.666666666666668, "global_step": 400, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.67, "eval_accuracy": 0.6659393661001378, "eval_f1": 0.5035663338088445, "eval_loss": 1.1944581270217896, "eval_precision": 0.4800543970988214, "eval_recall": 0.5295, "eval_runtime": 3.6881, "eval_samples_per_second": 14.641, "eval_steps_per_second": 1.627, "step": 25 }, { "epoch": 3.33, "eval_accuracy": 0.7687184198438217, "eval_f1": 0.7759615384615385, "eval_loss": 0.7770130038261414, "eval_precision": 0.7472222222222222, "eval_recall": 0.807, "eval_runtime": 3.715, "eval_samples_per_second": 14.536, "eval_steps_per_second": 1.615, "step": 50 }, { "epoch": 5.0, "eval_accuracy": 0.8118971061093248, "eval_f1": 0.8231029482841953, "eval_loss": 0.5989910364151001, "eval_precision": 0.7965388213283442, "eval_recall": 0.8515, "eval_runtime": 3.6727, "eval_samples_per_second": 14.703, "eval_steps_per_second": 1.634, "step": 75 }, { "epoch": 6.67, "eval_accuracy": 0.7702112999540652, "eval_f1": 0.8409471418320977, "eval_loss": 0.6813620924949646, "eval_precision": 0.8060522696011004, "eval_recall": 0.879, "eval_runtime": 3.7496, "eval_samples_per_second": 14.402, "eval_steps_per_second": 1.6, "step": 100 }, { "epoch": 8.33, "eval_accuracy": 0.8316490583371612, "eval_f1": 0.8467469879518073, "eval_loss": 0.5391940474510193, "eval_precision": 0.8172093023255814, "eval_recall": 0.8785, "eval_runtime": 3.7027, "eval_samples_per_second": 14.584, "eval_steps_per_second": 1.62, "step": 125 }, { "epoch": 10.0, "eval_accuracy": 0.811437758383096, "eval_f1": 0.8603297769156159, "eval_loss": 0.5438030362129211, "eval_precision": 0.835216572504708, "eval_recall": 0.887, "eval_runtime": 3.7703, "eval_samples_per_second": 14.322, "eval_steps_per_second": 1.591, "step": 150 }, { "epoch": 11.67, "eval_accuracy": 0.838194763435921, "eval_f1": 0.8752145133611179, "eval_loss": 0.5429797172546387, "eval_precision": 0.8585858585858586, "eval_recall": 0.8925, "eval_runtime": 3.7262, "eval_samples_per_second": 14.492, "eval_steps_per_second": 1.61, "step": 175 }, { "epoch": 13.33, "eval_accuracy": 0.8257923748277446, "eval_f1": 0.8691817736403724, "eval_loss": 0.5896742939949036, "eval_precision": 0.8520653218059558, "eval_recall": 0.887, "eval_runtime": 3.7744, "eval_samples_per_second": 14.307, "eval_steps_per_second": 1.59, "step": 200 }, { "epoch": 15.0, "eval_accuracy": 0.8430179145613229, "eval_f1": 0.8809756097560977, "eval_loss": 0.5427059531211853, "eval_precision": 0.86, "eval_recall": 0.903, "eval_runtime": 3.6854, "eval_samples_per_second": 14.652, "eval_steps_per_second": 1.628, "step": 225 }, { "epoch": 16.67, "eval_accuracy": 0.8410656867248507, "eval_f1": 0.8822512959763021, "eval_loss": 0.5541779398918152, "eval_precision": 0.871282301316431, "eval_recall": 0.8935, "eval_runtime": 3.7194, "eval_samples_per_second": 14.518, "eval_steps_per_second": 1.613, "step": 250 }, { "epoch": 18.33, "eval_accuracy": 0.83210840606339, "eval_f1": 0.8821515892420537, "eval_loss": 0.6013592481613159, "eval_precision": 0.8631578947368421, "eval_recall": 0.902, "eval_runtime": 3.7675, "eval_samples_per_second": 14.333, "eval_steps_per_second": 1.593, "step": 275 }, { "epoch": 20.0, "eval_accuracy": 0.8365870463941204, "eval_f1": 0.8843036109064112, "eval_loss": 0.5971384644508362, "eval_precision": 0.8691453404152584, "eval_recall": 0.9, "eval_runtime": 3.72, "eval_samples_per_second": 14.516, "eval_steps_per_second": 1.613, "step": 300 }, { "epoch": 21.67, "eval_accuracy": 0.8313045475424896, "eval_f1": 0.8891637803067788, "eval_loss": 0.598324716091156, "eval_precision": 0.8800195886385896, "eval_recall": 0.8985, "eval_runtime": 3.78, "eval_samples_per_second": 14.286, "eval_steps_per_second": 1.587, "step": 325 }, { "epoch": 23.33, "eval_accuracy": 0.8414101975195223, "eval_f1": 0.8964497041420119, "eval_loss": 0.5867139101028442, "eval_precision": 0.8842412451361867, "eval_recall": 0.909, "eval_runtime": 4.0235, "eval_samples_per_second": 13.421, "eval_steps_per_second": 1.491, "step": 350 }, { "epoch": 25.0, "eval_accuracy": 0.8465778594395957, "eval_f1": 0.8928835262250677, "eval_loss": 0.5947966575622559, "eval_precision": 0.8796700630761766, "eval_recall": 0.9065, "eval_runtime": 3.6989, "eval_samples_per_second": 14.599, "eval_steps_per_second": 1.622, "step": 375 }, { "epoch": 26.67, "eval_accuracy": 0.8414101975195223, "eval_f1": 0.8868156150257795, "eval_loss": 0.6016380190849304, "eval_precision": 0.8712011577424024, "eval_recall": 0.903, "eval_runtime": 3.6913, "eval_samples_per_second": 14.629, "eval_steps_per_second": 1.625, "step": 400 }, { "epoch": 26.67, "step": 400, "total_flos": 1054421372928000.0, "train_loss": 0.3642783355712891, "train_runtime": 422.1629, "train_samples_per_second": 9.475, "train_steps_per_second": 0.948 } ], "max_steps": 400, "num_train_epochs": 27, "total_flos": 1054421372928000.0, "trial_name": null, "trial_params": null }