{ "best_metric": 0.9909420289855073, "best_model_checkpoint": "./fossilBERT_output/checkpoint-5661", "epoch": 10.0, "global_step": 6290, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.79, "learning_rate": 4.6025437201907795e-05, "loss": 0.1219, "step": 500 }, { "epoch": 1.0, "eval_accuracy": 0.9829025844930418, "eval_f1": 0.980708838043966, "eval_loss": 0.06422444432973862, "eval_precision": 0.9741532976827094, "eval_recall": 0.987353206865402, "eval_runtime": 2.8563, "eval_samples_per_second": 880.496, "eval_steps_per_second": 55.315, "step": 629 }, { "epoch": 1.59, "learning_rate": 4.205087440381558e-05, "loss": 0.0426, "step": 1000 }, { "epoch": 2.0, "eval_accuracy": 0.9864811133200795, "eval_f1": 0.9845313921747042, "eval_loss": 0.06980240345001221, "eval_precision": 0.9917506874427131, "eval_recall": 0.9774164408310749, "eval_runtime": 2.8485, "eval_samples_per_second": 882.932, "eval_steps_per_second": 55.469, "step": 1258 }, { "epoch": 2.38, "learning_rate": 3.8076311605723374e-05, "loss": 0.0288, "step": 1500 }, { "epoch": 3.0, "eval_accuracy": 0.9876739562624255, "eval_f1": 0.986054880791723, "eval_loss": 0.08222242444753647, "eval_precision": 0.982078853046595, "eval_recall": 0.990063233965673, "eval_runtime": 2.8512, "eval_samples_per_second": 882.071, "eval_steps_per_second": 55.414, "step": 1887 }, { "epoch": 3.18, "learning_rate": 3.410174880763116e-05, "loss": 0.0057, "step": 2000 }, { "epoch": 3.97, "learning_rate": 3.0127186009538953e-05, "loss": 0.0084, "step": 2500 }, { "epoch": 4.0, "eval_accuracy": 0.9880715705765407, "eval_f1": 0.9864253393665158, "eval_loss": 0.07759582996368408, "eval_precision": 0.9882139619220308, "eval_recall": 0.9846431797651309, "eval_runtime": 2.839, "eval_samples_per_second": 885.877, "eval_steps_per_second": 55.654, "step": 2516 }, { "epoch": 4.77, "learning_rate": 2.6152623211446743e-05, "loss": 0.0061, "step": 3000 }, { "epoch": 5.0, "eval_accuracy": 0.988469184890656, "eval_f1": 0.9868599909379248, "eval_loss": 0.10027419775724411, "eval_precision": 0.99, "eval_recall": 0.983739837398374, "eval_runtime": 2.8617, "eval_samples_per_second": 878.859, "eval_steps_per_second": 55.213, "step": 3145 }, { "epoch": 5.56, "learning_rate": 2.2178060413354532e-05, "loss": 0.0016, "step": 3500 }, { "epoch": 6.0, "eval_accuracy": 0.989662027833002, "eval_f1": 0.9882777276825968, "eval_loss": 0.08881077915430069, "eval_precision": 0.9864986498649865, "eval_recall": 0.990063233965673, "eval_runtime": 2.8662, "eval_samples_per_second": 877.455, "eval_steps_per_second": 55.124, "step": 3774 }, { "epoch": 6.36, "learning_rate": 1.820349761526232e-05, "loss": 0.0023, "step": 4000 }, { "epoch": 7.0, "eval_accuracy": 0.9904572564612326, "eval_f1": 0.9891500904159132, "eval_loss": 0.09042701870203018, "eval_precision": 0.9900452488687783, "eval_recall": 0.988256549232159, "eval_runtime": 2.8476, "eval_samples_per_second": 883.214, "eval_steps_per_second": 55.486, "step": 4403 }, { "epoch": 7.15, "learning_rate": 1.4228934817170111e-05, "loss": 0.0037, "step": 4500 }, { "epoch": 7.95, "learning_rate": 1.02543720190779e-05, "loss": 0.0017, "step": 5000 }, { "epoch": 8.0, "eval_accuracy": 0.9888667992047714, "eval_f1": 0.9872611464968153, "eval_loss": 0.09531795978546143, "eval_precision": 0.9945004582951421, "eval_recall": 0.980126467931346, "eval_runtime": 2.8577, "eval_samples_per_second": 880.078, "eval_steps_per_second": 55.289, "step": 5032 }, { "epoch": 8.74, "learning_rate": 6.279809220985691e-06, "loss": 0.0, "step": 5500 }, { "epoch": 9.0, "eval_accuracy": 0.9920477137176938, "eval_f1": 0.9909420289855073, "eval_loss": 0.0791691467165947, "eval_precision": 0.9936421435059037, "eval_recall": 0.988256549232159, "eval_runtime": 2.8459, "eval_samples_per_second": 883.726, "eval_steps_per_second": 55.518, "step": 5661 }, { "epoch": 9.54, "learning_rate": 2.3052464228934817e-06, "loss": 0.0, "step": 6000 }, { "epoch": 10.0, "eval_accuracy": 0.9916500994035785, "eval_f1": 0.990493435943866, "eval_loss": 0.07801677286624908, "eval_precision": 0.9927404718693285, "eval_recall": 0.988256549232159, "eval_runtime": 2.8772, "eval_samples_per_second": 874.116, "eval_steps_per_second": 54.915, "step": 6290 } ], "max_steps": 6290, "num_train_epochs": 10, "total_flos": 3330561570708480.0, "trial_name": null, "trial_params": null }