{ "best_metric": 0.18881076574325562, "best_model_checkpoint": "./model/para_2class_bert_base_multilingual_uncased/checkpoint-858", "epoch": 10.0, "global_step": 2860, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "learning_rate": 2.7e-06, "loss": 0.4425, "step": 286 }, { "epoch": 1.0, "eval_accuracy": 0.8879159369527145, "eval_f1": 0.8871513624348426, "eval_loss": 0.24978627264499664, "eval_precision": 0.886429187723407, "eval_recall": 0.8882284468880799, "eval_runtime": 6.0607, "eval_samples_per_second": 94.213, "eval_steps_per_second": 5.94, "step": 286 }, { "epoch": 2.0, "learning_rate": 2.4000000000000003e-06, "loss": 0.2338, "step": 572 }, { "epoch": 2.0, "eval_accuracy": 0.9019264448336253, "eval_f1": 0.9014181773338266, "eval_loss": 0.21415023505687714, "eval_precision": 0.9005447078496951, "eval_recall": 0.903391782450405, "eval_runtime": 6.0522, "eval_samples_per_second": 94.345, "eval_steps_per_second": 5.948, "step": 572 }, { "epoch": 3.0, "learning_rate": 2.1e-06, "loss": 0.183, "step": 858 }, { "epoch": 3.0, "eval_accuracy": 0.9264448336252189, "eval_f1": 0.9256510416666667, "eval_loss": 0.18881076574325562, "eval_precision": 0.9263208226731912, "eval_recall": 0.9250749188894667, "eval_runtime": 6.0451, "eval_samples_per_second": 94.456, "eval_steps_per_second": 5.955, "step": 858 }, { "epoch": 4.0, "learning_rate": 1.8e-06, "loss": 0.1649, "step": 1144 }, { "epoch": 4.0, "eval_accuracy": 0.9264448336252189, "eval_f1": 0.9260253183298786, "eval_loss": 0.21701288223266602, "eval_precision": 0.9250830564784054, "eval_recall": 0.9277992421428041, "eval_runtime": 6.0482, "eval_samples_per_second": 94.408, "eval_steps_per_second": 5.952, "step": 1144 }, { "epoch": 5.0, "learning_rate": 1.5e-06, "loss": 0.1377, "step": 1430 }, { "epoch": 5.0, "eval_accuracy": 0.9352014010507881, "eval_f1": 0.9345720877657515, "eval_loss": 0.20453482866287231, "eval_precision": 0.934725767677018, "eval_recall": 0.9344243009634198, "eval_runtime": 6.095, "eval_samples_per_second": 93.683, "eval_steps_per_second": 5.906, "step": 1430 }, { "epoch": 6.0, "learning_rate": 1.2000000000000002e-06, "loss": 0.1274, "step": 1716 }, { "epoch": 6.0, "eval_accuracy": 0.9334500875656743, "eval_f1": 0.9330341711520418, "eval_loss": 0.24984127283096313, "eval_precision": 0.9321215703659917, "eval_recall": 0.9345295589072987, "eval_runtime": 6.1229, "eval_samples_per_second": 93.257, "eval_steps_per_second": 5.88, "step": 1716 }, { "epoch": 7.0, "learning_rate": 9e-07, "loss": 0.1107, "step": 2002 }, { "epoch": 7.0, "eval_accuracy": 0.9334500875656743, "eval_f1": 0.9331381733021078, "eval_loss": 0.2757098972797394, "eval_precision": 0.9322114084887807, "eval_recall": 0.9355511801273002, "eval_runtime": 6.1134, "eval_samples_per_second": 93.402, "eval_steps_per_second": 5.889, "step": 2002 }, { "epoch": 8.0, "learning_rate": 6.000000000000001e-07, "loss": 0.101, "step": 2288 }, { "epoch": 8.0, "eval_accuracy": 0.9404553415061296, "eval_f1": 0.940146750524109, "eval_loss": 0.27531886100769043, "eval_precision": 0.9391599449144206, "eval_recall": 0.9422814968917949, "eval_runtime": 6.0533, "eval_samples_per_second": 94.328, "eval_steps_per_second": 5.947, "step": 2288 }, { "epoch": 9.0, "learning_rate": 3.0000000000000004e-07, "loss": 0.0871, "step": 2574 }, { "epoch": 9.0, "eval_accuracy": 0.9281961471103327, "eval_f1": 0.9279973919007445, "eval_loss": 0.3327995836734772, "eval_precision": 0.927807224185316, "eval_recall": 0.9317804690789311, "eval_runtime": 6.0307, "eval_samples_per_second": 94.682, "eval_steps_per_second": 5.969, "step": 2574 }, { "epoch": 10.0, "learning_rate": 0.0, "loss": 0.08, "step": 2860 }, { "epoch": 10.0, "eval_accuracy": 0.9422066549912435, "eval_f1": 0.9418922711138935, "eval_loss": 0.2849212884902954, "eval_precision": 0.9408979089790899, "eval_recall": 0.9438789409812518, "eval_runtime": 6.0221, "eval_samples_per_second": 94.818, "eval_steps_per_second": 5.978, "step": 2860 } ], "max_steps": 2860, "num_train_epochs": 10, "total_flos": 1.20136507877376e+16, "trial_name": null, "trial_params": null }