{ "best_metric": 0.697825193570947, "best_model_checkpoint": "trained/hebban-reviews5/bert-base-multilingual-cased/checkpoint-4500", "epoch": 4.382997370727432, "global_step": 5001, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.44, "learning_rate": 4.502099580083983e-05, "loss": 1.3159, "step": 500 }, { "epoch": 0.44, "eval_accuracy": 0.4912475345167653, "eval_f1": 0.48070042281702435, "eval_loss": 1.1863828897476196, "eval_precision": 0.5054226630223979, "eval_qwk": 0.6104106009981652, "eval_recall": 0.4912475345167653, "eval_runtime": 23.5101, "eval_samples_per_second": 690.086, "eval_steps_per_second": 5.402, "step": 500 }, { "epoch": 0.88, "learning_rate": 4.003199360127974e-05, "loss": 1.092, "step": 1000 }, { "epoch": 0.88, "eval_accuracy": 0.5488165680473372, "eval_f1": 0.5517553489817303, "eval_loss": 1.0387530326843262, "eval_precision": 0.5678859988610889, "eval_qwk": 0.6346615351470672, "eval_recall": 0.5488165680473372, "eval_runtime": 23.5201, "eval_samples_per_second": 689.794, "eval_steps_per_second": 5.4, "step": 1000 }, { "epoch": 1.31, "learning_rate": 3.5032993401319734e-05, "loss": 0.9709, "step": 1500 }, { "epoch": 1.31, "eval_accuracy": 0.5436390532544378, "eval_f1": 0.5408623179767048, "eval_loss": 1.0117485523223877, "eval_precision": 0.5642348913139151, "eval_qwk": 0.6678503252600388, "eval_recall": 0.5436390532544378, "eval_runtime": 23.6496, "eval_samples_per_second": 686.015, "eval_steps_per_second": 5.37, "step": 1500 }, { "epoch": 1.75, "learning_rate": 3.0033993201359727e-05, "loss": 0.9404, "step": 2000 }, { "epoch": 1.75, "eval_accuracy": 0.5279215976331361, "eval_f1": 0.5218328433667149, "eval_loss": 1.0087615251541138, "eval_precision": 0.5543969942392576, "eval_qwk": 0.6748096376745845, "eval_recall": 0.5279215976331361, "eval_runtime": 23.476, "eval_samples_per_second": 691.088, "eval_steps_per_second": 5.41, "step": 2000 }, { "epoch": 2.19, "learning_rate": 2.503499300139972e-05, "loss": 0.8657, "step": 2500 }, { "epoch": 2.19, "eval_accuracy": 0.5708826429980276, "eval_f1": 0.5692427852436814, "eval_loss": 1.0947091579437256, "eval_precision": 0.5827881052454773, "eval_qwk": 0.6863988830193634, "eval_recall": 0.5708826429980276, "eval_runtime": 23.3841, "eval_samples_per_second": 693.805, "eval_steps_per_second": 5.431, "step": 2500 }, { "epoch": 2.63, "learning_rate": 2.0035992801439712e-05, "loss": 0.8004, "step": 3000 }, { "epoch": 2.63, "eval_accuracy": 0.5539940828402367, "eval_f1": 0.5591418616361084, "eval_loss": 1.0360697507858276, "eval_precision": 0.5772334772150153, "eval_qwk": 0.6712182177231302, "eval_recall": 0.5539940828402367, "eval_runtime": 23.5321, "eval_samples_per_second": 689.441, "eval_steps_per_second": 5.397, "step": 3000 }, { "epoch": 3.07, "learning_rate": 1.5046990601879624e-05, "loss": 0.7687, "step": 3500 }, { "epoch": 3.07, "eval_accuracy": 0.5808678500986193, "eval_f1": 0.5832607549463982, "eval_loss": 1.2274583578109741, "eval_precision": 0.5914789641012546, "eval_qwk": 0.689381177306146, "eval_recall": 0.5808678500986193, "eval_runtime": 23.7912, "eval_samples_per_second": 681.932, "eval_steps_per_second": 5.338, "step": 3500 }, { "epoch": 3.51, "learning_rate": 1.0047990401919617e-05, "loss": 0.6773, "step": 4000 }, { "epoch": 3.51, "eval_accuracy": 0.5830251479289941, "eval_f1": 0.5826927994622666, "eval_loss": 1.222939133644104, "eval_precision": 0.5930910696407776, "eval_qwk": 0.6959801434105679, "eval_recall": 0.5830251479289941, "eval_runtime": 23.6989, "eval_samples_per_second": 684.589, "eval_steps_per_second": 5.359, "step": 4000 }, { "epoch": 3.94, "learning_rate": 5.048990201959608e-06, "loss": 0.6584, "step": 4500 }, { "epoch": 3.94, "eval_accuracy": 0.5886341222879684, "eval_f1": 0.5886427250282493, "eval_loss": 1.281541347503662, "eval_precision": 0.5969768120377853, "eval_qwk": 0.697825193570947, "eval_recall": 0.5886341222879684, "eval_runtime": 23.7004, "eval_samples_per_second": 684.544, "eval_steps_per_second": 5.359, "step": 4500 }, { "epoch": 4.38, "learning_rate": 4.999000199960008e-08, "loss": 0.5961, "step": 5000 }, { "epoch": 4.38, "eval_accuracy": 0.5894354043392505, "eval_f1": 0.5909264551740898, "eval_loss": 1.359961748123169, "eval_precision": 0.5997451050742093, "eval_qwk": 0.6969542849451541, "eval_recall": 0.5894354043392505, "eval_runtime": 23.5424, "eval_samples_per_second": 689.138, "eval_steps_per_second": 5.395, "step": 5000 }, { "epoch": 4.38, "step": 5001, "total_flos": 1.6839139993111757e+17, "train_loss": 0.8685172849525287, "train_runtime": 2653.5735, "train_samples_per_second": 241.232, "train_steps_per_second": 1.885 } ], "max_steps": 5001, "num_train_epochs": 5, "total_flos": 1.6839139993111757e+17, "trial_name": null, "trial_params": null }