{ "best_metric": 0.33476540446281433, "best_model_checkpoint": "relevancy-eksyar/checkpoint-151", "epoch": 1.0, "eval_steps": 500, "global_step": 151, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.046357615894039736, "grad_norm": 6.584251403808594, "learning_rate": 2.317880794701987e-06, "loss": 0.7096, "step": 7 }, { "epoch": 0.09271523178807947, "grad_norm": 5.720220565795898, "learning_rate": 4.635761589403974e-06, "loss": 0.7046, "step": 14 }, { "epoch": 0.1390728476821192, "grad_norm": 5.474271774291992, "learning_rate": 6.95364238410596e-06, "loss": 0.6714, "step": 21 }, { "epoch": 0.18543046357615894, "grad_norm": 5.771448135375977, "learning_rate": 9.271523178807948e-06, "loss": 0.6352, "step": 28 }, { "epoch": 0.23178807947019867, "grad_norm": 6.3206658363342285, "learning_rate": 1.1589403973509934e-05, "loss": 0.5865, "step": 35 }, { "epoch": 0.2781456953642384, "grad_norm": 6.563697814941406, "learning_rate": 1.3576158940397351e-05, "loss": 0.6163, "step": 42 }, { "epoch": 0.32450331125827814, "grad_norm": 5.018538951873779, "learning_rate": 1.589403973509934e-05, "loss": 0.5652, "step": 49 }, { "epoch": 0.3708609271523179, "grad_norm": 6.649289608001709, "learning_rate": 1.8211920529801323e-05, "loss": 0.5127, "step": 56 }, { "epoch": 0.41721854304635764, "grad_norm": 5.347183704376221, "learning_rate": 2.052980132450331e-05, "loss": 0.4503, "step": 63 }, { "epoch": 0.46357615894039733, "grad_norm": 5.734078884124756, "learning_rate": 2.2516556291390732e-05, "loss": 0.4906, "step": 70 }, { "epoch": 0.5099337748344371, "grad_norm": 7.377983093261719, "learning_rate": 2.4834437086092715e-05, "loss": 0.4134, "step": 77 }, { "epoch": 0.5562913907284768, "grad_norm": 4.084234237670898, "learning_rate": 2.6821192052980134e-05, "loss": 0.358, "step": 84 }, { "epoch": 0.6026490066225165, "grad_norm": 7.116121768951416, "learning_rate": 2.913907284768212e-05, "loss": 0.4049, "step": 91 }, { "epoch": 0.6490066225165563, "grad_norm": 10.74765682220459, "learning_rate": 3.145695364238411e-05, "loss": 0.3495, "step": 98 }, { "epoch": 0.695364238410596, "grad_norm": 13.722650527954102, "learning_rate": 3.37748344370861e-05, "loss": 0.4953, "step": 105 }, { "epoch": 0.7417218543046358, "grad_norm": 12.211973190307617, "learning_rate": 3.609271523178808e-05, "loss": 0.3584, "step": 112 }, { "epoch": 0.7880794701986755, "grad_norm": 15.666670799255371, "learning_rate": 3.841059602649007e-05, "loss": 0.303, "step": 119 }, { "epoch": 0.8344370860927153, "grad_norm": 23.443561553955078, "learning_rate": 4.0728476821192055e-05, "loss": 0.3172, "step": 126 }, { "epoch": 0.8807947019867549, "grad_norm": 39.46857452392578, "learning_rate": 4.304635761589404e-05, "loss": 0.3557, "step": 133 }, { "epoch": 0.9271523178807947, "grad_norm": 15.615972518920898, "learning_rate": 4.536423841059603e-05, "loss": 0.4137, "step": 140 }, { "epoch": 0.9735099337748344, "grad_norm": 24.9617977142334, "learning_rate": 4.768211920529801e-05, "loss": 0.365, "step": 147 }, { "epoch": 1.0, "eval_accuracy": 0.8940397350993378, "eval_auc": 0.953993245910267, "eval_f1": 0.8896551724137931, "eval_loss": 0.33476540446281433, "eval_precision": 0.9280575539568345, "eval_recall": 0.8543046357615894, "eval_runtime": 0.6234, "eval_samples_per_second": 484.403, "eval_steps_per_second": 30.476, "step": 151 } ], "logging_steps": 7, "max_steps": 1510, "num_input_tokens_seen": 0, "num_train_epochs": 10, "save_steps": 500, "stateful_callbacks": { "EarlyStoppingCallback": { "args": { "early_stopping_patience": 5, "early_stopping_threshold": 0.01 }, "attributes": { "early_stopping_patience_counter": 0 } }, "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": false }, "attributes": {} } }, "total_flos": 79459538718720.0, "train_batch_size": 8, "trial_name": null, "trial_params": null }