{ "best_metric": 1.6452902555465698, "best_model_checkpoint": "fruit_100_types_image_detection/checkpoint-4220", "epoch": 5.0, "eval_steps": 500, "global_step": 4220, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.59, "grad_norm": 2.6183602809906006, "learning_rate": 1.7841726618705034e-06, "loss": 1.8505, "step": 500 }, { "epoch": 1.0, "eval_accuracy": 0.8403333333333334, "eval_loss": 1.8119271993637085, "eval_runtime": 167.1143, "eval_samples_per_second": 107.711, "eval_steps_per_second": 6.732, "step": 844 }, { "epoch": 1.18, "grad_norm": 3.343961000442505, "learning_rate": 1.5443645083932852e-06, "loss": 1.7915, "step": 1000 }, { "epoch": 1.78, "grad_norm": 3.8417131900787354, "learning_rate": 1.3045563549160672e-06, "loss": 1.7335, "step": 1500 }, { "epoch": 2.0, "eval_accuracy": 0.8433333333333334, "eval_loss": 1.7391046285629272, "eval_runtime": 169.3646, "eval_samples_per_second": 106.28, "eval_steps_per_second": 6.642, "step": 1688 }, { "epoch": 2.37, "grad_norm": 2.7001466751098633, "learning_rate": 1.0647482014388488e-06, "loss": 1.7029, "step": 2000 }, { "epoch": 2.96, "grad_norm": 3.4065492153167725, "learning_rate": 8.249400479616306e-07, "loss": 1.6636, "step": 2500 }, { "epoch": 3.0, "eval_accuracy": 0.8451666666666666, "eval_loss": 1.6863653659820557, "eval_runtime": 183.0164, "eval_samples_per_second": 98.352, "eval_steps_per_second": 6.147, "step": 2532 }, { "epoch": 3.55, "grad_norm": 2.9417073726654053, "learning_rate": 5.851318944844125e-07, "loss": 1.6379, "step": 3000 }, { "epoch": 4.0, "eval_accuracy": 0.8458333333333333, "eval_loss": 1.655003309249878, "eval_runtime": 182.964, "eval_samples_per_second": 98.38, "eval_steps_per_second": 6.149, "step": 3376 }, { "epoch": 4.15, "grad_norm": 3.41286563873291, "learning_rate": 3.4532374100719426e-07, "loss": 1.617, "step": 3500 }, { "epoch": 4.74, "grad_norm": 3.1814427375793457, "learning_rate": 1.0551558752997601e-07, "loss": 1.6055, "step": 4000 }, { "epoch": 5.0, "eval_accuracy": 0.8466666666666667, "eval_loss": 1.6452902555465698, "eval_runtime": 165.9895, "eval_samples_per_second": 108.441, "eval_steps_per_second": 6.778, "step": 4220 } ], "logging_steps": 500, "max_steps": 4220, "num_input_tokens_seen": 0, "num_train_epochs": 5, "save_steps": 500, "total_flos": 1.047060731179008e+19, "train_batch_size": 32, "trial_name": null, "trial_params": null }