{ "best_metric": 0.48922964930534363, "best_model_checkpoint": "marvel_heroes_image_detection/checkpoint-1312", "epoch": 16.0, "eval_steps": 500, "global_step": 1312, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.8984615384615384, "eval_loss": 0.49428293108940125, "eval_runtime": 12.0605, "eval_samples_per_second": 53.895, "eval_steps_per_second": 6.799, "step": 82 }, { "epoch": 2.0, "eval_accuracy": 0.8969230769230769, "eval_loss": 0.49431312084198, "eval_runtime": 12.3803, "eval_samples_per_second": 52.503, "eval_steps_per_second": 6.623, "step": 164 }, { "epoch": 3.0, "eval_accuracy": 0.9015384615384615, "eval_loss": 0.49280208349227905, "eval_runtime": 12.4968, "eval_samples_per_second": 52.013, "eval_steps_per_second": 6.562, "step": 246 }, { "epoch": 4.0, "eval_accuracy": 0.8969230769230769, "eval_loss": 0.49426719546318054, "eval_runtime": 12.057, "eval_samples_per_second": 53.91, "eval_steps_per_second": 6.801, "step": 328 }, { "epoch": 5.0, "eval_accuracy": 0.8984615384615384, "eval_loss": 0.4925532042980194, "eval_runtime": 12.0769, "eval_samples_per_second": 53.822, "eval_steps_per_second": 6.79, "step": 410 }, { "epoch": 6.0, "eval_accuracy": 0.8938461538461538, "eval_loss": 0.49220046401023865, "eval_runtime": 12.1699, "eval_samples_per_second": 53.411, "eval_steps_per_second": 6.738, "step": 492 }, { "epoch": 6.1, "grad_norm": 4.925354480743408, "learning_rate": 7.169811320754716e-07, "loss": 0.5614, "step": 500 }, { "epoch": 7.0, "eval_accuracy": 0.8876923076923077, "eval_loss": 0.49260208010673523, "eval_runtime": 13.062, "eval_samples_per_second": 49.763, "eval_steps_per_second": 6.278, "step": 574 }, { "epoch": 8.0, "eval_accuracy": 0.8984615384615384, "eval_loss": 0.4912846088409424, "eval_runtime": 12.3802, "eval_samples_per_second": 52.503, "eval_steps_per_second": 6.623, "step": 656 }, { "epoch": 9.0, "eval_accuracy": 0.8923076923076924, "eval_loss": 0.4908252954483032, "eval_runtime": 12.0634, "eval_samples_per_second": 53.882, "eval_steps_per_second": 6.797, "step": 738 }, { "epoch": 10.0, "eval_accuracy": 0.8923076923076924, "eval_loss": 0.4904528260231018, "eval_runtime": 12.2539, "eval_samples_per_second": 53.044, "eval_steps_per_second": 6.692, "step": 820 }, { "epoch": 11.0, "eval_accuracy": 0.8892307692307693, "eval_loss": 0.4904911518096924, "eval_runtime": 12.1087, "eval_samples_per_second": 53.68, "eval_steps_per_second": 6.772, "step": 902 }, { "epoch": 12.0, "eval_accuracy": 0.8938461538461538, "eval_loss": 0.48976370692253113, "eval_runtime": 12.1182, "eval_samples_per_second": 53.639, "eval_steps_per_second": 6.767, "step": 984 }, { "epoch": 12.2, "grad_norm": 4.339879512786865, "learning_rate": 4.0251572327044023e-07, "loss": 0.519, "step": 1000 }, { "epoch": 13.0, "eval_accuracy": 0.8892307692307693, "eval_loss": 0.489905446767807, "eval_runtime": 12.1611, "eval_samples_per_second": 53.449, "eval_steps_per_second": 6.743, "step": 1066 }, { "epoch": 14.0, "eval_accuracy": 0.8923076923076924, "eval_loss": 0.48949161171913147, "eval_runtime": 12.1412, "eval_samples_per_second": 53.537, "eval_steps_per_second": 6.754, "step": 1148 }, { "epoch": 15.0, "eval_accuracy": 0.8923076923076924, "eval_loss": 0.48962101340293884, "eval_runtime": 12.0964, "eval_samples_per_second": 53.735, "eval_steps_per_second": 6.779, "step": 1230 }, { "epoch": 16.0, "eval_accuracy": 0.8907692307692308, "eval_loss": 0.48922964930534363, "eval_runtime": 11.9519, "eval_samples_per_second": 54.385, "eval_steps_per_second": 6.861, "step": 1312 } ], "logging_steps": 500, "max_steps": 1640, "num_input_tokens_seen": 0, "num_train_epochs": 20, "save_steps": 500, "total_flos": 3.2213602471819346e+18, "train_batch_size": 32, "trial_name": null, "trial_params": null }