{ "best_metric": 0.8303472995758057, "best_model_checkpoint": "face_emotions_image_detection/checkpoint-6800", "epoch": 20.0, "eval_steps": 500, "global_step": 6800, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.5581299131154324, "eval_loss": 1.5780813694000244, "eval_runtime": 34.4094, "eval_samples_per_second": 70.242, "eval_steps_per_second": 2.209, "step": 340 }, { "epoch": 1.47, "learning_rate": 9.333333333333333e-07, "loss": 1.5754, "step": 500 }, { "epoch": 2.0, "eval_accuracy": 0.6235002068680182, "eval_loss": 1.4531924724578857, "eval_runtime": 33.5063, "eval_samples_per_second": 72.136, "eval_steps_per_second": 2.268, "step": 680 }, { "epoch": 2.94, "learning_rate": 8.592592592592592e-07, "loss": 1.3718, "step": 1000 }, { "epoch": 3.0, "eval_accuracy": 0.6607364501448076, "eval_loss": 1.335525631904602, "eval_runtime": 33.5199, "eval_samples_per_second": 72.107, "eval_steps_per_second": 2.267, "step": 1020 }, { "epoch": 4.0, "eval_accuracy": 0.676458419528341, "eval_loss": 1.2385190725326538, "eval_runtime": 33.0393, "eval_samples_per_second": 73.155, "eval_steps_per_second": 2.3, "step": 1360 }, { "epoch": 4.41, "learning_rate": 7.851851851851852e-07, "loss": 1.2055, "step": 1500 }, { "epoch": 5.0, "eval_accuracy": 0.6830781961108813, "eval_loss": 1.1576205492019653, "eval_runtime": 34.4609, "eval_samples_per_second": 70.137, "eval_steps_per_second": 2.205, "step": 1700 }, { "epoch": 5.88, "learning_rate": 7.111111111111111e-07, "loss": 1.0902, "step": 2000 }, { "epoch": 6.0, "eval_accuracy": 0.6963177492759619, "eval_loss": 1.0941061973571777, "eval_runtime": 33.7137, "eval_samples_per_second": 71.692, "eval_steps_per_second": 2.254, "step": 2040 }, { "epoch": 7.0, "eval_accuracy": 0.7136946628051303, "eval_loss": 1.0437400341033936, "eval_runtime": 34.1074, "eval_samples_per_second": 70.864, "eval_steps_per_second": 2.228, "step": 2380 }, { "epoch": 7.35, "learning_rate": 6.37037037037037e-07, "loss": 0.9981, "step": 2500 }, { "epoch": 8.0, "eval_accuracy": 0.7194869673148532, "eval_loss": 0.999989926815033, "eval_runtime": 34.4809, "eval_samples_per_second": 70.097, "eval_steps_per_second": 2.204, "step": 2720 }, { "epoch": 8.82, "learning_rate": 5.62962962962963e-07, "loss": 0.9352, "step": 3000 }, { "epoch": 9.0, "eval_accuracy": 0.7273479520066197, "eval_loss": 0.9669674634933472, "eval_runtime": 34.4622, "eval_samples_per_second": 70.135, "eval_steps_per_second": 2.205, "step": 3060 }, { "epoch": 10.0, "eval_accuracy": 0.7290028961522549, "eval_loss": 0.9405105113983154, "eval_runtime": 33.8763, "eval_samples_per_second": 71.348, "eval_steps_per_second": 2.243, "step": 3400 }, { "epoch": 10.29, "learning_rate": 4.888888888888889e-07, "loss": 0.8851, "step": 3500 }, { "epoch": 11.0, "eval_accuracy": 0.7343814646255689, "eval_loss": 0.9163816571235657, "eval_runtime": 34.0893, "eval_samples_per_second": 70.902, "eval_steps_per_second": 2.229, "step": 3740 }, { "epoch": 11.76, "learning_rate": 4.1481481481481476e-07, "loss": 0.8465, "step": 4000 }, { "epoch": 12.0, "eval_accuracy": 0.7347952006619777, "eval_loss": 0.8966172933578491, "eval_runtime": 34.3056, "eval_samples_per_second": 70.455, "eval_steps_per_second": 2.215, "step": 4080 }, { "epoch": 13.0, "eval_accuracy": 0.7422424493173355, "eval_loss": 0.8790085911750793, "eval_runtime": 34.0958, "eval_samples_per_second": 70.888, "eval_steps_per_second": 2.229, "step": 4420 }, { "epoch": 13.24, "learning_rate": 3.407407407407407e-07, "loss": 0.8165, "step": 4500 }, { "epoch": 14.0, "eval_accuracy": 0.7480347538270583, "eval_loss": 0.8644098043441772, "eval_runtime": 34.0216, "eval_samples_per_second": 71.043, "eval_steps_per_second": 2.234, "step": 4760 }, { "epoch": 14.71, "learning_rate": 2.6666666666666667e-07, "loss": 0.7954, "step": 5000 }, { "epoch": 15.0, "eval_accuracy": 0.750517170045511, "eval_loss": 0.8529735803604126, "eval_runtime": 34.2111, "eval_samples_per_second": 70.649, "eval_steps_per_second": 2.221, "step": 5100 }, { "epoch": 16.0, "eval_accuracy": 0.7509309060819197, "eval_loss": 0.8457837104797363, "eval_runtime": 33.6533, "eval_samples_per_second": 71.821, "eval_steps_per_second": 2.258, "step": 5440 }, { "epoch": 16.18, "learning_rate": 1.9259259259259257e-07, "loss": 0.7811, "step": 5500 }, { "epoch": 17.0, "eval_accuracy": 0.7534133223003724, "eval_loss": 0.8384882211685181, "eval_runtime": 33.6326, "eval_samples_per_second": 71.865, "eval_steps_per_second": 2.26, "step": 5780 }, { "epoch": 17.65, "learning_rate": 1.1851851851851851e-07, "loss": 0.7673, "step": 6000 }, { "epoch": 18.0, "eval_accuracy": 0.7550682664460074, "eval_loss": 0.8335217237472534, "eval_runtime": 33.2974, "eval_samples_per_second": 72.588, "eval_steps_per_second": 2.282, "step": 6120 }, { "epoch": 19.0, "eval_accuracy": 0.7529995862639636, "eval_loss": 0.8314878940582275, "eval_runtime": 33.8017, "eval_samples_per_second": 71.505, "eval_steps_per_second": 2.248, "step": 6460 }, { "epoch": 19.12, "learning_rate": 4.444444444444444e-08, "loss": 0.7594, "step": 6500 }, { "epoch": 20.0, "eval_accuracy": 0.7538270583367811, "eval_loss": 0.8303472995758057, "eval_runtime": 34.3877, "eval_samples_per_second": 70.287, "eval_steps_per_second": 2.21, "step": 6800 } ], "logging_steps": 500, "max_steps": 6800, "num_input_tokens_seen": 0, "num_train_epochs": 20, "save_steps": 500, "total_flos": 3.3702474498545664e+19, "train_batch_size": 64, "trial_name": null, "trial_params": null }