{ "best_metric": 1.1392158269882202, "best_model_checkpoint": "./vit-artworkclassifier\\checkpoint-600", "epoch": 4.0, "global_step": 1112, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.18, "learning_rate": 9.550359712230216e-05, "loss": 1.9425, "step": 50 }, { "epoch": 0.36, "learning_rate": 9.100719424460432e-05, "loss": 1.5906, "step": 100 }, { "epoch": 0.36, "eval_accuracy": 0.48467650397275824, "eval_loss": 1.4708987474441528, "eval_runtime": 7.3715, "eval_samples_per_second": 119.514, "eval_steps_per_second": 15.058, "step": 100 }, { "epoch": 0.54, "learning_rate": 8.651079136690648e-05, "loss": 1.4388, "step": 150 }, { "epoch": 0.72, "learning_rate": 8.201438848920863e-05, "loss": 1.3395, "step": 200 }, { "epoch": 0.72, "eval_accuracy": 0.5073779795686719, "eval_loss": 1.3207731246948242, "eval_runtime": 7.4035, "eval_samples_per_second": 118.998, "eval_steps_per_second": 14.993, "step": 200 }, { "epoch": 0.9, "learning_rate": 7.751798561151079e-05, "loss": 1.3275, "step": 250 }, { "epoch": 1.08, "learning_rate": 7.302158273381295e-05, "loss": 1.1461, "step": 300 }, { "epoch": 1.08, "eval_accuracy": 0.5164585698070374, "eval_loss": 1.3362975120544434, "eval_runtime": 7.64, "eval_samples_per_second": 115.314, "eval_steps_per_second": 14.529, "step": 300 }, { "epoch": 1.26, "learning_rate": 6.852517985611511e-05, "loss": 0.9749, "step": 350 }, { "epoch": 1.44, "learning_rate": 6.402877697841726e-05, "loss": 0.9593, "step": 400 }, { "epoch": 1.44, "eval_accuracy": 0.5845629965947786, "eval_loss": 1.1789547204971313, "eval_runtime": 7.248, "eval_samples_per_second": 121.551, "eval_steps_per_second": 15.315, "step": 400 }, { "epoch": 1.62, "learning_rate": 5.953237410071942e-05, "loss": 0.9175, "step": 450 }, { "epoch": 1.8, "learning_rate": 5.512589928057554e-05, "loss": 0.8761, "step": 500 }, { "epoch": 1.8, "eval_accuracy": 0.5902383654937571, "eval_loss": 1.1252126693725586, "eval_runtime": 7.2535, "eval_samples_per_second": 121.459, "eval_steps_per_second": 15.303, "step": 500 }, { "epoch": 1.98, "learning_rate": 5.06294964028777e-05, "loss": 0.8615, "step": 550 }, { "epoch": 2.16, "learning_rate": 4.613309352517986e-05, "loss": 0.5922, "step": 600 }, { "epoch": 2.16, "eval_accuracy": 0.5947786606129398, "eval_loss": 1.1392158269882202, "eval_runtime": 7.5695, "eval_samples_per_second": 116.388, "eval_steps_per_second": 14.664, "step": 600 }, { "epoch": 2.34, "learning_rate": 4.163669064748202e-05, "loss": 0.4684, "step": 650 }, { "epoch": 2.52, "learning_rate": 3.714028776978418e-05, "loss": 0.4803, "step": 700 }, { "epoch": 2.52, "eval_accuracy": 0.5936435868331441, "eval_loss": 1.1560313701629639, "eval_runtime": 7.3175, "eval_samples_per_second": 120.396, "eval_steps_per_second": 15.169, "step": 700 }, { "epoch": 2.7, "learning_rate": 3.2643884892086335e-05, "loss": 0.4766, "step": 750 }, { "epoch": 2.88, "learning_rate": 2.8147482014388493e-05, "loss": 0.4454, "step": 800 }, { "epoch": 2.88, "eval_accuracy": 0.6118047673098751, "eval_loss": 1.1545273065567017, "eval_runtime": 7.2475, "eval_samples_per_second": 121.559, "eval_steps_per_second": 15.316, "step": 800 }, { "epoch": 3.06, "learning_rate": 2.3651079136690647e-05, "loss": 0.371, "step": 850 }, { "epoch": 3.24, "learning_rate": 1.9154676258992808e-05, "loss": 0.2271, "step": 900 }, { "epoch": 3.24, "eval_accuracy": 0.6038592508513053, "eval_loss": 1.2283731698989868, "eval_runtime": 7.1705, "eval_samples_per_second": 122.865, "eval_steps_per_second": 15.48, "step": 900 }, { "epoch": 3.42, "learning_rate": 1.4658273381294965e-05, "loss": 0.2249, "step": 950 }, { "epoch": 3.6, "learning_rate": 1.0161870503597123e-05, "loss": 0.207, "step": 1000 }, { "epoch": 3.6, "eval_accuracy": 0.5959137343927355, "eval_loss": 1.262502670288086, "eval_runtime": 7.2385, "eval_samples_per_second": 121.71, "eval_steps_per_second": 15.335, "step": 1000 }, { "epoch": 3.78, "learning_rate": 5.665467625899281e-06, "loss": 0.1906, "step": 1050 }, { "epoch": 3.96, "learning_rate": 1.169064748201439e-06, "loss": 0.1958, "step": 1100 }, { "epoch": 3.96, "eval_accuracy": 0.6004540295119183, "eval_loss": 1.262100338935852, "eval_runtime": 7.2855, "eval_samples_per_second": 120.925, "eval_steps_per_second": 15.236, "step": 1100 }, { "epoch": 4.0, "step": 1112, "total_flos": 2.7542380976164454e+18, "train_loss": 0.7775138853479633, "train_runtime": 613.7183, "train_samples_per_second": 57.909, "train_steps_per_second": 1.812 } ], "max_steps": 1112, "num_train_epochs": 4, "total_flos": 2.7542380976164454e+18, "trial_name": null, "trial_params": null }