{ "best_metric": 6.141994476318359, "best_model_checkpoint": "Transformers/vit-base-clothing-leafs-example/checkpoint-36000", "epoch": 5.0, "global_step": 36155, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.14, "learning_rate": 0.0001944682616512239, "loss": 8.6059, "step": 1000 }, { "epoch": 0.14, "eval_accuracy": 0.0002420302883618007, "eval_loss": 8.584440231323242, "eval_runtime": 155.6325, "eval_samples_per_second": 185.835, "eval_steps_per_second": 23.234, "step": 1000 }, { "epoch": 0.28, "learning_rate": 0.0001889365233024478, "loss": 8.5506, "step": 2000 }, { "epoch": 0.28, "eval_accuracy": 0.00100269690892746, "eval_loss": 8.518888473510742, "eval_runtime": 153.9354, "eval_samples_per_second": 187.884, "eval_steps_per_second": 23.49, "step": 2000 }, { "epoch": 0.41, "learning_rate": 0.00018341584843036926, "loss": 8.4931, "step": 3000 }, { "epoch": 0.41, "eval_accuracy": 0.0012101514418090035, "eval_loss": 8.464128494262695, "eval_runtime": 157.4956, "eval_samples_per_second": 183.637, "eval_steps_per_second": 22.959, "step": 3000 }, { "epoch": 0.55, "learning_rate": 0.00017788411008159315, "loss": 8.4223, "step": 4000 }, { "epoch": 0.55, "eval_accuracy": 0.0016250605075720905, "eval_loss": 8.349540710449219, "eval_runtime": 156.3508, "eval_samples_per_second": 184.982, "eval_steps_per_second": 23.127, "step": 4000 }, { "epoch": 0.69, "learning_rate": 0.00017235237173281705, "loss": 8.3144, "step": 5000 }, { "epoch": 0.69, "eval_accuracy": 0.0020745453288154346, "eval_loss": 8.255170822143555, "eval_runtime": 157.1252, "eval_samples_per_second": 184.07, "eval_steps_per_second": 23.013, "step": 5000 }, { "epoch": 0.83, "learning_rate": 0.00016682063338404094, "loss": 8.1936, "step": 6000 }, { "epoch": 0.83, "eval_accuracy": 0.0023511513726574926, "eval_loss": 8.138504981994629, "eval_runtime": 157.2716, "eval_samples_per_second": 183.898, "eval_steps_per_second": 22.992, "step": 6000 }, { "epoch": 0.97, "learning_rate": 0.00016128889503526483, "loss": 8.0638, "step": 7000 }, { "epoch": 0.97, "eval_accuracy": 0.002835211949381094, "eval_loss": 7.992447376251221, "eval_runtime": 156.9147, "eval_samples_per_second": 184.317, "eval_steps_per_second": 23.044, "step": 7000 }, { "epoch": 1.11, "learning_rate": 0.00015575715668648873, "loss": 7.8485, "step": 8000 }, { "epoch": 1.11, "eval_accuracy": 0.0036304543254270104, "eval_loss": 7.836571216583252, "eval_runtime": 155.7627, "eval_samples_per_second": 185.68, "eval_steps_per_second": 23.215, "step": 8000 }, { "epoch": 1.24, "learning_rate": 0.00015022541833771265, "loss": 7.6933, "step": 9000 }, { "epoch": 1.24, "eval_accuracy": 0.004494848212433442, "eval_loss": 7.659491062164307, "eval_runtime": 156.4028, "eval_samples_per_second": 184.92, "eval_steps_per_second": 23.12, "step": 9000 }, { "epoch": 1.38, "learning_rate": 0.00014469367998893652, "loss": 7.5808, "step": 10000 }, { "epoch": 1.38, "eval_accuracy": 0.00615448447548579, "eval_loss": 7.523160934448242, "eval_runtime": 155.1944, "eval_samples_per_second": 186.36, "eval_steps_per_second": 23.3, "step": 10000 }, { "epoch": 1.52, "learning_rate": 0.0001391674733785092, "loss": 7.4352, "step": 11000 }, { "epoch": 1.52, "eval_accuracy": 0.00701887836249222, "eval_loss": 7.381638526916504, "eval_runtime": 156.5342, "eval_samples_per_second": 184.765, "eval_steps_per_second": 23.1, "step": 11000 }, { "epoch": 1.66, "learning_rate": 0.0001336357350297331, "loss": 7.3279, "step": 12000 }, { "epoch": 1.66, "eval_accuracy": 0.008436484337182767, "eval_loss": 7.285288333892822, "eval_runtime": 157.1769, "eval_samples_per_second": 184.009, "eval_steps_per_second": 23.006, "step": 12000 }, { "epoch": 1.8, "learning_rate": 0.000128103996680957, "loss": 7.2141, "step": 13000 }, { "epoch": 1.8, "eval_accuracy": 0.010511029665998203, "eval_loss": 7.1552510261535645, "eval_runtime": 155.9751, "eval_samples_per_second": 185.427, "eval_steps_per_second": 23.183, "step": 13000 }, { "epoch": 1.94, "learning_rate": 0.0001225722583321809, "loss": 7.151, "step": 14000 }, { "epoch": 1.94, "eval_accuracy": 0.011859484129728235, "eval_loss": 7.085327625274658, "eval_runtime": 156.2266, "eval_samples_per_second": 185.129, "eval_steps_per_second": 23.146, "step": 14000 }, { "epoch": 2.07, "learning_rate": 0.00011704605172175355, "loss": 6.9695, "step": 15000 }, { "epoch": 2.07, "eval_accuracy": 0.013380817370859553, "eval_loss": 7.008819103240967, "eval_runtime": 155.749, "eval_samples_per_second": 185.696, "eval_steps_per_second": 23.217, "step": 15000 }, { "epoch": 2.21, "learning_rate": 0.00011151984511132624, "loss": 6.8563, "step": 16000 }, { "epoch": 2.21, "eval_accuracy": 0.013934029458543669, "eval_loss": 6.940927982330322, "eval_runtime": 155.6806, "eval_samples_per_second": 185.778, "eval_steps_per_second": 23.227, "step": 16000 }, { "epoch": 2.35, "learning_rate": 0.00010598810676255014, "loss": 6.8019, "step": 17000 }, { "epoch": 2.35, "eval_accuracy": 0.01583569600995782, "eval_loss": 6.863400936126709, "eval_runtime": 156.1188, "eval_samples_per_second": 185.256, "eval_steps_per_second": 23.162, "step": 17000 }, { "epoch": 2.49, "learning_rate": 0.00010045636841377403, "loss": 6.7372, "step": 18000 }, { "epoch": 2.49, "eval_accuracy": 0.017495332273010165, "eval_loss": 6.800116539001465, "eval_runtime": 156.6848, "eval_samples_per_second": 184.587, "eval_steps_per_second": 23.078, "step": 18000 }, { "epoch": 2.63, "learning_rate": 9.492463006499794e-05, "loss": 6.6903, "step": 19000 }, { "epoch": 2.63, "eval_accuracy": 0.019120392780582255, "eval_loss": 6.7322998046875, "eval_runtime": 156.774, "eval_samples_per_second": 184.482, "eval_steps_per_second": 23.065, "step": 19000 }, { "epoch": 2.77, "learning_rate": 8.93984234545706e-05, "loss": 6.6482, "step": 20000 }, { "epoch": 2.77, "eval_accuracy": 0.020710877532674088, "eval_loss": 6.66375732421875, "eval_runtime": 156.4579, "eval_samples_per_second": 184.855, "eval_steps_per_second": 23.112, "step": 20000 }, { "epoch": 2.9, "learning_rate": 8.38666851057945e-05, "loss": 6.5669, "step": 21000 }, { "epoch": 2.9, "eval_accuracy": 0.023891847036857754, "eval_loss": 6.609040260314941, "eval_runtime": 155.2279, "eval_samples_per_second": 186.32, "eval_steps_per_second": 23.295, "step": 21000 }, { "epoch": 3.04, "learning_rate": 7.834047849536717e-05, "loss": 6.4484, "step": 22000 }, { "epoch": 3.04, "eval_accuracy": 0.023995574303298527, "eval_loss": 6.544083595275879, "eval_runtime": 155.967, "eval_samples_per_second": 185.437, "eval_steps_per_second": 23.184, "step": 22000 }, { "epoch": 3.18, "learning_rate": 7.281427188493984e-05, "loss": 6.2568, "step": 23000 }, { "epoch": 3.18, "eval_accuracy": 0.02734942258488348, "eval_loss": 6.501514911651611, "eval_runtime": 156.6432, "eval_samples_per_second": 184.636, "eval_steps_per_second": 23.084, "step": 23000 }, { "epoch": 3.32, "learning_rate": 6.728253353616373e-05, "loss": 6.2452, "step": 24000 }, { "epoch": 3.32, "eval_accuracy": 0.030426664822626376, "eval_loss": 6.458929061889648, "eval_runtime": 156.5343, "eval_samples_per_second": 184.765, "eval_steps_per_second": 23.1, "step": 24000 }, { "epoch": 3.46, "learning_rate": 6.175632692573642e-05, "loss": 6.2002, "step": 25000 }, { "epoch": 3.46, "eval_accuracy": 0.031049028421271004, "eval_loss": 6.431183815002441, "eval_runtime": 156.3543, "eval_samples_per_second": 184.977, "eval_steps_per_second": 23.127, "step": 25000 }, { "epoch": 3.6, "learning_rate": 5.622458857696031e-05, "loss": 6.1699, "step": 26000 }, { "epoch": 3.6, "eval_accuracy": 0.03194799806375769, "eval_loss": 6.372282981872559, "eval_runtime": 156.6121, "eval_samples_per_second": 184.673, "eval_steps_per_second": 23.089, "step": 26000 }, { "epoch": 3.73, "learning_rate": 5.0692850228184205e-05, "loss": 6.1284, "step": 27000 }, { "epoch": 3.73, "eval_accuracy": 0.03429914943641518, "eval_loss": 6.332355976104736, "eval_runtime": 156.1088, "eval_samples_per_second": 185.268, "eval_steps_per_second": 23.163, "step": 27000 }, { "epoch": 3.87, "learning_rate": 4.516664361775688e-05, "loss": 6.1186, "step": 28000 }, { "epoch": 3.87, "eval_accuracy": 0.034956088790540074, "eval_loss": 6.3029093742370605, "eval_runtime": 154.5904, "eval_samples_per_second": 187.088, "eval_steps_per_second": 23.391, "step": 28000 }, { "epoch": 4.01, "learning_rate": 3.963490526898078e-05, "loss": 6.0611, "step": 29000 }, { "epoch": 4.01, "eval_accuracy": 0.03810248253924348, "eval_loss": 6.272293567657471, "eval_runtime": 156.0431, "eval_samples_per_second": 185.346, "eval_steps_per_second": 23.173, "step": 29000 }, { "epoch": 4.15, "learning_rate": 3.410316692020468e-05, "loss": 5.7883, "step": 30000 }, { "epoch": 4.15, "eval_accuracy": 0.03827536131664477, "eval_loss": 6.252718925476074, "eval_runtime": 145.8769, "eval_samples_per_second": 198.263, "eval_steps_per_second": 24.788, "step": 30000 }, { "epoch": 4.29, "learning_rate": 2.8576960309777352e-05, "loss": 5.7684, "step": 31000 }, { "epoch": 4.29, "eval_accuracy": 0.03924348247009197, "eval_loss": 6.218559741973877, "eval_runtime": 146.1199, "eval_samples_per_second": 197.933, "eval_steps_per_second": 24.747, "step": 31000 }, { "epoch": 4.43, "learning_rate": 2.3045221961001246e-05, "loss": 5.7701, "step": 32000 }, { "epoch": 4.43, "eval_accuracy": 0.04031533088997995, "eval_loss": 6.203105926513672, "eval_runtime": 145.5537, "eval_samples_per_second": 198.703, "eval_steps_per_second": 24.843, "step": 32000 }, { "epoch": 4.56, "learning_rate": 1.751901535057392e-05, "loss": 5.7473, "step": 33000 }, { "epoch": 4.56, "eval_accuracy": 0.04304681557292027, "eval_loss": 6.177652359008789, "eval_runtime": 145.7844, "eval_samples_per_second": 198.389, "eval_steps_per_second": 24.804, "step": 33000 }, { "epoch": 4.7, "learning_rate": 1.1987277001797816e-05, "loss": 5.735, "step": 34000 }, { "epoch": 4.7, "eval_accuracy": 0.044187815503768754, "eval_loss": 6.163440704345703, "eval_runtime": 146.1075, "eval_samples_per_second": 197.95, "eval_steps_per_second": 24.749, "step": 34000 }, { "epoch": 4.84, "learning_rate": 6.455538653021713e-06, "loss": 5.7324, "step": 35000 }, { "epoch": 4.84, "eval_accuracy": 0.04429154277020953, "eval_loss": 6.149352073669434, "eval_runtime": 145.8359, "eval_samples_per_second": 198.319, "eval_steps_per_second": 24.795, "step": 35000 }, { "epoch": 4.98, "learning_rate": 9.238003042456093e-07, "loss": 5.6949, "step": 36000 }, { "epoch": 4.98, "eval_accuracy": 0.044844754857893646, "eval_loss": 6.141994476318359, "eval_runtime": 145.8687, "eval_samples_per_second": 198.274, "eval_steps_per_second": 24.789, "step": 36000 }, { "epoch": 5.0, "step": 36155, "total_flos": 9.416417849072317e+19, "train_loss": 6.8843976465667565, "train_runtime": 17474.7904, "train_samples_per_second": 66.203, "train_steps_per_second": 2.069 } ], "max_steps": 36155, "num_train_epochs": 5, "total_flos": 9.416417849072317e+19, "trial_name": null, "trial_params": null }