{ "best_metric": null, "best_model_checkpoint": null, "epoch": 20.92050209205021, "eval_steps": 500, "global_step": 10000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.21, "learning_rate": 5.9401e-05, "loss": 0.3126, "step": 100 }, { "epoch": 0.42, "learning_rate": 5.8802000000000004e-05, "loss": 0.1588, "step": 200 }, { "epoch": 0.63, "learning_rate": 5.8203e-05, "loss": 0.1026, "step": 300 }, { "epoch": 0.84, "learning_rate": 5.7604e-05, "loss": 0.0713, "step": 400 }, { "epoch": 1.0, "eval_accuracy_background": 0.99061704638999, "eval_accuracy_biofilm": NaN, "eval_iou_background": 0.99061704638999, "eval_iou_biofilm": 0.0, "eval_loss": 0.038060422986745834, "eval_mean_accuracy": 0.99061704638999, "eval_mean_iou": 0.495308523194995, "eval_overall_accuracy": 0.99061704638999, "eval_runtime": 20.5844, "eval_samples_per_second": 12.388, "eval_steps_per_second": 1.555, "step": 478 }, { "epoch": 1.05, "learning_rate": 5.7005e-05, "loss": 0.0599, "step": 500 }, { "epoch": 1.26, "learning_rate": 5.6406e-05, "loss": 0.05, "step": 600 }, { "epoch": 1.46, "learning_rate": 5.5806999999999996e-05, "loss": 0.0471, "step": 700 }, { "epoch": 1.67, "learning_rate": 5.5208000000000004e-05, "loss": 0.0435, "step": 800 }, { "epoch": 1.88, "learning_rate": 5.4609000000000005e-05, "loss": 0.044, "step": 900 }, { "epoch": 2.0, "eval_accuracy_background": 0.99493468531224, "eval_accuracy_biofilm": NaN, "eval_iou_background": 0.99493468531224, "eval_iou_biofilm": 0.0, "eval_loss": 0.020206088200211525, "eval_mean_accuracy": 0.99493468531224, "eval_mean_iou": 0.49746734265612, "eval_overall_accuracy": 0.99493468531224, "eval_runtime": 20.9376, "eval_samples_per_second": 12.179, "eval_steps_per_second": 1.528, "step": 956 }, { "epoch": 2.09, "learning_rate": 5.401e-05, "loss": 0.0486, "step": 1000 }, { "epoch": 2.3, "learning_rate": 5.3411e-05, "loss": 0.042, "step": 1100 }, { "epoch": 2.51, "learning_rate": 5.2812e-05, "loss": 0.0378, "step": 1200 }, { "epoch": 2.72, "learning_rate": 5.2213e-05, "loss": 0.0429, "step": 1300 }, { "epoch": 2.93, "learning_rate": 5.1614000000000004e-05, "loss": 0.041, "step": 1400 }, { "epoch": 3.0, "eval_accuracy_background": 0.9944646370264222, "eval_accuracy_biofilm": NaN, "eval_iou_background": 0.9944646370264222, "eval_iou_biofilm": 0.0, "eval_loss": 0.01811068318784237, "eval_mean_accuracy": 0.9944646370264222, "eval_mean_iou": 0.4972323185132111, "eval_overall_accuracy": 0.9944646370264222, "eval_runtime": 20.8434, "eval_samples_per_second": 12.234, "eval_steps_per_second": 1.535, "step": 1434 }, { "epoch": 3.14, "learning_rate": 5.1015e-05, "loss": 0.0348, "step": 1500 }, { "epoch": 3.35, "learning_rate": 5.0416e-05, "loss": 0.0338, "step": 1600 }, { "epoch": 3.56, "learning_rate": 4.9817e-05, "loss": 0.0378, "step": 1700 }, { "epoch": 3.77, "learning_rate": 4.9218e-05, "loss": 0.0316, "step": 1800 }, { "epoch": 3.97, "learning_rate": 4.8619e-05, "loss": 0.0361, "step": 1900 }, { "epoch": 4.0, "eval_accuracy_background": 0.9925826278137663, "eval_accuracy_biofilm": NaN, "eval_iou_background": 0.9925826278137663, "eval_iou_biofilm": 0.0, "eval_loss": 0.020319059491157532, "eval_mean_accuracy": 0.9925826278137663, "eval_mean_iou": 0.49629131390688314, "eval_overall_accuracy": 0.9925826278137663, "eval_runtime": 21.9308, "eval_samples_per_second": 11.627, "eval_steps_per_second": 1.459, "step": 1912 }, { "epoch": 4.18, "learning_rate": 4.8020000000000004e-05, "loss": 0.0302, "step": 2000 }, { "epoch": 4.39, "learning_rate": 4.7421000000000006e-05, "loss": 0.0303, "step": 2100 }, { "epoch": 4.6, "learning_rate": 4.6822e-05, "loss": 0.0344, "step": 2200 }, { "epoch": 4.81, "learning_rate": 4.6223e-05, "loss": 0.0357, "step": 2300 }, { "epoch": 5.0, "eval_accuracy_background": 0.9941524381895419, "eval_accuracy_biofilm": NaN, "eval_iou_background": 0.9941524381895419, "eval_iou_biofilm": 0.0, "eval_loss": 0.01632993295788765, "eval_mean_accuracy": 0.9941524381895419, "eval_mean_iou": 0.49707621909477095, "eval_overall_accuracy": 0.9941524381895419, "eval_runtime": 21.4286, "eval_samples_per_second": 11.9, "eval_steps_per_second": 1.493, "step": 2390 }, { "epoch": 5.02, "learning_rate": 4.5624e-05, "loss": 0.0258, "step": 2400 }, { "epoch": 5.23, "learning_rate": 4.5025000000000003e-05, "loss": 0.0278, "step": 2500 }, { "epoch": 5.44, "learning_rate": 4.4426000000000005e-05, "loss": 0.0317, "step": 2600 }, { "epoch": 5.65, "learning_rate": 4.3827e-05, "loss": 0.0286, "step": 2700 }, { "epoch": 5.86, "learning_rate": 4.3228e-05, "loss": 0.0336, "step": 2800 }, { "epoch": 6.0, "eval_accuracy_background": 0.9915140030588883, "eval_accuracy_biofilm": NaN, "eval_iou_background": 0.9915140030588883, "eval_iou_biofilm": 0.0, "eval_loss": 0.03403358906507492, "eval_mean_accuracy": 0.9915140030588883, "eval_mean_iou": 0.49575700152944413, "eval_overall_accuracy": 0.9915140030588883, "eval_runtime": 21.1945, "eval_samples_per_second": 12.031, "eval_steps_per_second": 1.51, "step": 2868 }, { "epoch": 6.07, "learning_rate": 4.2629e-05, "loss": 0.035, "step": 2900 }, { "epoch": 6.28, "learning_rate": 4.203e-05, "loss": 0.0262, "step": 3000 }, { "epoch": 6.49, "learning_rate": 4.1431e-05, "loss": 0.0293, "step": 3100 }, { "epoch": 6.69, "learning_rate": 4.0832e-05, "loss": 0.0291, "step": 3200 }, { "epoch": 6.9, "learning_rate": 4.0233e-05, "loss": 0.0295, "step": 3300 }, { "epoch": 7.0, "eval_accuracy_background": 0.9955253040954527, "eval_accuracy_biofilm": NaN, "eval_iou_background": 0.9955253040954527, "eval_iou_biofilm": 0.0, "eval_loss": 0.012596790678799152, "eval_mean_accuracy": 0.9955253040954527, "eval_mean_iou": 0.49776265204772635, "eval_overall_accuracy": 0.9955253040954527, "eval_runtime": 21.3112, "eval_samples_per_second": 11.966, "eval_steps_per_second": 1.502, "step": 3346 }, { "epoch": 7.11, "learning_rate": 3.9634e-05, "loss": 0.0372, "step": 3400 }, { "epoch": 7.32, "learning_rate": 3.9035e-05, "loss": 0.0282, "step": 3500 }, { "epoch": 7.53, "learning_rate": 3.8436e-05, "loss": 0.0302, "step": 3600 }, { "epoch": 7.74, "learning_rate": 3.7837000000000004e-05, "loss": 0.0318, "step": 3700 }, { "epoch": 7.95, "learning_rate": 3.7238000000000005e-05, "loss": 0.0251, "step": 3800 }, { "epoch": 8.0, "eval_accuracy_background": 0.9914670494104436, "eval_accuracy_biofilm": NaN, "eval_iou_background": 0.9914670494104436, "eval_iou_biofilm": 0.0, "eval_loss": 0.022036196663975716, "eval_mean_accuracy": 0.9914670494104436, "eval_mean_iou": 0.4957335247052218, "eval_overall_accuracy": 0.9914670494104436, "eval_runtime": 21.5063, "eval_samples_per_second": 11.857, "eval_steps_per_second": 1.488, "step": 3824 }, { "epoch": 8.16, "learning_rate": 3.6639e-05, "loss": 0.0249, "step": 3900 }, { "epoch": 8.37, "learning_rate": 3.604e-05, "loss": 0.0325, "step": 4000 }, { "epoch": 8.58, "learning_rate": 3.544100000000001e-05, "loss": 0.0296, "step": 4100 }, { "epoch": 8.79, "learning_rate": 3.4842e-05, "loss": 0.0265, "step": 4200 }, { "epoch": 9.0, "learning_rate": 3.4243000000000004e-05, "loss": 0.0265, "step": 4300 }, { "epoch": 9.0, "eval_accuracy_background": 0.9932536159220945, "eval_accuracy_biofilm": NaN, "eval_iou_background": 0.9932536159220945, "eval_iou_biofilm": 0.0, "eval_loss": 0.01821214146912098, "eval_mean_accuracy": 0.9932536159220945, "eval_mean_iou": 0.49662680796104725, "eval_overall_accuracy": 0.9932536159220945, "eval_runtime": 21.4325, "eval_samples_per_second": 11.898, "eval_steps_per_second": 1.493, "step": 4302 }, { "epoch": 9.21, "learning_rate": 3.3644000000000005e-05, "loss": 0.0294, "step": 4400 }, { "epoch": 9.41, "learning_rate": 3.3045000000000006e-05, "loss": 0.0246, "step": 4500 }, { "epoch": 9.62, "learning_rate": 3.2446e-05, "loss": 0.0253, "step": 4600 }, { "epoch": 9.83, "learning_rate": 3.1847e-05, "loss": 0.0238, "step": 4700 }, { "epoch": 10.0, "eval_accuracy_background": 0.9940080441637696, "eval_accuracy_biofilm": NaN, "eval_iou_background": 0.9940080441637696, "eval_iou_biofilm": 0.0, "eval_loss": 0.015465262345969677, "eval_mean_accuracy": 0.9940080441637696, "eval_mean_iou": 0.4970040220818848, "eval_overall_accuracy": 0.9940080441637696, "eval_runtime": 22.1026, "eval_samples_per_second": 11.537, "eval_steps_per_second": 1.448, "step": 4780 }, { "epoch": 10.04, "learning_rate": 3.1248e-05, "loss": 0.0262, "step": 4800 }, { "epoch": 10.25, "learning_rate": 3.0649000000000004e-05, "loss": 0.0253, "step": 4900 }, { "epoch": 10.46, "learning_rate": 3.0050000000000002e-05, "loss": 0.0266, "step": 5000 }, { "epoch": 10.67, "learning_rate": 2.9451e-05, "loss": 0.028, "step": 5100 }, { "epoch": 10.88, "learning_rate": 2.8851999999999998e-05, "loss": 0.0258, "step": 5200 }, { "epoch": 11.0, "eval_accuracy_background": 0.9931246419763669, "eval_accuracy_biofilm": NaN, "eval_iou_background": 0.9931246419763669, "eval_iou_biofilm": 0.0, "eval_loss": 0.01807301491498947, "eval_mean_accuracy": 0.9931246419763669, "eval_mean_iou": 0.4965623209881834, "eval_overall_accuracy": 0.9931246419763669, "eval_runtime": 21.5251, "eval_samples_per_second": 11.847, "eval_steps_per_second": 1.487, "step": 5258 }, { "epoch": 11.09, "learning_rate": 2.8253e-05, "loss": 0.0228, "step": 5300 }, { "epoch": 11.3, "learning_rate": 2.7653999999999996e-05, "loss": 0.0246, "step": 5400 }, { "epoch": 11.51, "learning_rate": 2.7054999999999998e-05, "loss": 0.0262, "step": 5500 }, { "epoch": 11.72, "learning_rate": 2.6455999999999995e-05, "loss": 0.0306, "step": 5600 }, { "epoch": 11.92, "learning_rate": 2.5857e-05, "loss": 0.0264, "step": 5700 }, { "epoch": 12.0, "eval_accuracy_background": 0.9937508887389549, "eval_accuracy_biofilm": NaN, "eval_iou_background": 0.9937508887389549, "eval_iou_biofilm": 0.0, "eval_loss": 0.01792028360068798, "eval_mean_accuracy": 0.9937508887389549, "eval_mean_iou": 0.49687544436947745, "eval_overall_accuracy": 0.9937508887389549, "eval_runtime": 21.5267, "eval_samples_per_second": 11.846, "eval_steps_per_second": 1.487, "step": 5736 }, { "epoch": 12.13, "learning_rate": 2.5258e-05, "loss": 0.028, "step": 5800 }, { "epoch": 12.34, "learning_rate": 2.4659e-05, "loss": 0.0268, "step": 5900 }, { "epoch": 12.55, "learning_rate": 2.406e-05, "loss": 0.0266, "step": 6000 }, { "epoch": 12.76, "learning_rate": 2.3460999999999998e-05, "loss": 0.0242, "step": 6100 }, { "epoch": 12.97, "learning_rate": 2.2862e-05, "loss": 0.0265, "step": 6200 }, { "epoch": 13.0, "eval_accuracy_background": 0.991736174383473, "eval_accuracy_biofilm": NaN, "eval_iou_background": 0.991736174383473, "eval_iou_biofilm": 0.0, "eval_loss": 0.022188672795891762, "eval_mean_accuracy": 0.991736174383473, "eval_mean_iou": 0.4958680871917365, "eval_overall_accuracy": 0.991736174383473, "eval_runtime": 22.1635, "eval_samples_per_second": 11.505, "eval_steps_per_second": 1.444, "step": 6214 }, { "epoch": 13.18, "learning_rate": 2.2263e-05, "loss": 0.0233, "step": 6300 }, { "epoch": 13.39, "learning_rate": 2.1663999999999998e-05, "loss": 0.0232, "step": 6400 }, { "epoch": 13.6, "learning_rate": 2.1065e-05, "loss": 0.0311, "step": 6500 }, { "epoch": 13.81, "learning_rate": 2.0465999999999997e-05, "loss": 0.0219, "step": 6600 }, { "epoch": 14.0, "eval_accuracy_background": 0.9924663828634505, "eval_accuracy_biofilm": NaN, "eval_iou_background": 0.9924663828634505, "eval_iou_biofilm": 0.0, "eval_loss": 0.020027143880724907, "eval_mean_accuracy": 0.9924663828634505, "eval_mean_iou": 0.49623319143172523, "eval_overall_accuracy": 0.9924663828634505, "eval_runtime": 22.2537, "eval_samples_per_second": 11.459, "eval_steps_per_second": 1.438, "step": 6692 }, { "epoch": 14.02, "learning_rate": 1.9866999999999998e-05, "loss": 0.0234, "step": 6700 }, { "epoch": 14.23, "learning_rate": 1.9267999999999996e-05, "loss": 0.0281, "step": 6800 }, { "epoch": 14.44, "learning_rate": 1.8669e-05, "loss": 0.0243, "step": 6900 }, { "epoch": 14.64, "learning_rate": 1.807e-05, "loss": 0.0238, "step": 7000 }, { "epoch": 14.85, "learning_rate": 1.7471e-05, "loss": 0.0213, "step": 7100 }, { "epoch": 15.0, "eval_accuracy_background": 0.9916155213374698, "eval_accuracy_biofilm": NaN, "eval_iou_background": 0.9916155213374698, "eval_iou_biofilm": 0.0, "eval_loss": 0.023391906172037125, "eval_mean_accuracy": 0.9916155213374698, "eval_mean_iou": 0.4958077606687349, "eval_overall_accuracy": 0.9916155213374698, "eval_runtime": 21.7106, "eval_samples_per_second": 11.745, "eval_steps_per_second": 1.474, "step": 7170 }, { "epoch": 15.06, "learning_rate": 1.6872e-05, "loss": 0.0231, "step": 7200 }, { "epoch": 15.27, "learning_rate": 1.6272999999999998e-05, "loss": 0.0252, "step": 7300 }, { "epoch": 15.48, "learning_rate": 1.5674e-05, "loss": 0.024, "step": 7400 }, { "epoch": 15.69, "learning_rate": 1.5075000000000002e-05, "loss": 0.0205, "step": 7500 }, { "epoch": 15.9, "learning_rate": 1.4476e-05, "loss": 0.0192, "step": 7600 }, { "epoch": 16.0, "eval_accuracy_background": 0.9922337608850452, "eval_accuracy_biofilm": NaN, "eval_iou_background": 0.9922337608850452, "eval_iou_biofilm": 0.0, "eval_loss": 0.019924867898225784, "eval_mean_accuracy": 0.9922337608850452, "eval_mean_iou": 0.4961168804425226, "eval_overall_accuracy": 0.9922337608850452, "eval_runtime": 21.6803, "eval_samples_per_second": 11.762, "eval_steps_per_second": 1.476, "step": 7648 }, { "epoch": 16.11, "learning_rate": 1.3877e-05, "loss": 0.0234, "step": 7700 }, { "epoch": 16.32, "learning_rate": 1.3277999999999999e-05, "loss": 0.0244, "step": 7800 }, { "epoch": 16.53, "learning_rate": 1.2678999999999998e-05, "loss": 0.0187, "step": 7900 }, { "epoch": 16.74, "learning_rate": 1.2079999999999998e-05, "loss": 0.0232, "step": 8000 }, { "epoch": 16.95, "learning_rate": 1.1480999999999997e-05, "loss": 0.0232, "step": 8100 }, { "epoch": 17.0, "eval_accuracy_background": 0.9922697355685758, "eval_accuracy_biofilm": NaN, "eval_iou_background": 0.9922697355685758, "eval_iou_biofilm": 0.0, "eval_loss": 0.020755073055624962, "eval_mean_accuracy": 0.9922697355685758, "eval_mean_iou": 0.4961348677842879, "eval_overall_accuracy": 0.9922697355685758, "eval_runtime": 21.7178, "eval_samples_per_second": 11.742, "eval_steps_per_second": 1.473, "step": 8126 }, { "epoch": 17.15, "learning_rate": 1.0882000000000004e-05, "loss": 0.0256, "step": 8200 }, { "epoch": 17.36, "learning_rate": 1.0283000000000003e-05, "loss": 0.0195, "step": 8300 }, { "epoch": 17.57, "learning_rate": 9.684000000000002e-06, "loss": 0.0212, "step": 8400 }, { "epoch": 17.78, "learning_rate": 9.085000000000002e-06, "loss": 0.023, "step": 8500 }, { "epoch": 17.99, "learning_rate": 8.486000000000001e-06, "loss": 0.0219, "step": 8600 }, { "epoch": 18.0, "eval_accuracy_background": 0.9909196860980203, "eval_accuracy_biofilm": NaN, "eval_iou_background": 0.9909196860980203, "eval_iou_biofilm": 0.0, "eval_loss": 0.02454926259815693, "eval_mean_accuracy": 0.9909196860980203, "eval_mean_iou": 0.49545984304901014, "eval_overall_accuracy": 0.9909196860980203, "eval_runtime": 22.2518, "eval_samples_per_second": 11.46, "eval_steps_per_second": 1.438, "step": 8604 }, { "epoch": 18.2, "learning_rate": 7.887000000000001e-06, "loss": 0.0223, "step": 8700 }, { "epoch": 18.41, "learning_rate": 7.2879999999999995e-06, "loss": 0.0249, "step": 8800 }, { "epoch": 18.62, "learning_rate": 6.688999999999999e-06, "loss": 0.0259, "step": 8900 }, { "epoch": 18.83, "learning_rate": 6.0899999999999984e-06, "loss": 0.0201, "step": 9000 }, { "epoch": 19.0, "eval_accuracy_background": 0.9921929323433422, "eval_accuracy_biofilm": NaN, "eval_iou_background": 0.9921929323433422, "eval_iou_biofilm": 0.0, "eval_loss": 0.021141713485121727, "eval_mean_accuracy": 0.9921929323433422, "eval_mean_iou": 0.4960964661716711, "eval_overall_accuracy": 0.9921929323433422, "eval_runtime": 22.2034, "eval_samples_per_second": 11.485, "eval_steps_per_second": 1.441, "step": 9082 }, { "epoch": 19.04, "learning_rate": 5.490999999999998e-06, "loss": 0.0263, "step": 9100 }, { "epoch": 19.25, "learning_rate": 4.891999999999997e-06, "loss": 0.0246, "step": 9200 }, { "epoch": 19.46, "learning_rate": 4.292999999999997e-06, "loss": 0.0176, "step": 9300 }, { "epoch": 19.67, "learning_rate": 3.694000000000003e-06, "loss": 0.0185, "step": 9400 }, { "epoch": 19.87, "learning_rate": 3.0950000000000026e-06, "loss": 0.0192, "step": 9500 }, { "epoch": 20.0, "eval_accuracy_background": 0.9923248780389713, "eval_accuracy_biofilm": NaN, "eval_iou_background": 0.9923248780389713, "eval_iou_biofilm": 0.0, "eval_loss": 0.020733820274472237, "eval_mean_accuracy": 0.9923248780389713, "eval_mean_iou": 0.49616243901948565, "eval_overall_accuracy": 0.9923248780389713, "eval_runtime": 21.616, "eval_samples_per_second": 11.797, "eval_steps_per_second": 1.48, "step": 9560 }, { "epoch": 20.08, "learning_rate": 2.496000000000002e-06, "loss": 0.0242, "step": 9600 }, { "epoch": 20.29, "learning_rate": 1.8970000000000013e-06, "loss": 0.0194, "step": 9700 }, { "epoch": 20.5, "learning_rate": 1.298000000000001e-06, "loss": 0.021, "step": 9800 }, { "epoch": 20.71, "learning_rate": 6.990000000000005e-07, "loss": 0.0233, "step": 9900 }, { "epoch": 20.92, "learning_rate": 1e-07, "loss": 0.0175, "step": 10000 }, { "epoch": 20.92, "eval_accuracy_background": 0.9922576669620311, "eval_accuracy_biofilm": NaN, "eval_iou_background": 0.9922576669620311, "eval_iou_biofilm": 0.0, "eval_loss": 0.020812883973121643, "eval_mean_accuracy": 0.9922576669620311, "eval_mean_iou": 0.49612883348101555, "eval_overall_accuracy": 0.9922576669620311, "eval_runtime": 21.7462, "eval_samples_per_second": 11.726, "eval_steps_per_second": 1.472, "step": 10000 }, { "epoch": 20.92, "step": 10000, "total_flos": 1.4004836461707264e+18, "train_loss": 0.03354803665876389, "train_runtime": 13691.4846, "train_samples_per_second": 5.843, "train_steps_per_second": 0.73 } ], "logging_steps": 100, "max_steps": 10000, "num_input_tokens_seen": 0, "num_train_epochs": 21, "save_steps": 500, "total_flos": 1.4004836461707264e+18, "train_batch_size": 8, "trial_name": null, "trial_params": null }