| { |
| "best_global_step": null, |
| "best_metric": null, |
| "best_model_checkpoint": null, |
| "epoch": 7.0, |
| "eval_steps": 500, |
| "global_step": 6657, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.005257623554153523, |
| "grad_norm": 9.867259040646717, |
| "learning_rate": 2.4024024024024026e-07, |
| "loss": 0.5972, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.539029061794281, |
| "step": 5, |
| "valid_targets_mean": 3146.7, |
| "valid_targets_min": 458 |
| }, |
| { |
| "epoch": 0.010515247108307046, |
| "grad_norm": 10.555090609046745, |
| "learning_rate": 5.405405405405406e-07, |
| "loss": 0.5131, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5360751152038574, |
| "step": 10, |
| "valid_targets_mean": 3025.6, |
| "valid_targets_min": 1024 |
| }, |
| { |
| "epoch": 0.015772870662460567, |
| "grad_norm": 8.803369549883405, |
| "learning_rate": 8.40840840840841e-07, |
| "loss": 0.4577, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4426497220993042, |
| "step": 15, |
| "valid_targets_mean": 3472.4, |
| "valid_targets_min": 2068 |
| }, |
| { |
| "epoch": 0.02103049421661409, |
| "grad_norm": 8.408275835403625, |
| "learning_rate": 1.1411411411411411e-06, |
| "loss": 0.5083, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4752780795097351, |
| "step": 20, |
| "valid_targets_mean": 3615.2, |
| "valid_targets_min": 2425 |
| }, |
| { |
| "epoch": 0.026288117770767613, |
| "grad_norm": 7.132840466505841, |
| "learning_rate": 1.4414414414414416e-06, |
| "loss": 0.4528, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4682956635951996, |
| "step": 25, |
| "valid_targets_mean": 2989.8, |
| "valid_targets_min": 1134 |
| }, |
| { |
| "epoch": 0.031545741324921134, |
| "grad_norm": 8.834455379215875, |
| "learning_rate": 1.7417417417417418e-06, |
| "loss": 0.5214, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.7035055756568909, |
| "step": 30, |
| "valid_targets_mean": 1482.1, |
| "valid_targets_min": 663 |
| }, |
| { |
| "epoch": 0.03680336487907466, |
| "grad_norm": 4.258834493231341, |
| "learning_rate": 2.0420420420420424e-06, |
| "loss": 0.677, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41128450632095337, |
| "step": 35, |
| "valid_targets_mean": 3055.2, |
| "valid_targets_min": 535 |
| }, |
| { |
| "epoch": 0.04206098843322818, |
| "grad_norm": 3.9762259977256713, |
| "learning_rate": 2.3423423423423424e-06, |
| "loss": 0.3983, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4739842712879181, |
| "step": 40, |
| "valid_targets_mean": 2707.1, |
| "valid_targets_min": 781 |
| }, |
| { |
| "epoch": 0.0473186119873817, |
| "grad_norm": 2.4777552084967, |
| "learning_rate": 2.642642642642643e-06, |
| "loss": 0.4041, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29039710760116577, |
| "step": 45, |
| "valid_targets_mean": 3210.4, |
| "valid_targets_min": 799 |
| }, |
| { |
| "epoch": 0.052576235541535225, |
| "grad_norm": 1.8104974716909379, |
| "learning_rate": 2.942942942942943e-06, |
| "loss": 0.3278, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2590543031692505, |
| "step": 50, |
| "valid_targets_mean": 4841.1, |
| "valid_targets_min": 2802 |
| }, |
| { |
| "epoch": 0.05783385909568875, |
| "grad_norm": 1.261987719529698, |
| "learning_rate": 3.2432432432432437e-06, |
| "loss": 0.2727, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27704891562461853, |
| "step": 55, |
| "valid_targets_mean": 3151.8, |
| "valid_targets_min": 574 |
| }, |
| { |
| "epoch": 0.06309148264984227, |
| "grad_norm": 1.0825036780996253, |
| "learning_rate": 3.5435435435435437e-06, |
| "loss": 0.2914, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28223657608032227, |
| "step": 60, |
| "valid_targets_mean": 3383.4, |
| "valid_targets_min": 813 |
| }, |
| { |
| "epoch": 0.0683491062039958, |
| "grad_norm": 1.589616045570128, |
| "learning_rate": 3.843843843843844e-06, |
| "loss": 0.2895, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36726120114326477, |
| "step": 65, |
| "valid_targets_mean": 1778.0, |
| "valid_targets_min": 593 |
| }, |
| { |
| "epoch": 0.07360672975814932, |
| "grad_norm": 0.8091453317093126, |
| "learning_rate": 4.1441441441441446e-06, |
| "loss": 0.3116, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25980067253112793, |
| "step": 70, |
| "valid_targets_mean": 3196.0, |
| "valid_targets_min": 1185 |
| }, |
| { |
| "epoch": 0.07886435331230283, |
| "grad_norm": 1.0091602304337675, |
| "learning_rate": 4.444444444444444e-06, |
| "loss": 0.2505, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30630600452423096, |
| "step": 75, |
| "valid_targets_mean": 2149.3, |
| "valid_targets_min": 376 |
| }, |
| { |
| "epoch": 0.08412197686645637, |
| "grad_norm": 0.7459003453913727, |
| "learning_rate": 4.7447447447447454e-06, |
| "loss": 0.2466, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17534321546554565, |
| "step": 80, |
| "valid_targets_mean": 2858.6, |
| "valid_targets_min": 910 |
| }, |
| { |
| "epoch": 0.08937960042060988, |
| "grad_norm": 0.6160013033228736, |
| "learning_rate": 5.045045045045045e-06, |
| "loss": 0.2111, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20561343431472778, |
| "step": 85, |
| "valid_targets_mean": 3631.7, |
| "valid_targets_min": 2798 |
| }, |
| { |
| "epoch": 0.0946372239747634, |
| "grad_norm": 0.775393624677666, |
| "learning_rate": 5.345345345345346e-06, |
| "loss": 0.2564, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24255871772766113, |
| "step": 90, |
| "valid_targets_mean": 2579.2, |
| "valid_targets_min": 471 |
| }, |
| { |
| "epoch": 0.09989484752891693, |
| "grad_norm": 1.1635835559487857, |
| "learning_rate": 5.645645645645647e-06, |
| "loss": 0.2456, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23936918377876282, |
| "step": 95, |
| "valid_targets_mean": 2538.1, |
| "valid_targets_min": 592 |
| }, |
| { |
| "epoch": 0.10515247108307045, |
| "grad_norm": 0.607061488866305, |
| "learning_rate": 5.945945945945947e-06, |
| "loss": 0.2357, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2112111747264862, |
| "step": 100, |
| "valid_targets_mean": 3127.5, |
| "valid_targets_min": 474 |
| }, |
| { |
| "epoch": 0.11041009463722397, |
| "grad_norm": 0.6321253786967143, |
| "learning_rate": 6.246246246246247e-06, |
| "loss": 0.23, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1985323131084442, |
| "step": 105, |
| "valid_targets_mean": 3146.4, |
| "valid_targets_min": 511 |
| }, |
| { |
| "epoch": 0.1156677181913775, |
| "grad_norm": 0.5627310246698635, |
| "learning_rate": 6.546546546546547e-06, |
| "loss": 0.2671, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17968815565109253, |
| "step": 110, |
| "valid_targets_mean": 3607.5, |
| "valid_targets_min": 902 |
| }, |
| { |
| "epoch": 0.12092534174553102, |
| "grad_norm": 0.5955950659118245, |
| "learning_rate": 6.846846846846848e-06, |
| "loss": 0.193, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19982632994651794, |
| "step": 115, |
| "valid_targets_mean": 3110.1, |
| "valid_targets_min": 1643 |
| }, |
| { |
| "epoch": 0.12618296529968454, |
| "grad_norm": 1.3147756039855116, |
| "learning_rate": 7.147147147147148e-06, |
| "loss": 0.2701, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3530358672142029, |
| "step": 120, |
| "valid_targets_mean": 1258.1, |
| "valid_targets_min": 534 |
| }, |
| { |
| "epoch": 0.13144058885383805, |
| "grad_norm": 0.819628422589212, |
| "learning_rate": 7.447447447447448e-06, |
| "loss": 0.2455, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26167190074920654, |
| "step": 125, |
| "valid_targets_mean": 2217.8, |
| "valid_targets_min": 568 |
| }, |
| { |
| "epoch": 0.1366982124079916, |
| "grad_norm": 0.6036534069669649, |
| "learning_rate": 7.747747747747749e-06, |
| "loss": 0.1923, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15864881873130798, |
| "step": 130, |
| "valid_targets_mean": 3244.5, |
| "valid_targets_min": 895 |
| }, |
| { |
| "epoch": 0.14195583596214512, |
| "grad_norm": 1.1567577235641096, |
| "learning_rate": 8.048048048048048e-06, |
| "loss": 0.3608, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5327928066253662, |
| "step": 135, |
| "valid_targets_mean": 2774.1, |
| "valid_targets_min": 652 |
| }, |
| { |
| "epoch": 0.14721345951629863, |
| "grad_norm": 0.6365608983596328, |
| "learning_rate": 8.348348348348348e-06, |
| "loss": 0.3191, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20512095093727112, |
| "step": 140, |
| "valid_targets_mean": 2957.4, |
| "valid_targets_min": 756 |
| }, |
| { |
| "epoch": 0.15247108307045215, |
| "grad_norm": 0.5269954458002594, |
| "learning_rate": 8.64864864864865e-06, |
| "loss": 0.2075, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15970279276371002, |
| "step": 145, |
| "valid_targets_mean": 3300.6, |
| "valid_targets_min": 1332 |
| }, |
| { |
| "epoch": 0.15772870662460567, |
| "grad_norm": 1.3335308368913497, |
| "learning_rate": 8.94894894894895e-06, |
| "loss": 0.2902, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5741272568702698, |
| "step": 150, |
| "valid_targets_mean": 2650.0, |
| "valid_targets_min": 1153 |
| }, |
| { |
| "epoch": 0.16298633017875921, |
| "grad_norm": 0.40986378635288123, |
| "learning_rate": 9.24924924924925e-06, |
| "loss": 0.2039, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1293731927871704, |
| "step": 155, |
| "valid_targets_mean": 3956.4, |
| "valid_targets_min": 636 |
| }, |
| { |
| "epoch": 0.16824395373291273, |
| "grad_norm": 0.47731719302104003, |
| "learning_rate": 9.54954954954955e-06, |
| "loss": 0.1717, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15799108147621155, |
| "step": 160, |
| "valid_targets_mean": 4346.1, |
| "valid_targets_min": 789 |
| }, |
| { |
| "epoch": 0.17350157728706625, |
| "grad_norm": 0.5190209275915764, |
| "learning_rate": 9.849849849849851e-06, |
| "loss": 0.1868, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20154370367527008, |
| "step": 165, |
| "valid_targets_mean": 3998.4, |
| "valid_targets_min": 995 |
| }, |
| { |
| "epoch": 0.17875920084121977, |
| "grad_norm": 0.5394967825763323, |
| "learning_rate": 1.015015015015015e-05, |
| "loss": 0.1718, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14971879124641418, |
| "step": 170, |
| "valid_targets_mean": 2673.9, |
| "valid_targets_min": 488 |
| }, |
| { |
| "epoch": 0.18401682439537329, |
| "grad_norm": 0.536862437321639, |
| "learning_rate": 1.0450450450450452e-05, |
| "loss": 0.1786, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17659367620944977, |
| "step": 175, |
| "valid_targets_mean": 3398.1, |
| "valid_targets_min": 829 |
| }, |
| { |
| "epoch": 0.1892744479495268, |
| "grad_norm": 0.792326697507481, |
| "learning_rate": 1.0750750750750751e-05, |
| "loss": 0.1668, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19177758693695068, |
| "step": 180, |
| "valid_targets_mean": 1999.6, |
| "valid_targets_min": 712 |
| }, |
| { |
| "epoch": 0.19453207150368035, |
| "grad_norm": 0.4832811881573537, |
| "learning_rate": 1.1051051051051051e-05, |
| "loss": 0.1658, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14447200298309326, |
| "step": 185, |
| "valid_targets_mean": 3241.9, |
| "valid_targets_min": 1770 |
| }, |
| { |
| "epoch": 0.19978969505783387, |
| "grad_norm": 0.5191903271061198, |
| "learning_rate": 1.1351351351351352e-05, |
| "loss": 0.148, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15642067790031433, |
| "step": 190, |
| "valid_targets_mean": 3626.0, |
| "valid_targets_min": 2141 |
| }, |
| { |
| "epoch": 0.20504731861198738, |
| "grad_norm": 0.48773669138972087, |
| "learning_rate": 1.1651651651651652e-05, |
| "loss": 0.235, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12580087780952454, |
| "step": 195, |
| "valid_targets_mean": 3509.4, |
| "valid_targets_min": 772 |
| }, |
| { |
| "epoch": 0.2103049421661409, |
| "grad_norm": 0.5559837256351672, |
| "learning_rate": 1.1951951951951951e-05, |
| "loss": 0.1404, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14926278591156006, |
| "step": 200, |
| "valid_targets_mean": 3345.5, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 0.21556256572029442, |
| "grad_norm": 0.45421761703657215, |
| "learning_rate": 1.2252252252252253e-05, |
| "loss": 0.152, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12437152862548828, |
| "step": 205, |
| "valid_targets_mean": 3691.8, |
| "valid_targets_min": 2535 |
| }, |
| { |
| "epoch": 0.22082018927444794, |
| "grad_norm": 0.5334731587131958, |
| "learning_rate": 1.2552552552552552e-05, |
| "loss": 0.1535, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16034381091594696, |
| "step": 210, |
| "valid_targets_mean": 3218.2, |
| "valid_targets_min": 792 |
| }, |
| { |
| "epoch": 0.22607781282860148, |
| "grad_norm": 0.9110721799975048, |
| "learning_rate": 1.2852852852852854e-05, |
| "loss": 0.1789, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2076105773448944, |
| "step": 215, |
| "valid_targets_mean": 1420.5, |
| "valid_targets_min": 490 |
| }, |
| { |
| "epoch": 0.231335436382755, |
| "grad_norm": 0.4752355755197842, |
| "learning_rate": 1.3153153153153155e-05, |
| "loss": 0.1989, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15308931469917297, |
| "step": 220, |
| "valid_targets_mean": 3622.2, |
| "valid_targets_min": 1196 |
| }, |
| { |
| "epoch": 0.23659305993690852, |
| "grad_norm": 0.7658853879953997, |
| "learning_rate": 1.3453453453453456e-05, |
| "loss": 0.2099, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20712979137897491, |
| "step": 225, |
| "valid_targets_mean": 1924.2, |
| "valid_targets_min": 575 |
| }, |
| { |
| "epoch": 0.24185068349106204, |
| "grad_norm": 0.677218415791282, |
| "learning_rate": 1.3753753753753756e-05, |
| "loss": 0.1784, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17075490951538086, |
| "step": 230, |
| "valid_targets_mean": 2185.2, |
| "valid_targets_min": 524 |
| }, |
| { |
| "epoch": 0.24710830704521555, |
| "grad_norm": 0.6349159756624928, |
| "learning_rate": 1.4054054054054055e-05, |
| "loss": 0.2006, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18034519255161285, |
| "step": 235, |
| "valid_targets_mean": 2365.2, |
| "valid_targets_min": 542 |
| }, |
| { |
| "epoch": 0.25236593059936907, |
| "grad_norm": 0.7051405943756438, |
| "learning_rate": 1.4354354354354357e-05, |
| "loss": 0.2091, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1475905478000641, |
| "step": 240, |
| "valid_targets_mean": 2925.8, |
| "valid_targets_min": 803 |
| }, |
| { |
| "epoch": 0.2576235541535226, |
| "grad_norm": 0.6253098139492942, |
| "learning_rate": 1.4654654654654656e-05, |
| "loss": 0.1656, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14411409199237823, |
| "step": 245, |
| "valid_targets_mean": 2462.1, |
| "valid_targets_min": 629 |
| }, |
| { |
| "epoch": 0.2628811777076761, |
| "grad_norm": 0.7664938237469207, |
| "learning_rate": 1.4954954954954957e-05, |
| "loss": 0.1965, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16011649370193481, |
| "step": 250, |
| "valid_targets_mean": 3909.5, |
| "valid_targets_min": 2393 |
| }, |
| { |
| "epoch": 0.26813880126182965, |
| "grad_norm": 0.5666382634469955, |
| "learning_rate": 1.5255255255255257e-05, |
| "loss": 0.1764, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1639004945755005, |
| "step": 255, |
| "valid_targets_mean": 3106.2, |
| "valid_targets_min": 804 |
| }, |
| { |
| "epoch": 0.2733964248159832, |
| "grad_norm": 0.5100146697881532, |
| "learning_rate": 1.555555555555556e-05, |
| "loss": 0.1544, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1806904375553131, |
| "step": 260, |
| "valid_targets_mean": 4407.3, |
| "valid_targets_min": 1549 |
| }, |
| { |
| "epoch": 0.2786540483701367, |
| "grad_norm": 0.6549359808173243, |
| "learning_rate": 1.5855855855855858e-05, |
| "loss": 0.1447, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16388942301273346, |
| "step": 265, |
| "valid_targets_mean": 2631.7, |
| "valid_targets_min": 596 |
| }, |
| { |
| "epoch": 0.28391167192429023, |
| "grad_norm": 0.41343843926240126, |
| "learning_rate": 1.6156156156156157e-05, |
| "loss": 0.1381, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11629683524370193, |
| "step": 270, |
| "valid_targets_mean": 4891.2, |
| "valid_targets_min": 3804 |
| }, |
| { |
| "epoch": 0.2891692954784437, |
| "grad_norm": 0.517092960334539, |
| "learning_rate": 1.6456456456456457e-05, |
| "loss": 0.1498, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13476485013961792, |
| "step": 275, |
| "valid_targets_mean": 3792.2, |
| "valid_targets_min": 1864 |
| }, |
| { |
| "epoch": 0.29442691903259727, |
| "grad_norm": 0.8171353088666584, |
| "learning_rate": 1.6756756756756757e-05, |
| "loss": 0.1818, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21420735120773315, |
| "step": 280, |
| "valid_targets_mean": 1649.4, |
| "valid_targets_min": 203 |
| }, |
| { |
| "epoch": 0.2996845425867508, |
| "grad_norm": 0.5200131595604154, |
| "learning_rate": 1.705705705705706e-05, |
| "loss": 0.1529, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15774023532867432, |
| "step": 285, |
| "valid_targets_mean": 3947.8, |
| "valid_targets_min": 2443 |
| }, |
| { |
| "epoch": 0.3049421661409043, |
| "grad_norm": 0.9237428764634195, |
| "learning_rate": 1.735735735735736e-05, |
| "loss": 0.1723, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16387858986854553, |
| "step": 290, |
| "valid_targets_mean": 1698.5, |
| "valid_targets_min": 716 |
| }, |
| { |
| "epoch": 0.31019978969505785, |
| "grad_norm": 0.48580301438597634, |
| "learning_rate": 1.765765765765766e-05, |
| "loss": 0.1261, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1362724006175995, |
| "step": 295, |
| "valid_targets_mean": 3700.4, |
| "valid_targets_min": 905 |
| }, |
| { |
| "epoch": 0.31545741324921134, |
| "grad_norm": 0.6212209825059118, |
| "learning_rate": 1.795795795795796e-05, |
| "loss": 0.163, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1739799827337265, |
| "step": 300, |
| "valid_targets_mean": 2566.2, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 0.3207150368033649, |
| "grad_norm": 0.4722131229404295, |
| "learning_rate": 1.8258258258258258e-05, |
| "loss": 0.154, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1354328691959381, |
| "step": 305, |
| "valid_targets_mean": 3215.8, |
| "valid_targets_min": 1584 |
| }, |
| { |
| "epoch": 0.32597266035751843, |
| "grad_norm": 0.676458950103952, |
| "learning_rate": 1.855855855855856e-05, |
| "loss": 0.1354, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1757308542728424, |
| "step": 310, |
| "valid_targets_mean": 2246.6, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 0.3312302839116719, |
| "grad_norm": 0.6483673696109898, |
| "learning_rate": 1.885885885885886e-05, |
| "loss": 0.1573, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16886213421821594, |
| "step": 315, |
| "valid_targets_mean": 2176.4, |
| "valid_targets_min": 560 |
| }, |
| { |
| "epoch": 0.33648790746582546, |
| "grad_norm": 0.6511956803543409, |
| "learning_rate": 1.915915915915916e-05, |
| "loss": 0.1598, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17488718032836914, |
| "step": 320, |
| "valid_targets_mean": 2364.9, |
| "valid_targets_min": 613 |
| }, |
| { |
| "epoch": 0.34174553101997895, |
| "grad_norm": 0.5243288842852669, |
| "learning_rate": 1.9459459459459463e-05, |
| "loss": 0.1789, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1510639786720276, |
| "step": 325, |
| "valid_targets_mean": 3067.3, |
| "valid_targets_min": 958 |
| }, |
| { |
| "epoch": 0.3470031545741325, |
| "grad_norm": 0.5830771667606569, |
| "learning_rate": 1.9759759759759763e-05, |
| "loss": 0.1491, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14484402537345886, |
| "step": 330, |
| "valid_targets_mean": 2553.5, |
| "valid_targets_min": 719 |
| }, |
| { |
| "epoch": 0.352260778128286, |
| "grad_norm": 0.6145252909675246, |
| "learning_rate": 2.0060060060060062e-05, |
| "loss": 0.1804, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15925168991088867, |
| "step": 335, |
| "valid_targets_mean": 2510.1, |
| "valid_targets_min": 759 |
| }, |
| { |
| "epoch": 0.35751840168243953, |
| "grad_norm": 1.033866405002161, |
| "learning_rate": 2.0360360360360362e-05, |
| "loss": 0.1775, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26241564750671387, |
| "step": 340, |
| "valid_targets_mean": 1322.8, |
| "valid_targets_min": 521 |
| }, |
| { |
| "epoch": 0.3627760252365931, |
| "grad_norm": 0.5582010823369247, |
| "learning_rate": 2.066066066066066e-05, |
| "loss": 0.1464, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17004817724227905, |
| "step": 345, |
| "valid_targets_mean": 3135.9, |
| "valid_targets_min": 729 |
| }, |
| { |
| "epoch": 0.36803364879074657, |
| "grad_norm": 0.4264448065906292, |
| "learning_rate": 2.0960960960960964e-05, |
| "loss": 0.1265, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10428524017333984, |
| "step": 350, |
| "valid_targets_mean": 3760.6, |
| "valid_targets_min": 2741 |
| }, |
| { |
| "epoch": 0.3732912723449001, |
| "grad_norm": 0.5123778205391243, |
| "learning_rate": 2.1261261261261264e-05, |
| "loss": 0.1449, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1200961023569107, |
| "step": 355, |
| "valid_targets_mean": 2938.2, |
| "valid_targets_min": 927 |
| }, |
| { |
| "epoch": 0.3785488958990536, |
| "grad_norm": 0.529408020442376, |
| "learning_rate": 2.1561561561561564e-05, |
| "loss": 0.1884, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14463025331497192, |
| "step": 360, |
| "valid_targets_mean": 2925.2, |
| "valid_targets_min": 935 |
| }, |
| { |
| "epoch": 0.38380651945320715, |
| "grad_norm": 0.5201812008039938, |
| "learning_rate": 2.1861861861861863e-05, |
| "loss": 0.1225, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10529932379722595, |
| "step": 365, |
| "valid_targets_mean": 2759.2, |
| "valid_targets_min": 647 |
| }, |
| { |
| "epoch": 0.3890641430073607, |
| "grad_norm": 0.4719633496936481, |
| "learning_rate": 2.2162162162162163e-05, |
| "loss": 0.1444, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12036021053791046, |
| "step": 370, |
| "valid_targets_mean": 5071.6, |
| "valid_targets_min": 976 |
| }, |
| { |
| "epoch": 0.3943217665615142, |
| "grad_norm": 0.43189437970159716, |
| "learning_rate": 2.2462462462462466e-05, |
| "loss": 0.1378, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11983726918697357, |
| "step": 375, |
| "valid_targets_mean": 4252.0, |
| "valid_targets_min": 484 |
| }, |
| { |
| "epoch": 0.39957939011566773, |
| "grad_norm": 0.42465160695991117, |
| "learning_rate": 2.2762762762762765e-05, |
| "loss": 0.1201, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10434293746948242, |
| "step": 380, |
| "valid_targets_mean": 4528.9, |
| "valid_targets_min": 949 |
| }, |
| { |
| "epoch": 0.4048370136698212, |
| "grad_norm": 0.5578623891699924, |
| "learning_rate": 2.3063063063063065e-05, |
| "loss": 0.1526, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18567083775997162, |
| "step": 385, |
| "valid_targets_mean": 4286.2, |
| "valid_targets_min": 2724 |
| }, |
| { |
| "epoch": 0.41009463722397477, |
| "grad_norm": 0.4410268826291089, |
| "learning_rate": 2.3363363363363364e-05, |
| "loss": 0.1287, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11271372437477112, |
| "step": 390, |
| "valid_targets_mean": 3200.5, |
| "valid_targets_min": 424 |
| }, |
| { |
| "epoch": 0.4153522607781283, |
| "grad_norm": 0.5408190289850457, |
| "learning_rate": 2.3663663663663664e-05, |
| "loss": 0.1731, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13595326244831085, |
| "step": 395, |
| "valid_targets_mean": 2660.9, |
| "valid_targets_min": 531 |
| }, |
| { |
| "epoch": 0.4206098843322818, |
| "grad_norm": 0.5591662105253836, |
| "learning_rate": 2.3963963963963967e-05, |
| "loss": 0.1625, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11370278894901276, |
| "step": 400, |
| "valid_targets_mean": 2755.6, |
| "valid_targets_min": 616 |
| }, |
| { |
| "epoch": 0.42586750788643535, |
| "grad_norm": 0.4604795245230451, |
| "learning_rate": 2.4264264264264267e-05, |
| "loss": 0.1234, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1495322585105896, |
| "step": 405, |
| "valid_targets_mean": 2762.3, |
| "valid_targets_min": 602 |
| }, |
| { |
| "epoch": 0.43112513144058884, |
| "grad_norm": 0.42440232585948356, |
| "learning_rate": 2.4564564564564566e-05, |
| "loss": 0.1658, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1368899792432785, |
| "step": 410, |
| "valid_targets_mean": 3793.9, |
| "valid_targets_min": 1251 |
| }, |
| { |
| "epoch": 0.4363827549947424, |
| "grad_norm": 0.5979040069002124, |
| "learning_rate": 2.4864864864864866e-05, |
| "loss": 0.1363, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12938565015792847, |
| "step": 415, |
| "valid_targets_mean": 2517.1, |
| "valid_targets_min": 596 |
| }, |
| { |
| "epoch": 0.4416403785488959, |
| "grad_norm": 0.8524591312483077, |
| "learning_rate": 2.5165165165165165e-05, |
| "loss": 0.1598, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17469751834869385, |
| "step": 420, |
| "valid_targets_mean": 1704.4, |
| "valid_targets_min": 595 |
| }, |
| { |
| "epoch": 0.4468980021030494, |
| "grad_norm": 0.8068963566475884, |
| "learning_rate": 2.5465465465465465e-05, |
| "loss": 0.1738, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.205302432179451, |
| "step": 425, |
| "valid_targets_mean": 1854.3, |
| "valid_targets_min": 520 |
| }, |
| { |
| "epoch": 0.45215562565720296, |
| "grad_norm": 0.5383440464588352, |
| "learning_rate": 2.5765765765765768e-05, |
| "loss": 0.1863, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14100906252861023, |
| "step": 430, |
| "valid_targets_mean": 2596.6, |
| "valid_targets_min": 593 |
| }, |
| { |
| "epoch": 0.45741324921135645, |
| "grad_norm": 0.43574834548646346, |
| "learning_rate": 2.6066066066066067e-05, |
| "loss": 0.1459, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10070942342281342, |
| "step": 435, |
| "valid_targets_mean": 3657.7, |
| "valid_targets_min": 647 |
| }, |
| { |
| "epoch": 0.46267087276551, |
| "grad_norm": 0.5115290584023389, |
| "learning_rate": 2.6366366366366367e-05, |
| "loss": 0.153, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13975085318088531, |
| "step": 440, |
| "valid_targets_mean": 2984.0, |
| "valid_targets_min": 676 |
| }, |
| { |
| "epoch": 0.4679284963196635, |
| "grad_norm": 0.5795352827916006, |
| "learning_rate": 2.6666666666666667e-05, |
| "loss": 0.1379, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14506489038467407, |
| "step": 445, |
| "valid_targets_mean": 2498.0, |
| "valid_targets_min": 616 |
| }, |
| { |
| "epoch": 0.47318611987381703, |
| "grad_norm": 0.535282041546169, |
| "learning_rate": 2.6966966966966966e-05, |
| "loss": 0.1375, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1347915083169937, |
| "step": 450, |
| "valid_targets_mean": 2706.7, |
| "valid_targets_min": 541 |
| }, |
| { |
| "epoch": 0.4784437434279706, |
| "grad_norm": 1.0578338493024237, |
| "learning_rate": 2.726726726726727e-05, |
| "loss": 0.1327, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18900179862976074, |
| "step": 455, |
| "valid_targets_mean": 1267.9, |
| "valid_targets_min": 598 |
| }, |
| { |
| "epoch": 0.48370136698212407, |
| "grad_norm": 0.4958868865551675, |
| "learning_rate": 2.756756756756757e-05, |
| "loss": 0.1613, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12313523888587952, |
| "step": 460, |
| "valid_targets_mean": 3047.2, |
| "valid_targets_min": 756 |
| }, |
| { |
| "epoch": 0.4889589905362776, |
| "grad_norm": 0.5741914975359229, |
| "learning_rate": 2.786786786786787e-05, |
| "loss": 0.1245, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1458258330821991, |
| "step": 465, |
| "valid_targets_mean": 2821.1, |
| "valid_targets_min": 680 |
| }, |
| { |
| "epoch": 0.4942166140904311, |
| "grad_norm": 0.5024374122755627, |
| "learning_rate": 2.8168168168168168e-05, |
| "loss": 0.1334, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13367310166358948, |
| "step": 470, |
| "valid_targets_mean": 3039.8, |
| "valid_targets_min": 774 |
| }, |
| { |
| "epoch": 0.49947423764458465, |
| "grad_norm": 0.4910835346264678, |
| "learning_rate": 2.8468468468468467e-05, |
| "loss": 0.1531, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15631186962127686, |
| "step": 475, |
| "valid_targets_mean": 4018.3, |
| "valid_targets_min": 1474 |
| }, |
| { |
| "epoch": 0.5047318611987381, |
| "grad_norm": 0.31397244645960626, |
| "learning_rate": 2.8768768768768774e-05, |
| "loss": 0.1183, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08619725704193115, |
| "step": 480, |
| "valid_targets_mean": 5695.4, |
| "valid_targets_min": 3677 |
| }, |
| { |
| "epoch": 0.5099894847528917, |
| "grad_norm": 0.4753384585551911, |
| "learning_rate": 2.9069069069069073e-05, |
| "loss": 0.1324, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1378968358039856, |
| "step": 485, |
| "valid_targets_mean": 2872.4, |
| "valid_targets_min": 675 |
| }, |
| { |
| "epoch": 0.5152471083070452, |
| "grad_norm": 0.442429826767631, |
| "learning_rate": 2.9369369369369373e-05, |
| "loss": 0.1263, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12641605734825134, |
| "step": 490, |
| "valid_targets_mean": 3971.9, |
| "valid_targets_min": 795 |
| }, |
| { |
| "epoch": 0.5205047318611987, |
| "grad_norm": 0.6197224166860392, |
| "learning_rate": 2.9669669669669673e-05, |
| "loss": 0.2613, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28923261165618896, |
| "step": 495, |
| "valid_targets_mean": 2743.6, |
| "valid_targets_min": 605 |
| }, |
| { |
| "epoch": 0.5257623554153522, |
| "grad_norm": 0.5005822182169736, |
| "learning_rate": 2.9969969969969976e-05, |
| "loss": 0.1248, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11692014336585999, |
| "step": 500, |
| "valid_targets_mean": 3250.8, |
| "valid_targets_min": 941 |
| }, |
| { |
| "epoch": 0.5310199789695058, |
| "grad_norm": 0.5692151849390964, |
| "learning_rate": 3.0270270270270275e-05, |
| "loss": 0.1433, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12837675213813782, |
| "step": 505, |
| "valid_targets_mean": 2529.4, |
| "valid_targets_min": 773 |
| }, |
| { |
| "epoch": 0.5362776025236593, |
| "grad_norm": 0.7452492640467124, |
| "learning_rate": 3.0570570570570575e-05, |
| "loss": 0.167, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3063594698905945, |
| "step": 510, |
| "valid_targets_mean": 2282.3, |
| "valid_targets_min": 955 |
| }, |
| { |
| "epoch": 0.5415352260778128, |
| "grad_norm": 1.1155547682634184, |
| "learning_rate": 3.0870870870870874e-05, |
| "loss": 0.3438, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3546082377433777, |
| "step": 515, |
| "valid_targets_mean": 1554.4, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 0.5467928496319664, |
| "grad_norm": 1.0015826508178154, |
| "learning_rate": 3.1171171171171174e-05, |
| "loss": 0.3411, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3243759274482727, |
| "step": 520, |
| "valid_targets_mean": 1621.1, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 0.5520504731861199, |
| "grad_norm": 1.1529949317365271, |
| "learning_rate": 3.1471471471471473e-05, |
| "loss": 0.3199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32804620265960693, |
| "step": 525, |
| "valid_targets_mean": 1469.3, |
| "valid_targets_min": 714 |
| }, |
| { |
| "epoch": 0.5573080967402734, |
| "grad_norm": 0.9940115017954813, |
| "learning_rate": 3.177177177177177e-05, |
| "loss": 0.3061, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3047122061252594, |
| "step": 530, |
| "valid_targets_mean": 1483.8, |
| "valid_targets_min": 615 |
| }, |
| { |
| "epoch": 0.562565720294427, |
| "grad_norm": 1.0873576094630497, |
| "learning_rate": 3.207207207207207e-05, |
| "loss": 0.2987, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2896285653114319, |
| "step": 535, |
| "valid_targets_mean": 1436.4, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 0.5678233438485805, |
| "grad_norm": 0.9365567375118371, |
| "learning_rate": 3.237237237237238e-05, |
| "loss": 0.2963, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3406223654747009, |
| "step": 540, |
| "valid_targets_mean": 1576.6, |
| "valid_targets_min": 625 |
| }, |
| { |
| "epoch": 0.573080967402734, |
| "grad_norm": 1.0027497886268528, |
| "learning_rate": 3.267267267267268e-05, |
| "loss": 0.2796, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2638475000858307, |
| "step": 545, |
| "valid_targets_mean": 1417.9, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 0.5783385909568874, |
| "grad_norm": 0.9205617077717022, |
| "learning_rate": 3.297297297297298e-05, |
| "loss": 0.2926, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37035784125328064, |
| "step": 550, |
| "valid_targets_mean": 1609.2, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 0.583596214511041, |
| "grad_norm": 1.1987835943809408, |
| "learning_rate": 3.327327327327328e-05, |
| "loss": 0.27, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29375773668289185, |
| "step": 555, |
| "valid_targets_mean": 1623.3, |
| "valid_targets_min": 733 |
| }, |
| { |
| "epoch": 0.5888538380651945, |
| "grad_norm": 0.9289468307227438, |
| "learning_rate": 3.357357357357358e-05, |
| "loss": 0.272, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27896010875701904, |
| "step": 560, |
| "valid_targets_mean": 1673.9, |
| "valid_targets_min": 835 |
| }, |
| { |
| "epoch": 0.594111461619348, |
| "grad_norm": 0.9413235218021161, |
| "learning_rate": 3.387387387387388e-05, |
| "loss": 0.2607, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27303457260131836, |
| "step": 565, |
| "valid_targets_mean": 1542.9, |
| "valid_targets_min": 815 |
| }, |
| { |
| "epoch": 0.5993690851735016, |
| "grad_norm": 0.9403245224254523, |
| "learning_rate": 3.4174174174174176e-05, |
| "loss": 0.2799, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2741079330444336, |
| "step": 570, |
| "valid_targets_mean": 1620.6, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 0.6046267087276551, |
| "grad_norm": 1.1276192338957716, |
| "learning_rate": 3.4474474474474476e-05, |
| "loss": 0.2603, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2553476393222809, |
| "step": 575, |
| "valid_targets_mean": 1417.6, |
| "valid_targets_min": 570 |
| }, |
| { |
| "epoch": 0.6098843322818086, |
| "grad_norm": 1.030235956437453, |
| "learning_rate": 3.4774774774774776e-05, |
| "loss": 0.2514, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25277331471443176, |
| "step": 580, |
| "valid_targets_mean": 1507.0, |
| "valid_targets_min": 548 |
| }, |
| { |
| "epoch": 0.6151419558359621, |
| "grad_norm": 1.0659589997175756, |
| "learning_rate": 3.5075075075075075e-05, |
| "loss": 0.2488, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2470894455909729, |
| "step": 585, |
| "valid_targets_mean": 1278.8, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 0.6203995793901157, |
| "grad_norm": 0.8904338477427017, |
| "learning_rate": 3.5375375375375375e-05, |
| "loss": 0.2702, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28884193301200867, |
| "step": 590, |
| "valid_targets_mean": 1824.2, |
| "valid_targets_min": 896 |
| }, |
| { |
| "epoch": 0.6256572029442692, |
| "grad_norm": 1.0006741773351804, |
| "learning_rate": 3.567567567567568e-05, |
| "loss": 0.2627, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.265505850315094, |
| "step": 595, |
| "valid_targets_mean": 1513.9, |
| "valid_targets_min": 597 |
| }, |
| { |
| "epoch": 0.6309148264984227, |
| "grad_norm": 0.9007620924231974, |
| "learning_rate": 3.597597597597598e-05, |
| "loss": 0.2673, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2536696791648865, |
| "step": 600, |
| "valid_targets_mean": 1559.0, |
| "valid_targets_min": 706 |
| }, |
| { |
| "epoch": 0.6361724500525763, |
| "grad_norm": 0.8810235190375725, |
| "learning_rate": 3.627627627627628e-05, |
| "loss": 0.258, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22736713290214539, |
| "step": 605, |
| "valid_targets_mean": 1439.2, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 0.6414300736067298, |
| "grad_norm": 1.030350433812722, |
| "learning_rate": 3.657657657657658e-05, |
| "loss": 0.2554, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23971164226531982, |
| "step": 610, |
| "valid_targets_mean": 1424.6, |
| "valid_targets_min": 785 |
| }, |
| { |
| "epoch": 0.6466876971608833, |
| "grad_norm": 0.88153437382438, |
| "learning_rate": 3.687687687687688e-05, |
| "loss": 0.2613, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25444358587265015, |
| "step": 615, |
| "valid_targets_mean": 1526.2, |
| "valid_targets_min": 617 |
| }, |
| { |
| "epoch": 0.6519453207150369, |
| "grad_norm": 1.2253186020583033, |
| "learning_rate": 3.717717717717718e-05, |
| "loss": 0.2676, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2786664068698883, |
| "step": 620, |
| "valid_targets_mean": 1218.8, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 0.6572029442691903, |
| "grad_norm": 0.8323936549391726, |
| "learning_rate": 3.747747747747748e-05, |
| "loss": 0.2497, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2497854083776474, |
| "step": 625, |
| "valid_targets_mean": 1642.6, |
| "valid_targets_min": 1184 |
| }, |
| { |
| "epoch": 0.6624605678233438, |
| "grad_norm": 0.9238273980255594, |
| "learning_rate": 3.777777777777778e-05, |
| "loss": 0.2457, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24019362032413483, |
| "step": 630, |
| "valid_targets_mean": 1437.6, |
| "valid_targets_min": 774 |
| }, |
| { |
| "epoch": 0.6677181913774973, |
| "grad_norm": 1.1441318370677376, |
| "learning_rate": 3.807807807807808e-05, |
| "loss": 0.2471, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2502342760562897, |
| "step": 635, |
| "valid_targets_mean": 1799.9, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 0.6729758149316509, |
| "grad_norm": 0.8916446370546462, |
| "learning_rate": 3.837837837837838e-05, |
| "loss": 0.2456, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24413703382015228, |
| "step": 640, |
| "valid_targets_mean": 1542.4, |
| "valid_targets_min": 1004 |
| }, |
| { |
| "epoch": 0.6782334384858044, |
| "grad_norm": 0.987486801984616, |
| "learning_rate": 3.8678678678678684e-05, |
| "loss": 0.2468, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.259332537651062, |
| "step": 645, |
| "valid_targets_mean": 1532.9, |
| "valid_targets_min": 803 |
| }, |
| { |
| "epoch": 0.6834910620399579, |
| "grad_norm": 0.8960451517622989, |
| "learning_rate": 3.897897897897898e-05, |
| "loss": 0.2519, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22896456718444824, |
| "step": 650, |
| "valid_targets_mean": 1341.6, |
| "valid_targets_min": 782 |
| }, |
| { |
| "epoch": 0.6887486855941115, |
| "grad_norm": 0.8264223810575569, |
| "learning_rate": 3.927927927927928e-05, |
| "loss": 0.2388, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23387616872787476, |
| "step": 655, |
| "valid_targets_mean": 1656.5, |
| "valid_targets_min": 646 |
| }, |
| { |
| "epoch": 0.694006309148265, |
| "grad_norm": 0.9415724536228907, |
| "learning_rate": 3.957957957957958e-05, |
| "loss": 0.2535, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2822714149951935, |
| "step": 660, |
| "valid_targets_mean": 1465.2, |
| "valid_targets_min": 591 |
| }, |
| { |
| "epoch": 0.6992639327024185, |
| "grad_norm": 0.8234914818457443, |
| "learning_rate": 3.987987987987988e-05, |
| "loss": 0.2472, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28059113025665283, |
| "step": 665, |
| "valid_targets_mean": 1781.1, |
| "valid_targets_min": 796 |
| }, |
| { |
| "epoch": 0.704521556256572, |
| "grad_norm": 0.9133249095800229, |
| "learning_rate": 3.9999975251805184e-05, |
| "loss": 0.2418, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23322954773902893, |
| "step": 670, |
| "valid_targets_mean": 1453.8, |
| "valid_targets_min": 848 |
| }, |
| { |
| "epoch": 0.7097791798107256, |
| "grad_norm": 0.8958156100880204, |
| "learning_rate": 3.9999824013058675e-05, |
| "loss": 0.2381, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22876060009002686, |
| "step": 675, |
| "valid_targets_mean": 1281.6, |
| "valid_targets_min": 665 |
| }, |
| { |
| "epoch": 0.7150368033648791, |
| "grad_norm": 0.8046905965772344, |
| "learning_rate": 3.99995352856012e-05, |
| "loss": 0.2323, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21532827615737915, |
| "step": 680, |
| "valid_targets_mean": 1267.4, |
| "valid_targets_min": 640 |
| }, |
| { |
| "epoch": 0.7202944269190326, |
| "grad_norm": 0.8694228235082393, |
| "learning_rate": 3.999910907141761e-05, |
| "loss": 0.2382, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2755237817764282, |
| "step": 685, |
| "valid_targets_mean": 1699.9, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 0.7255520504731862, |
| "grad_norm": 0.8794612331979875, |
| "learning_rate": 3.9998545373437924e-05, |
| "loss": 0.2403, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23151585459709167, |
| "step": 690, |
| "valid_targets_mean": 1296.8, |
| "valid_targets_min": 724 |
| }, |
| { |
| "epoch": 0.7308096740273397, |
| "grad_norm": 0.9220348914067749, |
| "learning_rate": 3.999784419553728e-05, |
| "loss": 0.2362, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24824225902557373, |
| "step": 695, |
| "valid_targets_mean": 1328.3, |
| "valid_targets_min": 924 |
| }, |
| { |
| "epoch": 0.7360672975814931, |
| "grad_norm": 0.8634984464960579, |
| "learning_rate": 3.9997005542535916e-05, |
| "loss": 0.2416, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2388066053390503, |
| "step": 700, |
| "valid_targets_mean": 1520.8, |
| "valid_targets_min": 773 |
| }, |
| { |
| "epoch": 0.7413249211356467, |
| "grad_norm": 0.8872199936407936, |
| "learning_rate": 3.9996029420199154e-05, |
| "loss": 0.2386, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24773404002189636, |
| "step": 705, |
| "valid_targets_mean": 1378.1, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 0.7465825446898002, |
| "grad_norm": 0.8919945040136225, |
| "learning_rate": 3.9994915835237336e-05, |
| "loss": 0.2444, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21771392226219177, |
| "step": 710, |
| "valid_targets_mean": 1174.9, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 0.7518401682439537, |
| "grad_norm": 0.7738287161591382, |
| "learning_rate": 3.999366479530581e-05, |
| "loss": 0.2328, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24148443341255188, |
| "step": 715, |
| "valid_targets_mean": 1885.7, |
| "valid_targets_min": 634 |
| }, |
| { |
| "epoch": 0.7570977917981072, |
| "grad_norm": 0.8529840466513452, |
| "learning_rate": 3.999227630900483e-05, |
| "loss": 0.2525, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2623804211616516, |
| "step": 720, |
| "valid_targets_mean": 1791.7, |
| "valid_targets_min": 573 |
| }, |
| { |
| "epoch": 0.7623554153522608, |
| "grad_norm": 0.754411162708553, |
| "learning_rate": 3.9990750385879554e-05, |
| "loss": 0.2417, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2579789161682129, |
| "step": 725, |
| "valid_targets_mean": 1866.8, |
| "valid_targets_min": 718 |
| }, |
| { |
| "epoch": 0.7676130389064143, |
| "grad_norm": 0.8190451822600759, |
| "learning_rate": 3.998908703641993e-05, |
| "loss": 0.2476, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21567176282405853, |
| "step": 730, |
| "valid_targets_mean": 1395.6, |
| "valid_targets_min": 841 |
| }, |
| { |
| "epoch": 0.7728706624605678, |
| "grad_norm": 0.8610185224444891, |
| "learning_rate": 3.9987286272060644e-05, |
| "loss": 0.2344, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2319350242614746, |
| "step": 735, |
| "valid_targets_mean": 1506.6, |
| "valid_targets_min": 956 |
| }, |
| { |
| "epoch": 0.7781282860147214, |
| "grad_norm": 0.8429412123334002, |
| "learning_rate": 3.998534810518104e-05, |
| "loss": 0.2412, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23787598311901093, |
| "step": 740, |
| "valid_targets_mean": 1253.3, |
| "valid_targets_min": 650 |
| }, |
| { |
| "epoch": 0.7833859095688749, |
| "grad_norm": 0.7815746871106487, |
| "learning_rate": 3.998327254910504e-05, |
| "loss": 0.2403, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2415323704481125, |
| "step": 745, |
| "valid_targets_mean": 1461.0, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 0.7886435331230284, |
| "grad_norm": 0.8842126818291156, |
| "learning_rate": 3.998105961810105e-05, |
| "loss": 0.2237, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2263525277376175, |
| "step": 750, |
| "valid_targets_mean": 1344.5, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 0.7939011566771819, |
| "grad_norm": 0.8258316717257442, |
| "learning_rate": 3.997870932738187e-05, |
| "loss": 0.2299, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22840547561645508, |
| "step": 755, |
| "valid_targets_mean": 1378.5, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 0.7991587802313355, |
| "grad_norm": 0.9213686069053844, |
| "learning_rate": 3.997622169310454e-05, |
| "loss": 0.2371, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23663252592086792, |
| "step": 760, |
| "valid_targets_mean": 1498.6, |
| "valid_targets_min": 726 |
| }, |
| { |
| "epoch": 0.804416403785489, |
| "grad_norm": 0.7573585855870535, |
| "learning_rate": 3.9973596732370296e-05, |
| "loss": 0.2419, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2578279376029968, |
| "step": 765, |
| "valid_targets_mean": 1692.6, |
| "valid_targets_min": 669 |
| }, |
| { |
| "epoch": 0.8096740273396424, |
| "grad_norm": 0.7732889038728027, |
| "learning_rate": 3.997083446322443e-05, |
| "loss": 0.2314, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22062617540359497, |
| "step": 770, |
| "valid_targets_mean": 1561.1, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 0.814931650893796, |
| "grad_norm": 0.7286375748351296, |
| "learning_rate": 3.9967934904656145e-05, |
| "loss": 0.2313, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23089280724525452, |
| "step": 775, |
| "valid_targets_mean": 1549.7, |
| "valid_targets_min": 736 |
| }, |
| { |
| "epoch": 0.8201892744479495, |
| "grad_norm": 0.8487799558187092, |
| "learning_rate": 3.9964898076598445e-05, |
| "loss": 0.2366, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2550632357597351, |
| "step": 780, |
| "valid_targets_mean": 1574.6, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 0.825446898002103, |
| "grad_norm": 0.7846483409243643, |
| "learning_rate": 3.996172399992799e-05, |
| "loss": 0.2305, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2323245406150818, |
| "step": 785, |
| "valid_targets_mean": 1547.6, |
| "valid_targets_min": 753 |
| }, |
| { |
| "epoch": 0.8307045215562566, |
| "grad_norm": 0.8227142553349275, |
| "learning_rate": 3.995841269646496e-05, |
| "loss": 0.2269, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23940199613571167, |
| "step": 790, |
| "valid_targets_mean": 1558.7, |
| "valid_targets_min": 809 |
| }, |
| { |
| "epoch": 0.8359621451104101, |
| "grad_norm": 1.076487465858157, |
| "learning_rate": 3.995496418897291e-05, |
| "loss": 0.229, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20003387331962585, |
| "step": 795, |
| "valid_targets_mean": 1292.3, |
| "valid_targets_min": 698 |
| }, |
| { |
| "epoch": 0.8412197686645636, |
| "grad_norm": 0.8062292803141021, |
| "learning_rate": 3.995137850115856e-05, |
| "loss": 0.2166, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2341722548007965, |
| "step": 800, |
| "valid_targets_mean": 1500.9, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 0.8464773922187171, |
| "grad_norm": 0.8231075534332739, |
| "learning_rate": 3.994765565767174e-05, |
| "loss": 0.2312, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2470659613609314, |
| "step": 805, |
| "valid_targets_mean": 1598.8, |
| "valid_targets_min": 733 |
| }, |
| { |
| "epoch": 0.8517350157728707, |
| "grad_norm": 0.7818547532568481, |
| "learning_rate": 3.9943795684105104e-05, |
| "loss": 0.2261, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22200843691825867, |
| "step": 810, |
| "valid_targets_mean": 1636.2, |
| "valid_targets_min": 907 |
| }, |
| { |
| "epoch": 0.8569926393270242, |
| "grad_norm": 0.8802044076837447, |
| "learning_rate": 3.993979860699403e-05, |
| "loss": 0.2224, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2520860731601715, |
| "step": 815, |
| "valid_targets_mean": 1564.9, |
| "valid_targets_min": 898 |
| }, |
| { |
| "epoch": 0.8622502628811777, |
| "grad_norm": 0.7794016295703586, |
| "learning_rate": 3.993566445381641e-05, |
| "loss": 0.2313, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23362603783607483, |
| "step": 820, |
| "valid_targets_mean": 1685.4, |
| "valid_targets_min": 1119 |
| }, |
| { |
| "epoch": 0.8675078864353313, |
| "grad_norm": 0.8437333752227186, |
| "learning_rate": 3.9931393252992454e-05, |
| "loss": 0.2305, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2498432844877243, |
| "step": 825, |
| "valid_targets_mean": 1480.4, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 0.8727655099894848, |
| "grad_norm": 1.0963638505692785, |
| "learning_rate": 3.992698503388453e-05, |
| "loss": 0.2273, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22518636286258698, |
| "step": 830, |
| "valid_targets_mean": 1457.9, |
| "valid_targets_min": 798 |
| }, |
| { |
| "epoch": 0.8780231335436383, |
| "grad_norm": 0.8885740371755646, |
| "learning_rate": 3.992243982679691e-05, |
| "loss": 0.2303, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2175990641117096, |
| "step": 835, |
| "valid_targets_mean": 1237.5, |
| "valid_targets_min": 589 |
| }, |
| { |
| "epoch": 0.8832807570977917, |
| "grad_norm": 0.8390904894557905, |
| "learning_rate": 3.991775766297562e-05, |
| "loss": 0.2263, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22461339831352234, |
| "step": 840, |
| "valid_targets_mean": 1234.1, |
| "valid_targets_min": 244 |
| }, |
| { |
| "epoch": 0.8885383806519453, |
| "grad_norm": 0.8314750046327473, |
| "learning_rate": 3.991293857460815e-05, |
| "loss": 0.2424, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24296626448631287, |
| "step": 845, |
| "valid_targets_mean": 1229.9, |
| "valid_targets_min": 641 |
| }, |
| { |
| "epoch": 0.8937960042060988, |
| "grad_norm": 0.8036043592550274, |
| "learning_rate": 3.9907982594823326e-05, |
| "loss": 0.2285, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21325144171714783, |
| "step": 850, |
| "valid_targets_mean": 1430.4, |
| "valid_targets_min": 585 |
| }, |
| { |
| "epoch": 0.8990536277602523, |
| "grad_norm": 0.755706251040133, |
| "learning_rate": 3.9902889757691e-05, |
| "loss": 0.2439, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24100413918495178, |
| "step": 855, |
| "valid_targets_mean": 1902.6, |
| "valid_targets_min": 1156 |
| }, |
| { |
| "epoch": 0.9043112513144059, |
| "grad_norm": 0.7365612894776412, |
| "learning_rate": 3.9897660098221866e-05, |
| "loss": 0.2279, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21114149689674377, |
| "step": 860, |
| "valid_targets_mean": 1476.2, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 0.9095688748685594, |
| "grad_norm": 0.8675624430726546, |
| "learning_rate": 3.98922936523672e-05, |
| "loss": 0.2339, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21119055151939392, |
| "step": 865, |
| "valid_targets_mean": 1440.7, |
| "valid_targets_min": 672 |
| }, |
| { |
| "epoch": 0.9148264984227129, |
| "grad_norm": 0.8390537419597028, |
| "learning_rate": 3.9886790457018604e-05, |
| "loss": 0.2269, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24388912320137024, |
| "step": 870, |
| "valid_targets_mean": 1651.1, |
| "valid_targets_min": 973 |
| }, |
| { |
| "epoch": 0.9200841219768665, |
| "grad_norm": 0.7941804400740873, |
| "learning_rate": 3.9881150550007776e-05, |
| "loss": 0.2268, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21932603418827057, |
| "step": 875, |
| "valid_targets_mean": 1404.6, |
| "valid_targets_min": 732 |
| }, |
| { |
| "epoch": 0.92534174553102, |
| "grad_norm": 0.783815056504219, |
| "learning_rate": 3.987537397010624e-05, |
| "loss": 0.2345, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2181542068719864, |
| "step": 880, |
| "valid_targets_mean": 1414.5, |
| "valid_targets_min": 634 |
| }, |
| { |
| "epoch": 0.9305993690851735, |
| "grad_norm": 0.7479207862356614, |
| "learning_rate": 3.9869460757025064e-05, |
| "loss": 0.2238, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2406795173883438, |
| "step": 885, |
| "valid_targets_mean": 1663.4, |
| "valid_targets_min": 905 |
| }, |
| { |
| "epoch": 0.935856992639327, |
| "grad_norm": 0.7604101852877805, |
| "learning_rate": 3.9863410951414616e-05, |
| "loss": 0.2211, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2308855652809143, |
| "step": 890, |
| "valid_targets_mean": 1482.2, |
| "valid_targets_min": 596 |
| }, |
| { |
| "epoch": 0.9411146161934806, |
| "grad_norm": 0.852905188319462, |
| "learning_rate": 3.985722459486425e-05, |
| "loss": 0.2169, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2423647791147232, |
| "step": 895, |
| "valid_targets_mean": 1422.8, |
| "valid_targets_min": 687 |
| }, |
| { |
| "epoch": 0.9463722397476341, |
| "grad_norm": 0.7852445064066973, |
| "learning_rate": 3.985090172990206e-05, |
| "loss": 0.2361, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22678713500499725, |
| "step": 900, |
| "valid_targets_mean": 1684.7, |
| "valid_targets_min": 567 |
| }, |
| { |
| "epoch": 0.9516298633017876, |
| "grad_norm": 0.7081748321424154, |
| "learning_rate": 3.984444239999455e-05, |
| "loss": 0.2205, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21190844476222992, |
| "step": 905, |
| "valid_targets_mean": 1780.8, |
| "valid_targets_min": 810 |
| }, |
| { |
| "epoch": 0.9568874868559412, |
| "grad_norm": 0.7499834026647575, |
| "learning_rate": 3.9837846649546354e-05, |
| "loss": 0.2181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23362717032432556, |
| "step": 910, |
| "valid_targets_mean": 1872.5, |
| "valid_targets_min": 1047 |
| }, |
| { |
| "epoch": 0.9621451104100947, |
| "grad_norm": 0.7736636980606054, |
| "learning_rate": 3.9831114523899945e-05, |
| "loss": 0.2134, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22128413617610931, |
| "step": 915, |
| "valid_targets_mean": 1659.1, |
| "valid_targets_min": 829 |
| }, |
| { |
| "epoch": 0.9674027339642481, |
| "grad_norm": 0.7354159562943822, |
| "learning_rate": 3.982424606933529e-05, |
| "loss": 0.2098, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22994014620780945, |
| "step": 920, |
| "valid_targets_mean": 1739.2, |
| "valid_targets_min": 1141 |
| }, |
| { |
| "epoch": 0.9726603575184016, |
| "grad_norm": 0.8130210891528385, |
| "learning_rate": 3.981724133306954e-05, |
| "loss": 0.2229, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22318342328071594, |
| "step": 925, |
| "valid_targets_mean": 1412.8, |
| "valid_targets_min": 935 |
| }, |
| { |
| "epoch": 0.9779179810725552, |
| "grad_norm": 0.807124950997584, |
| "learning_rate": 3.981010036325674e-05, |
| "loss": 0.2247, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24344861507415771, |
| "step": 930, |
| "valid_targets_mean": 1618.1, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 0.9831756046267087, |
| "grad_norm": 0.8729906575725193, |
| "learning_rate": 3.980282320898746e-05, |
| "loss": 0.2224, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20901045203208923, |
| "step": 935, |
| "valid_targets_mean": 1520.9, |
| "valid_targets_min": 847 |
| }, |
| { |
| "epoch": 0.9884332281808622, |
| "grad_norm": 0.9382395488059447, |
| "learning_rate": 3.9795409920288456e-05, |
| "loss": 0.224, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21550670266151428, |
| "step": 940, |
| "valid_targets_mean": 1646.8, |
| "valid_targets_min": 738 |
| }, |
| { |
| "epoch": 0.9936908517350158, |
| "grad_norm": 0.8207956171745925, |
| "learning_rate": 3.978786054812236e-05, |
| "loss": 0.2286, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2383539378643036, |
| "step": 945, |
| "valid_targets_mean": 1528.8, |
| "valid_targets_min": 594 |
| }, |
| { |
| "epoch": 0.9989484752891693, |
| "grad_norm": 0.7897974603329635, |
| "learning_rate": 3.9780175144387304e-05, |
| "loss": 0.2299, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22173242270946503, |
| "step": 950, |
| "valid_targets_mean": 1938.9, |
| "valid_targets_min": 918 |
| }, |
| { |
| "epoch": 1.0042060988433228, |
| "grad_norm": 0.6968326191051749, |
| "learning_rate": 3.977235376191656e-05, |
| "loss": 0.1969, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15473145246505737, |
| "step": 955, |
| "valid_targets_mean": 2562.4, |
| "valid_targets_min": 543 |
| }, |
| { |
| "epoch": 1.0094637223974763, |
| "grad_norm": 0.4252356509832368, |
| "learning_rate": 3.9764396454478195e-05, |
| "loss": 0.1502, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1259298324584961, |
| "step": 960, |
| "valid_targets_mean": 3733.2, |
| "valid_targets_min": 2731 |
| }, |
| { |
| "epoch": 1.0147213459516298, |
| "grad_norm": 0.43162305543008495, |
| "learning_rate": 3.975630327677468e-05, |
| "loss": 0.1384, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1122618317604065, |
| "step": 965, |
| "valid_targets_mean": 3446.4, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 1.0199789695057835, |
| "grad_norm": 0.4375741275858772, |
| "learning_rate": 3.974807428444254e-05, |
| "loss": 0.1526, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15583333373069763, |
| "step": 970, |
| "valid_targets_mean": 3481.1, |
| "valid_targets_min": 1095 |
| }, |
| { |
| "epoch": 1.025236593059937, |
| "grad_norm": 0.5038838276022358, |
| "learning_rate": 3.973970953405195e-05, |
| "loss": 0.1278, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15186336636543274, |
| "step": 975, |
| "valid_targets_mean": 2304.1, |
| "valid_targets_min": 560 |
| }, |
| { |
| "epoch": 1.0304942166140905, |
| "grad_norm": 0.41244675764624933, |
| "learning_rate": 3.9731209083106354e-05, |
| "loss": 0.137, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14149606227874756, |
| "step": 980, |
| "valid_targets_mean": 2921.5, |
| "valid_targets_min": 806 |
| }, |
| { |
| "epoch": 1.035751840168244, |
| "grad_norm": 0.7896595898616114, |
| "learning_rate": 3.972257299004206e-05, |
| "loss": 0.2152, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23016992211341858, |
| "step": 985, |
| "valid_targets_mean": 1657.2, |
| "valid_targets_min": 650 |
| }, |
| { |
| "epoch": 1.0410094637223974, |
| "grad_norm": 0.4379386114003751, |
| "learning_rate": 3.9713801314227867e-05, |
| "loss": 0.1308, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.131107896566391, |
| "step": 990, |
| "valid_targets_mean": 3432.3, |
| "valid_targets_min": 1037 |
| }, |
| { |
| "epoch": 1.046267087276551, |
| "grad_norm": 0.6675675390593576, |
| "learning_rate": 3.9704894115964615e-05, |
| "loss": 0.1641, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21469852328300476, |
| "step": 995, |
| "valid_targets_mean": 2068.1, |
| "valid_targets_min": 859 |
| }, |
| { |
| "epoch": 1.0515247108307044, |
| "grad_norm": 0.3030110380328977, |
| "learning_rate": 3.9695851456484805e-05, |
| "loss": 0.1536, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08601504564285278, |
| "step": 1000, |
| "valid_targets_mean": 5273.1, |
| "valid_targets_min": 3285 |
| }, |
| { |
| "epoch": 1.0567823343848581, |
| "grad_norm": 0.38710105306333087, |
| "learning_rate": 3.968667339795218e-05, |
| "loss": 0.1239, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1301286816596985, |
| "step": 1005, |
| "valid_targets_mean": 3644.8, |
| "valid_targets_min": 502 |
| }, |
| { |
| "epoch": 1.0620399579390116, |
| "grad_norm": 0.4963907169584106, |
| "learning_rate": 3.9677360003461246e-05, |
| "loss": 0.1296, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1354469358921051, |
| "step": 1010, |
| "valid_targets_mean": 3477.0, |
| "valid_targets_min": 600 |
| }, |
| { |
| "epoch": 1.0672975814931651, |
| "grad_norm": 0.5283050591592504, |
| "learning_rate": 3.966791133703691e-05, |
| "loss": 0.1297, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13511860370635986, |
| "step": 1015, |
| "valid_targets_mean": 2120.4, |
| "valid_targets_min": 492 |
| }, |
| { |
| "epoch": 1.0725552050473186, |
| "grad_norm": 0.3351755168178175, |
| "learning_rate": 3.965832746363397e-05, |
| "loss": 0.1727, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0992107167840004, |
| "step": 1020, |
| "valid_targets_mean": 4264.1, |
| "valid_targets_min": 1961 |
| }, |
| { |
| "epoch": 1.077812828601472, |
| "grad_norm": 0.3772330213837117, |
| "learning_rate": 3.964860844913676e-05, |
| "loss": 0.1215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11703327298164368, |
| "step": 1025, |
| "valid_targets_mean": 3787.4, |
| "valid_targets_min": 1822 |
| }, |
| { |
| "epoch": 1.0830704521556256, |
| "grad_norm": 0.5147002269923598, |
| "learning_rate": 3.9638754360358585e-05, |
| "loss": 0.1418, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12644034624099731, |
| "step": 1030, |
| "valid_targets_mean": 2376.2, |
| "valid_targets_min": 644 |
| }, |
| { |
| "epoch": 1.088328075709779, |
| "grad_norm": 0.39865128582762477, |
| "learning_rate": 3.962876526504134e-05, |
| "loss": 0.1122, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11796826124191284, |
| "step": 1035, |
| "valid_targets_mean": 2907.6, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 1.0935856992639328, |
| "grad_norm": 0.783145494624693, |
| "learning_rate": 3.961864123185502e-05, |
| "loss": 0.141, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15101072192192078, |
| "step": 1040, |
| "valid_targets_mean": 1197.8, |
| "valid_targets_min": 515 |
| }, |
| { |
| "epoch": 1.0988433228180863, |
| "grad_norm": 0.43336387607524735, |
| "learning_rate": 3.9608382330397265e-05, |
| "loss": 0.1428, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11531385779380798, |
| "step": 1045, |
| "valid_targets_mean": 2553.1, |
| "valid_targets_min": 589 |
| }, |
| { |
| "epoch": 1.1041009463722398, |
| "grad_norm": 1.0193659758997566, |
| "learning_rate": 3.959798863119284e-05, |
| "loss": 0.151, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1563202440738678, |
| "step": 1050, |
| "valid_targets_mean": 3193.4, |
| "valid_targets_min": 1086 |
| }, |
| { |
| "epoch": 1.1093585699263933, |
| "grad_norm": 0.44696153444520886, |
| "learning_rate": 3.9587460205693194e-05, |
| "loss": 0.1494, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16717270016670227, |
| "step": 1055, |
| "valid_targets_mean": 3228.1, |
| "valid_targets_min": 1341 |
| }, |
| { |
| "epoch": 1.1146161934805467, |
| "grad_norm": 0.3961650580085898, |
| "learning_rate": 3.9576797126275945e-05, |
| "loss": 0.1896, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13076983392238617, |
| "step": 1060, |
| "valid_targets_mean": 3338.1, |
| "valid_targets_min": 714 |
| }, |
| { |
| "epoch": 1.1198738170347002, |
| "grad_norm": 0.396531277714411, |
| "learning_rate": 3.9565999466244384e-05, |
| "loss": 0.1207, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12670114636421204, |
| "step": 1065, |
| "valid_targets_mean": 3436.3, |
| "valid_targets_min": 669 |
| }, |
| { |
| "epoch": 1.125131440588854, |
| "grad_norm": 0.7436207015770959, |
| "learning_rate": 3.955506729982699e-05, |
| "loss": 0.1487, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18402673304080963, |
| "step": 1070, |
| "valid_targets_mean": 1240.5, |
| "valid_targets_min": 598 |
| }, |
| { |
| "epoch": 1.1303890641430074, |
| "grad_norm": 0.8668415342482751, |
| "learning_rate": 3.9544000702176896e-05, |
| "loss": 0.1747, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18990148603916168, |
| "step": 1075, |
| "valid_targets_mean": 1436.1, |
| "valid_targets_min": 323 |
| }, |
| { |
| "epoch": 1.135646687697161, |
| "grad_norm": 0.4050610243598935, |
| "learning_rate": 3.953279974937139e-05, |
| "loss": 0.1469, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13849858939647675, |
| "step": 1080, |
| "valid_targets_mean": 3868.8, |
| "valid_targets_min": 2827 |
| }, |
| { |
| "epoch": 1.1409043112513144, |
| "grad_norm": 0.49634725160950344, |
| "learning_rate": 3.9521464518411356e-05, |
| "loss": 0.2052, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2748745083808899, |
| "step": 1085, |
| "valid_targets_mean": 3063.6, |
| "valid_targets_min": 900 |
| }, |
| { |
| "epoch": 1.146161934805468, |
| "grad_norm": 0.41502298402516696, |
| "learning_rate": 3.950999508722082e-05, |
| "loss": 0.3039, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13370385766029358, |
| "step": 1090, |
| "valid_targets_mean": 3590.4, |
| "valid_targets_min": 1932 |
| }, |
| { |
| "epoch": 1.1514195583596214, |
| "grad_norm": 0.5952218585264138, |
| "learning_rate": 3.9498391534646325e-05, |
| "loss": 0.1531, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16572102904319763, |
| "step": 1095, |
| "valid_targets_mean": 2208.4, |
| "valid_targets_min": 820 |
| }, |
| { |
| "epoch": 1.1566771819137749, |
| "grad_norm": 0.5130697588962526, |
| "learning_rate": 3.948665394045646e-05, |
| "loss": 0.1504, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2032875418663025, |
| "step": 1100, |
| "valid_targets_mean": 2673.4, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 1.1619348054679284, |
| "grad_norm": 0.3366525734715256, |
| "learning_rate": 3.9474782385341255e-05, |
| "loss": 0.231, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11511224508285522, |
| "step": 1105, |
| "valid_targets_mean": 4382.8, |
| "valid_targets_min": 2258 |
| }, |
| { |
| "epoch": 1.167192429022082, |
| "grad_norm": 0.4901552037072492, |
| "learning_rate": 3.9462776950911684e-05, |
| "loss": 0.1211, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1944444626569748, |
| "step": 1110, |
| "valid_targets_mean": 3836.1, |
| "valid_targets_min": 1142 |
| }, |
| { |
| "epoch": 1.1724500525762356, |
| "grad_norm": 0.5179425744671011, |
| "learning_rate": 3.9450637719699046e-05, |
| "loss": 0.1339, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14342385530471802, |
| "step": 1115, |
| "valid_targets_mean": 3908.0, |
| "valid_targets_min": 513 |
| }, |
| { |
| "epoch": 1.177707676130389, |
| "grad_norm": 0.31996823896007986, |
| "learning_rate": 3.9438364775154436e-05, |
| "loss": 0.1349, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10580530762672424, |
| "step": 1120, |
| "valid_targets_mean": 3853.7, |
| "valid_targets_min": 1189 |
| }, |
| { |
| "epoch": 1.1829652996845426, |
| "grad_norm": 0.3363261621702768, |
| "learning_rate": 3.942595820164818e-05, |
| "loss": 0.1241, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11392706632614136, |
| "step": 1125, |
| "valid_targets_mean": 3941.4, |
| "valid_targets_min": 748 |
| }, |
| { |
| "epoch": 1.188222923238696, |
| "grad_norm": 0.40996340911609525, |
| "learning_rate": 3.94134180844692e-05, |
| "loss": 0.1207, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12967784702777863, |
| "step": 1130, |
| "valid_targets_mean": 3278.1, |
| "valid_targets_min": 886 |
| }, |
| { |
| "epoch": 1.1934805467928495, |
| "grad_norm": 0.48429205683115417, |
| "learning_rate": 3.940074450982449e-05, |
| "loss": 0.1279, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1487618237733841, |
| "step": 1135, |
| "valid_targets_mean": 2903.9, |
| "valid_targets_min": 1939 |
| }, |
| { |
| "epoch": 1.1987381703470033, |
| "grad_norm": 0.43375160194238566, |
| "learning_rate": 3.93879375648385e-05, |
| "loss": 0.1073, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11100872606039047, |
| "step": 1140, |
| "valid_targets_mean": 2530.4, |
| "valid_targets_min": 519 |
| }, |
| { |
| "epoch": 1.2039957939011567, |
| "grad_norm": 0.5507462662064243, |
| "learning_rate": 3.9374997337552496e-05, |
| "loss": 0.1898, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1793445348739624, |
| "step": 1145, |
| "valid_targets_mean": 2007.8, |
| "valid_targets_min": 645 |
| }, |
| { |
| "epoch": 1.2092534174553102, |
| "grad_norm": 0.4530191618046954, |
| "learning_rate": 3.936192391692404e-05, |
| "loss": 0.0998, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11263026297092438, |
| "step": 1150, |
| "valid_targets_mean": 2953.2, |
| "valid_targets_min": 472 |
| }, |
| { |
| "epoch": 1.2145110410094637, |
| "grad_norm": 0.4359977672738057, |
| "learning_rate": 3.9348717392826306e-05, |
| "loss": 0.117, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10660582780838013, |
| "step": 1155, |
| "valid_targets_mean": 2605.6, |
| "valid_targets_min": 616 |
| }, |
| { |
| "epoch": 1.2197686645636172, |
| "grad_norm": 0.32534861740203447, |
| "learning_rate": 3.933537785604748e-05, |
| "loss": 0.1093, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10801704227924347, |
| "step": 1160, |
| "valid_targets_mean": 4023.8, |
| "valid_targets_min": 2852 |
| }, |
| { |
| "epoch": 1.2250262881177707, |
| "grad_norm": 0.5024667960257416, |
| "learning_rate": 3.932190539829018e-05, |
| "loss": 0.1303, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19506166875362396, |
| "step": 1165, |
| "valid_targets_mean": 2697.2, |
| "valid_targets_min": 792 |
| }, |
| { |
| "epoch": 1.2302839116719242, |
| "grad_norm": 0.3775336673407538, |
| "learning_rate": 3.9308300112170735e-05, |
| "loss": 0.1643, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1055578887462616, |
| "step": 1170, |
| "valid_targets_mean": 3389.0, |
| "valid_targets_min": 729 |
| }, |
| { |
| "epoch": 1.235541535226078, |
| "grad_norm": 0.5420628024099352, |
| "learning_rate": 3.929456209121865e-05, |
| "loss": 0.1559, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15883982181549072, |
| "step": 1175, |
| "valid_targets_mean": 1641.5, |
| "valid_targets_min": 612 |
| }, |
| { |
| "epoch": 1.2407991587802314, |
| "grad_norm": 0.6679706246773904, |
| "learning_rate": 3.928069142987589e-05, |
| "loss": 0.1457, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19529536366462708, |
| "step": 1180, |
| "valid_targets_mean": 1712.1, |
| "valid_targets_min": 664 |
| }, |
| { |
| "epoch": 1.2460567823343849, |
| "grad_norm": 0.49701414835302343, |
| "learning_rate": 3.926668822349625e-05, |
| "loss": 0.1545, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16395148634910583, |
| "step": 1185, |
| "valid_targets_mean": 2137.5, |
| "valid_targets_min": 747 |
| }, |
| { |
| "epoch": 1.2513144058885384, |
| "grad_norm": 0.3729136584258894, |
| "learning_rate": 3.925255256834474e-05, |
| "loss": 0.1742, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11425455659627914, |
| "step": 1190, |
| "valid_targets_mean": 3752.8, |
| "valid_targets_min": 945 |
| }, |
| { |
| "epoch": 1.2565720294426919, |
| "grad_norm": 0.4087750023758472, |
| "learning_rate": 3.923828456159685e-05, |
| "loss": 0.1298, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12711559236049652, |
| "step": 1195, |
| "valid_targets_mean": 3276.1, |
| "valid_targets_min": 840 |
| }, |
| { |
| "epoch": 1.2618296529968454, |
| "grad_norm": 0.4626991304589331, |
| "learning_rate": 3.922388430133793e-05, |
| "loss": 0.1557, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13800734281539917, |
| "step": 1200, |
| "valid_targets_mean": 3255.8, |
| "valid_targets_min": 755 |
| }, |
| { |
| "epoch": 1.267087276550999, |
| "grad_norm": 0.49708542062636973, |
| "learning_rate": 3.9209351886562535e-05, |
| "loss": 0.1393, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13524243235588074, |
| "step": 1205, |
| "valid_targets_mean": 1867.9, |
| "valid_targets_min": 485 |
| }, |
| { |
| "epoch": 1.2723449001051526, |
| "grad_norm": 0.5369768536009524, |
| "learning_rate": 3.919468741717367e-05, |
| "loss": 0.1212, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13757452368736267, |
| "step": 1210, |
| "valid_targets_mean": 2776.2, |
| "valid_targets_min": 605 |
| }, |
| { |
| "epoch": 1.277602523659306, |
| "grad_norm": 0.299871924542344, |
| "learning_rate": 3.9179890993982186e-05, |
| "loss": 0.1165, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09392790496349335, |
| "step": 1215, |
| "valid_targets_mean": 4657.1, |
| "valid_targets_min": 848 |
| }, |
| { |
| "epoch": 1.2828601472134595, |
| "grad_norm": 0.4090001624099689, |
| "learning_rate": 3.916496271870603e-05, |
| "loss": 0.1176, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11056766659021378, |
| "step": 1220, |
| "valid_targets_mean": 2842.2, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 1.288117770767613, |
| "grad_norm": 0.37686181675990543, |
| "learning_rate": 3.914990269396957e-05, |
| "loss": 0.1158, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12508204579353333, |
| "step": 1225, |
| "valid_targets_mean": 3812.6, |
| "valid_targets_min": 905 |
| }, |
| { |
| "epoch": 1.2933753943217665, |
| "grad_norm": 0.4136496289786487, |
| "learning_rate": 3.913471102330288e-05, |
| "loss": 0.1329, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15721048414707184, |
| "step": 1230, |
| "valid_targets_mean": 2703.1, |
| "valid_targets_min": 808 |
| }, |
| { |
| "epoch": 1.29863301787592, |
| "grad_norm": 0.45042622214795064, |
| "learning_rate": 3.911938781114105e-05, |
| "loss": 0.1322, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1321100890636444, |
| "step": 1235, |
| "valid_targets_mean": 3409.4, |
| "valid_targets_min": 1814 |
| }, |
| { |
| "epoch": 1.3038906414300735, |
| "grad_norm": 0.44334440962146443, |
| "learning_rate": 3.910393316282345e-05, |
| "loss": 0.1373, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15637809038162231, |
| "step": 1240, |
| "valid_targets_mean": 3388.2, |
| "valid_targets_min": 931 |
| }, |
| { |
| "epoch": 1.3091482649842272, |
| "grad_norm": 0.3607137806447017, |
| "learning_rate": 3.9088347184592974e-05, |
| "loss": 0.1055, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11025415360927582, |
| "step": 1245, |
| "valid_targets_mean": 3544.8, |
| "valid_targets_min": 868 |
| }, |
| { |
| "epoch": 1.3144058885383807, |
| "grad_norm": 0.5230434083977941, |
| "learning_rate": 3.907262998359539e-05, |
| "loss": 0.1259, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14851859211921692, |
| "step": 1250, |
| "valid_targets_mean": 1959.2, |
| "valid_targets_min": 664 |
| }, |
| { |
| "epoch": 1.3196635120925342, |
| "grad_norm": 0.3595859099697419, |
| "learning_rate": 3.905678166787852e-05, |
| "loss": 0.1315, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11665290594100952, |
| "step": 1255, |
| "valid_targets_mean": 3505.8, |
| "valid_targets_min": 1141 |
| }, |
| { |
| "epoch": 1.3249211356466877, |
| "grad_norm": 0.41971352909758153, |
| "learning_rate": 3.9040802346391555e-05, |
| "loss": 0.1033, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12182092666625977, |
| "step": 1260, |
| "valid_targets_mean": 3273.2, |
| "valid_targets_min": 1003 |
| }, |
| { |
| "epoch": 1.3301787592008412, |
| "grad_norm": 0.3417759830933672, |
| "learning_rate": 3.902469212898427e-05, |
| "loss": 0.1284, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09475494921207428, |
| "step": 1265, |
| "valid_targets_mean": 3075.9, |
| "valid_targets_min": 531 |
| }, |
| { |
| "epoch": 1.3354363827549949, |
| "grad_norm": 0.36936309510293913, |
| "learning_rate": 3.900845112640631e-05, |
| "loss": 0.1289, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10651171207427979, |
| "step": 1270, |
| "valid_targets_mean": 3199.6, |
| "valid_targets_min": 1003 |
| }, |
| { |
| "epoch": 1.3406940063091484, |
| "grad_norm": 0.4856438902289461, |
| "learning_rate": 3.8992079450306355e-05, |
| "loss": 0.1506, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12961041927337646, |
| "step": 1275, |
| "valid_targets_mean": 2010.4, |
| "valid_targets_min": 597 |
| }, |
| { |
| "epoch": 1.3459516298633019, |
| "grad_norm": 0.3972055097835021, |
| "learning_rate": 3.897557721323145e-05, |
| "loss": 0.1234, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10769897699356079, |
| "step": 1280, |
| "valid_targets_mean": 2575.9, |
| "valid_targets_min": 665 |
| }, |
| { |
| "epoch": 1.3512092534174553, |
| "grad_norm": 0.49578984115567115, |
| "learning_rate": 3.895894452862614e-05, |
| "loss": 0.1474, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1176232397556305, |
| "step": 1285, |
| "valid_targets_mean": 1814.0, |
| "valid_targets_min": 853 |
| }, |
| { |
| "epoch": 1.3564668769716088, |
| "grad_norm": 0.4524392989778532, |
| "learning_rate": 3.894218151083176e-05, |
| "loss": 0.1305, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1428132802248001, |
| "step": 1290, |
| "valid_targets_mean": 2043.7, |
| "valid_targets_min": 708 |
| }, |
| { |
| "epoch": 1.3617245005257623, |
| "grad_norm": 1.0125437273334468, |
| "learning_rate": 3.892528827508562e-05, |
| "loss": 0.1372, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13234540820121765, |
| "step": 1295, |
| "valid_targets_mean": 1978.1, |
| "valid_targets_min": 617 |
| }, |
| { |
| "epoch": 1.3669821240799158, |
| "grad_norm": 0.3298011944841812, |
| "learning_rate": 3.890826493752018e-05, |
| "loss": 0.1153, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08677037805318832, |
| "step": 1300, |
| "valid_targets_mean": 3022.0, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 1.3722397476340693, |
| "grad_norm": 0.37813410033822, |
| "learning_rate": 3.8891111615162314e-05, |
| "loss": 0.1169, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08522579818964005, |
| "step": 1305, |
| "valid_targets_mean": 3080.2, |
| "valid_targets_min": 785 |
| }, |
| { |
| "epoch": 1.3774973711882228, |
| "grad_norm": 0.5306661224388369, |
| "learning_rate": 3.8873828425932486e-05, |
| "loss": 0.1525, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13316848874092102, |
| "step": 1310, |
| "valid_targets_mean": 1886.2, |
| "valid_targets_min": 446 |
| }, |
| { |
| "epoch": 1.3827549947423765, |
| "grad_norm": 0.40366072200168523, |
| "learning_rate": 3.8856415488643885e-05, |
| "loss": 0.1085, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11138216406106949, |
| "step": 1315, |
| "valid_targets_mean": 3074.6, |
| "valid_targets_min": 681 |
| }, |
| { |
| "epoch": 1.38801261829653, |
| "grad_norm": 0.3901441629273313, |
| "learning_rate": 3.88388729230017e-05, |
| "loss": 0.1181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14005088806152344, |
| "step": 1320, |
| "valid_targets_mean": 3278.7, |
| "valid_targets_min": 555 |
| }, |
| { |
| "epoch": 1.3932702418506835, |
| "grad_norm": 0.3810101607613737, |
| "learning_rate": 3.8821200849602215e-05, |
| "loss": 0.1154, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1122380867600441, |
| "step": 1325, |
| "valid_targets_mean": 3133.0, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 1.398527865404837, |
| "grad_norm": 0.31729598628056144, |
| "learning_rate": 3.880339938993204e-05, |
| "loss": 0.1011, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08910711109638214, |
| "step": 1330, |
| "valid_targets_mean": 4206.8, |
| "valid_targets_min": 861 |
| }, |
| { |
| "epoch": 1.4037854889589905, |
| "grad_norm": 0.4498381595826103, |
| "learning_rate": 3.878546866636724e-05, |
| "loss": 0.1134, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1521395891904831, |
| "step": 1335, |
| "valid_targets_mean": 4073.1, |
| "valid_targets_min": 2020 |
| }, |
| { |
| "epoch": 1.4090431125131442, |
| "grad_norm": 0.3693012263191996, |
| "learning_rate": 3.876740880217248e-05, |
| "loss": 0.1182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10957978665828705, |
| "step": 1340, |
| "valid_targets_mean": 3804.0, |
| "valid_targets_min": 1286 |
| }, |
| { |
| "epoch": 1.4143007360672977, |
| "grad_norm": 0.37262062800960377, |
| "learning_rate": 3.874921992150026e-05, |
| "loss": 0.1426, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12414566427469254, |
| "step": 1345, |
| "valid_targets_mean": 3684.8, |
| "valid_targets_min": 2652 |
| }, |
| { |
| "epoch": 1.4195583596214512, |
| "grad_norm": 0.4731245735319154, |
| "learning_rate": 3.873090214938994e-05, |
| "loss": 0.1418, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24099209904670715, |
| "step": 1350, |
| "valid_targets_mean": 3169.3, |
| "valid_targets_min": 764 |
| }, |
| { |
| "epoch": 1.4248159831756047, |
| "grad_norm": 0.4662014451698648, |
| "learning_rate": 3.871245561176698e-05, |
| "loss": 0.097, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13270971179008484, |
| "step": 1355, |
| "valid_targets_mean": 2353.6, |
| "valid_targets_min": 815 |
| }, |
| { |
| "epoch": 1.4300736067297581, |
| "grad_norm": 0.38093091702914345, |
| "learning_rate": 3.869388043544204e-05, |
| "loss": 0.1442, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12183333933353424, |
| "step": 1360, |
| "valid_targets_mean": 2968.9, |
| "valid_targets_min": 485 |
| }, |
| { |
| "epoch": 1.4353312302839116, |
| "grad_norm": 0.38728961412748175, |
| "learning_rate": 3.8675176748110076e-05, |
| "loss": 0.1154, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12194234132766724, |
| "step": 1365, |
| "valid_targets_mean": 3372.6, |
| "valid_targets_min": 854 |
| }, |
| { |
| "epoch": 1.4405888538380651, |
| "grad_norm": 0.3774155606511259, |
| "learning_rate": 3.865634467834953e-05, |
| "loss": 0.1255, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10121260583400726, |
| "step": 1370, |
| "valid_targets_mean": 3453.6, |
| "valid_targets_min": 743 |
| }, |
| { |
| "epoch": 1.4458464773922186, |
| "grad_norm": 0.5421737966727603, |
| "learning_rate": 3.863738435562139e-05, |
| "loss": 0.1417, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18703538179397583, |
| "step": 1375, |
| "valid_targets_mean": 2007.8, |
| "valid_targets_min": 706 |
| }, |
| { |
| "epoch": 1.4511041009463723, |
| "grad_norm": 0.47373152021408965, |
| "learning_rate": 3.8618295910268316e-05, |
| "loss": 0.17, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17668291926383972, |
| "step": 1380, |
| "valid_targets_mean": 2666.4, |
| "valid_targets_min": 675 |
| }, |
| { |
| "epoch": 1.4563617245005258, |
| "grad_norm": 0.44800091705976475, |
| "learning_rate": 3.859907947351374e-05, |
| "loss": 0.1304, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11316927522420883, |
| "step": 1385, |
| "valid_targets_mean": 2688.8, |
| "valid_targets_min": 663 |
| }, |
| { |
| "epoch": 1.4616193480546793, |
| "grad_norm": 0.543936965602729, |
| "learning_rate": 3.8579735177460994e-05, |
| "loss": 0.1224, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1301974058151245, |
| "step": 1390, |
| "valid_targets_mean": 1787.4, |
| "valid_targets_min": 716 |
| }, |
| { |
| "epoch": 1.4668769716088328, |
| "grad_norm": 0.39623239314685016, |
| "learning_rate": 3.856026315509236e-05, |
| "loss": 0.1151, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11998635530471802, |
| "step": 1395, |
| "valid_targets_mean": 2952.1, |
| "valid_targets_min": 542 |
| }, |
| { |
| "epoch": 1.4721345951629863, |
| "grad_norm": 0.48915348895790417, |
| "learning_rate": 3.8540663540268175e-05, |
| "loss": 0.1171, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12732747197151184, |
| "step": 1400, |
| "valid_targets_mean": 2716.6, |
| "valid_targets_min": 798 |
| }, |
| { |
| "epoch": 1.4773922187171398, |
| "grad_norm": 0.4545764492795325, |
| "learning_rate": 3.852093646772592e-05, |
| "loss": 0.1029, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10610067844390869, |
| "step": 1405, |
| "valid_targets_mean": 2416.6, |
| "valid_targets_min": 635 |
| }, |
| { |
| "epoch": 1.4826498422712935, |
| "grad_norm": 0.3878130056324593, |
| "learning_rate": 3.850108207307927e-05, |
| "loss": 0.1447, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09582462161779404, |
| "step": 1410, |
| "valid_targets_mean": 2784.3, |
| "valid_targets_min": 794 |
| }, |
| { |
| "epoch": 1.487907465825447, |
| "grad_norm": 0.4140660738101145, |
| "learning_rate": 3.848110049281719e-05, |
| "loss": 0.1025, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1034550666809082, |
| "step": 1415, |
| "valid_targets_mean": 2285.6, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 1.4931650893796005, |
| "grad_norm": 0.4169602584296961, |
| "learning_rate": 3.846099186430297e-05, |
| "loss": 0.1147, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10001115500926971, |
| "step": 1420, |
| "valid_targets_mean": 2570.1, |
| "valid_targets_min": 529 |
| }, |
| { |
| "epoch": 1.498422712933754, |
| "grad_norm": 0.4012394343569159, |
| "learning_rate": 3.8440756325773296e-05, |
| "loss": 0.1255, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1347663551568985, |
| "step": 1425, |
| "valid_targets_mean": 3507.9, |
| "valid_targets_min": 2017 |
| }, |
| { |
| "epoch": 1.5036803364879074, |
| "grad_norm": 0.32637843623804386, |
| "learning_rate": 3.84203940163373e-05, |
| "loss": 0.1129, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11265628039836884, |
| "step": 1430, |
| "valid_targets_mean": 4252.3, |
| "valid_targets_min": 516 |
| }, |
| { |
| "epoch": 1.508937960042061, |
| "grad_norm": 0.3321727896661518, |
| "learning_rate": 3.83999050759756e-05, |
| "loss": 0.1038, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11609843373298645, |
| "step": 1435, |
| "valid_targets_mean": 3945.1, |
| "valid_targets_min": 775 |
| }, |
| { |
| "epoch": 1.5141955835962144, |
| "grad_norm": 0.3104261170739649, |
| "learning_rate": 3.837928964553933e-05, |
| "loss": 0.1091, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09658493101596832, |
| "step": 1440, |
| "valid_targets_mean": 3760.6, |
| "valid_targets_min": 605 |
| }, |
| { |
| "epoch": 1.519453207150368, |
| "grad_norm": 0.4810387672796794, |
| "learning_rate": 3.835854786674918e-05, |
| "loss": 0.1967, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28749269247055054, |
| "step": 1445, |
| "valid_targets_mean": 2532.4, |
| "valid_targets_min": 1132 |
| }, |
| { |
| "epoch": 1.5247108307045214, |
| "grad_norm": 0.388376390316912, |
| "learning_rate": 3.8337679882194443e-05, |
| "loss": 0.1358, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11735714226961136, |
| "step": 1450, |
| "valid_targets_mean": 3141.9, |
| "valid_targets_min": 527 |
| }, |
| { |
| "epoch": 1.5299684542586751, |
| "grad_norm": 0.3997705496398304, |
| "learning_rate": 3.8316685835331984e-05, |
| "loss": 0.1196, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1308724582195282, |
| "step": 1455, |
| "valid_targets_mean": 3037.3, |
| "valid_targets_min": 717 |
| }, |
| { |
| "epoch": 1.5352260778128286, |
| "grad_norm": 0.4084041955754898, |
| "learning_rate": 3.8295565870485295e-05, |
| "loss": 0.112, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14215297996997833, |
| "step": 1460, |
| "valid_targets_mean": 2589.2, |
| "valid_targets_min": 927 |
| }, |
| { |
| "epoch": 1.540483701366982, |
| "grad_norm": 1.0405850837591837, |
| "learning_rate": 3.827432013284349e-05, |
| "loss": 0.2353, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2418077439069748, |
| "step": 1465, |
| "valid_targets_mean": 1337.4, |
| "valid_targets_min": 788 |
| }, |
| { |
| "epoch": 1.5457413249211358, |
| "grad_norm": 0.7561965502287827, |
| "learning_rate": 3.825294876846031e-05, |
| "loss": 0.2251, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22426745295524597, |
| "step": 1470, |
| "valid_targets_mean": 1537.9, |
| "valid_targets_min": 957 |
| }, |
| { |
| "epoch": 1.5509989484752893, |
| "grad_norm": 0.7053409554245997, |
| "learning_rate": 3.823145192425313e-05, |
| "loss": 0.2172, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2108028531074524, |
| "step": 1475, |
| "valid_targets_mean": 1543.2, |
| "valid_targets_min": 796 |
| }, |
| { |
| "epoch": 1.5562565720294428, |
| "grad_norm": 0.8560460096033154, |
| "learning_rate": 3.8209829748001894e-05, |
| "loss": 0.2162, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21613195538520813, |
| "step": 1480, |
| "valid_targets_mean": 1313.4, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 1.5615141955835963, |
| "grad_norm": 0.6936760698646955, |
| "learning_rate": 3.8188082388348186e-05, |
| "loss": 0.2177, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2191494256258011, |
| "step": 1485, |
| "valid_targets_mean": 1616.7, |
| "valid_targets_min": 638 |
| }, |
| { |
| "epoch": 1.5667718191377498, |
| "grad_norm": 0.7263767449141347, |
| "learning_rate": 3.816620999479413e-05, |
| "loss": 0.2088, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21552985906600952, |
| "step": 1490, |
| "valid_targets_mean": 1660.6, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 1.5720294426919033, |
| "grad_norm": 0.7470609642858503, |
| "learning_rate": 3.8144212717701424e-05, |
| "loss": 0.2187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1965349316596985, |
| "step": 1495, |
| "valid_targets_mean": 1361.5, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 1.5772870662460567, |
| "grad_norm": 0.9342679902589415, |
| "learning_rate": 3.812209070829025e-05, |
| "loss": 0.2012, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20799431204795837, |
| "step": 1500, |
| "valid_targets_mean": 1297.8, |
| "valid_targets_min": 714 |
| }, |
| { |
| "epoch": 1.5825446898002102, |
| "grad_norm": 0.7551967053680876, |
| "learning_rate": 3.809984411863828e-05, |
| "loss": 0.2213, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20301692187786102, |
| "step": 1505, |
| "valid_targets_mean": 1455.5, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 1.5878023133543637, |
| "grad_norm": 0.6963522007321089, |
| "learning_rate": 3.80774731016796e-05, |
| "loss": 0.2136, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23237518966197968, |
| "step": 1510, |
| "valid_targets_mean": 2029.8, |
| "valid_targets_min": 663 |
| }, |
| { |
| "epoch": 1.5930599369085172, |
| "grad_norm": 0.8478435228214879, |
| "learning_rate": 3.805497781120369e-05, |
| "loss": 0.2056, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21179191768169403, |
| "step": 1515, |
| "valid_targets_mean": 1525.1, |
| "valid_targets_min": 632 |
| }, |
| { |
| "epoch": 1.598317560462671, |
| "grad_norm": 0.8260682380140899, |
| "learning_rate": 3.8032358401854315e-05, |
| "loss": 0.2179, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2055744230747223, |
| "step": 1520, |
| "valid_targets_mean": 1709.6, |
| "valid_targets_min": 933 |
| }, |
| { |
| "epoch": 1.6035751840168244, |
| "grad_norm": 0.7710629303909796, |
| "learning_rate": 3.800961502912854e-05, |
| "loss": 0.2064, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19703570008277893, |
| "step": 1525, |
| "valid_targets_mean": 1535.0, |
| "valid_targets_min": 717 |
| }, |
| { |
| "epoch": 1.608832807570978, |
| "grad_norm": 0.71690856447056, |
| "learning_rate": 3.798674784937557e-05, |
| "loss": 0.1955, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1880686730146408, |
| "step": 1530, |
| "valid_targets_mean": 1315.5, |
| "valid_targets_min": 659 |
| }, |
| { |
| "epoch": 1.6140904311251314, |
| "grad_norm": 0.710257374011556, |
| "learning_rate": 3.7963757019795756e-05, |
| "loss": 0.1952, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18850678205490112, |
| "step": 1535, |
| "valid_targets_mean": 1413.6, |
| "valid_targets_min": 642 |
| }, |
| { |
| "epoch": 1.619348054679285, |
| "grad_norm": 0.7832129294341599, |
| "learning_rate": 3.794064269843946e-05, |
| "loss": 0.2067, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19041520357131958, |
| "step": 1540, |
| "valid_targets_mean": 1340.9, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 1.6246056782334386, |
| "grad_norm": 0.7978203152836152, |
| "learning_rate": 3.791740504420599e-05, |
| "loss": 0.2147, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21219009160995483, |
| "step": 1545, |
| "valid_targets_mean": 1332.8, |
| "valid_targets_min": 631 |
| }, |
| { |
| "epoch": 1.629863301787592, |
| "grad_norm": 0.8191454502035843, |
| "learning_rate": 3.789404421684251e-05, |
| "loss": 0.2153, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22539633512496948, |
| "step": 1550, |
| "valid_targets_mean": 1548.9, |
| "valid_targets_min": 623 |
| }, |
| { |
| "epoch": 1.6351209253417456, |
| "grad_norm": 1.6820546329379997, |
| "learning_rate": 3.787056037694293e-05, |
| "loss": 0.2099, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23396363854408264, |
| "step": 1555, |
| "valid_targets_mean": 1934.2, |
| "valid_targets_min": 818 |
| }, |
| { |
| "epoch": 1.640378548895899, |
| "grad_norm": 0.6806945395207281, |
| "learning_rate": 3.784695368594682e-05, |
| "loss": 0.2023, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1954052448272705, |
| "step": 1560, |
| "valid_targets_mean": 1563.4, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 1.6456361724500526, |
| "grad_norm": 0.955894092558591, |
| "learning_rate": 3.782322430613828e-05, |
| "loss": 0.2077, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21555835008621216, |
| "step": 1565, |
| "valid_targets_mean": 1428.6, |
| "valid_targets_min": 623 |
| }, |
| { |
| "epoch": 1.650893796004206, |
| "grad_norm": 0.7923665874268049, |
| "learning_rate": 3.779937240064484e-05, |
| "loss": 0.2127, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21493303775787354, |
| "step": 1570, |
| "valid_targets_mean": 1461.2, |
| "valid_targets_min": 693 |
| }, |
| { |
| "epoch": 1.6561514195583595, |
| "grad_norm": 0.7575966597313151, |
| "learning_rate": 3.777539813343634e-05, |
| "loss": 0.2044, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17569950222969055, |
| "step": 1575, |
| "valid_targets_mean": 1157.9, |
| "valid_targets_min": 611 |
| }, |
| { |
| "epoch": 1.661409043112513, |
| "grad_norm": 0.7956598922283731, |
| "learning_rate": 3.7751301669323776e-05, |
| "loss": 0.1992, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21564935147762299, |
| "step": 1580, |
| "valid_targets_mean": 1616.5, |
| "valid_targets_min": 793 |
| }, |
| { |
| "epoch": 1.6666666666666665, |
| "grad_norm": 0.6908537802167536, |
| "learning_rate": 3.772708317395818e-05, |
| "loss": 0.1986, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19004574418067932, |
| "step": 1585, |
| "valid_targets_mean": 1568.1, |
| "valid_targets_min": 563 |
| }, |
| { |
| "epoch": 1.6719242902208202, |
| "grad_norm": 0.6820529239345657, |
| "learning_rate": 3.770274281382952e-05, |
| "loss": 0.2016, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19403985142707825, |
| "step": 1590, |
| "valid_targets_mean": 1546.9, |
| "valid_targets_min": 837 |
| }, |
| { |
| "epoch": 1.6771819137749737, |
| "grad_norm": 0.7629916835976289, |
| "learning_rate": 3.767828075626551e-05, |
| "loss": 0.1983, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2039937674999237, |
| "step": 1595, |
| "valid_targets_mean": 1719.1, |
| "valid_targets_min": 1107 |
| }, |
| { |
| "epoch": 1.6824395373291272, |
| "grad_norm": 0.8051713078365255, |
| "learning_rate": 3.7653697169430456e-05, |
| "loss": 0.2103, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2031601071357727, |
| "step": 1600, |
| "valid_targets_mean": 1550.2, |
| "valid_targets_min": 680 |
| }, |
| { |
| "epoch": 1.687697160883281, |
| "grad_norm": 0.7186372548592179, |
| "learning_rate": 3.762899222232413e-05, |
| "loss": 0.192, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21175065636634827, |
| "step": 1605, |
| "valid_targets_mean": 1599.1, |
| "valid_targets_min": 803 |
| }, |
| { |
| "epoch": 1.6929547844374344, |
| "grad_norm": 0.8027005235096604, |
| "learning_rate": 3.760416608478061e-05, |
| "loss": 0.199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20356839895248413, |
| "step": 1610, |
| "valid_targets_mean": 1565.1, |
| "valid_targets_min": 631 |
| }, |
| { |
| "epoch": 1.698212407991588, |
| "grad_norm": 0.7469552681571042, |
| "learning_rate": 3.7579218927467044e-05, |
| "loss": 0.2017, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1995268613100052, |
| "step": 1615, |
| "valid_targets_mean": 1662.8, |
| "valid_targets_min": 804 |
| }, |
| { |
| "epoch": 1.7034700315457414, |
| "grad_norm": 0.7343071593308167, |
| "learning_rate": 3.7554150921882596e-05, |
| "loss": 0.2039, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19197341799736023, |
| "step": 1620, |
| "valid_targets_mean": 1515.2, |
| "valid_targets_min": 675 |
| }, |
| { |
| "epoch": 1.7087276550998949, |
| "grad_norm": 0.7860772677556097, |
| "learning_rate": 3.752896224035716e-05, |
| "loss": 0.1955, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2085728496313095, |
| "step": 1625, |
| "valid_targets_mean": 1305.0, |
| "valid_targets_min": 856 |
| }, |
| { |
| "epoch": 1.7139852786540484, |
| "grad_norm": 0.7234624946863873, |
| "learning_rate": 3.750365305605024e-05, |
| "loss": 0.1923, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.187704399228096, |
| "step": 1630, |
| "valid_targets_mean": 1516.9, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 1.7192429022082019, |
| "grad_norm": 0.7878834002834912, |
| "learning_rate": 3.7478223542949704e-05, |
| "loss": 0.1853, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19672289490699768, |
| "step": 1635, |
| "valid_targets_mean": 1515.6, |
| "valid_targets_min": 678 |
| }, |
| { |
| "epoch": 1.7245005257623554, |
| "grad_norm": 0.813682661334051, |
| "learning_rate": 3.745267387587065e-05, |
| "loss": 0.2057, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22412776947021484, |
| "step": 1640, |
| "valid_targets_mean": 1387.8, |
| "valid_targets_min": 676 |
| }, |
| { |
| "epoch": 1.7297581493165088, |
| "grad_norm": 0.9732801791083533, |
| "learning_rate": 3.742700423045416e-05, |
| "loss": 0.1904, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17012116312980652, |
| "step": 1645, |
| "valid_targets_mean": 1388.9, |
| "valid_targets_min": 794 |
| }, |
| { |
| "epoch": 1.7350157728706623, |
| "grad_norm": 1.0706073408996923, |
| "learning_rate": 3.7401214783166116e-05, |
| "loss": 0.2, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1910264492034912, |
| "step": 1650, |
| "valid_targets_mean": 1379.6, |
| "valid_targets_min": 607 |
| }, |
| { |
| "epoch": 1.7402733964248158, |
| "grad_norm": 0.7300646659459774, |
| "learning_rate": 3.737530571129596e-05, |
| "loss": 0.1957, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2033732682466507, |
| "step": 1655, |
| "valid_targets_mean": 1653.4, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 1.7455310199789695, |
| "grad_norm": 0.7482338087375434, |
| "learning_rate": 3.734927719295551e-05, |
| "loss": 0.2054, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21667127311229706, |
| "step": 1660, |
| "valid_targets_mean": 1650.9, |
| "valid_targets_min": 858 |
| }, |
| { |
| "epoch": 1.750788643533123, |
| "grad_norm": 0.7699160727826564, |
| "learning_rate": 3.732312940707772e-05, |
| "loss": 0.1886, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21378806233406067, |
| "step": 1665, |
| "valid_targets_mean": 1565.1, |
| "valid_targets_min": 689 |
| }, |
| { |
| "epoch": 1.7560462670872765, |
| "grad_norm": 0.784999055449363, |
| "learning_rate": 3.729686253341543e-05, |
| "loss": 0.2056, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20358502864837646, |
| "step": 1670, |
| "valid_targets_mean": 1414.7, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 1.7613038906414302, |
| "grad_norm": 0.7718884541425045, |
| "learning_rate": 3.7270476752540163e-05, |
| "loss": 0.2011, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19702203571796417, |
| "step": 1675, |
| "valid_targets_mean": 1472.6, |
| "valid_targets_min": 828 |
| }, |
| { |
| "epoch": 1.7665615141955837, |
| "grad_norm": 0.7650792702417181, |
| "learning_rate": 3.724397224584086e-05, |
| "loss": 0.2134, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1973450481891632, |
| "step": 1680, |
| "valid_targets_mean": 1424.0, |
| "valid_targets_min": 618 |
| }, |
| { |
| "epoch": 1.7718191377497372, |
| "grad_norm": 0.7384298303756813, |
| "learning_rate": 3.7217349195522656e-05, |
| "loss": 0.1898, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18893392384052277, |
| "step": 1685, |
| "valid_targets_mean": 1494.2, |
| "valid_targets_min": 629 |
| }, |
| { |
| "epoch": 1.7770767613038907, |
| "grad_norm": 0.7066901850808929, |
| "learning_rate": 3.7190607784605604e-05, |
| "loss": 0.2015, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22910484671592712, |
| "step": 1690, |
| "valid_targets_mean": 1844.9, |
| "valid_targets_min": 1071 |
| }, |
| { |
| "epoch": 1.7823343848580442, |
| "grad_norm": 0.7659251894049691, |
| "learning_rate": 3.716374819692341e-05, |
| "loss": 0.1993, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20867155492305756, |
| "step": 1695, |
| "valid_targets_mean": 1349.2, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 1.7875920084121977, |
| "grad_norm": 0.9231763305447974, |
| "learning_rate": 3.713677061712223e-05, |
| "loss": 0.188, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1793934404850006, |
| "step": 1700, |
| "valid_targets_mean": 1227.6, |
| "valid_targets_min": 679 |
| }, |
| { |
| "epoch": 1.7928496319663512, |
| "grad_norm": 0.7178249077539041, |
| "learning_rate": 3.7109675230659316e-05, |
| "loss": 0.1918, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1823531687259674, |
| "step": 1705, |
| "valid_targets_mean": 1427.4, |
| "valid_targets_min": 504 |
| }, |
| { |
| "epoch": 1.7981072555205047, |
| "grad_norm": 0.6988064955193508, |
| "learning_rate": 3.7082462223801784e-05, |
| "loss": 0.1967, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19073626399040222, |
| "step": 1710, |
| "valid_targets_mean": 1693.7, |
| "valid_targets_min": 1023 |
| }, |
| { |
| "epoch": 1.8033648790746581, |
| "grad_norm": 0.7467760005809908, |
| "learning_rate": 3.7055131783625364e-05, |
| "loss": 0.1994, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1814468652009964, |
| "step": 1715, |
| "valid_targets_mean": 1453.0, |
| "valid_targets_min": 661 |
| }, |
| { |
| "epoch": 1.8086225026288116, |
| "grad_norm": 0.7261516150558474, |
| "learning_rate": 3.702768409801304e-05, |
| "loss": 0.2003, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19200043380260468, |
| "step": 1720, |
| "valid_targets_mean": 1503.2, |
| "valid_targets_min": 889 |
| }, |
| { |
| "epoch": 1.8138801261829653, |
| "grad_norm": 0.7208225356867676, |
| "learning_rate": 3.700011935565384e-05, |
| "loss": 0.1921, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19593971967697144, |
| "step": 1725, |
| "valid_targets_mean": 1688.3, |
| "valid_targets_min": 723 |
| }, |
| { |
| "epoch": 1.8191377497371188, |
| "grad_norm": 0.8678640212242313, |
| "learning_rate": 3.697243774604145e-05, |
| "loss": 0.1951, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18990558385849, |
| "step": 1730, |
| "valid_targets_mean": 1409.5, |
| "valid_targets_min": 793 |
| }, |
| { |
| "epoch": 1.8243953732912723, |
| "grad_norm": 0.8771081813983874, |
| "learning_rate": 3.6944639459473e-05, |
| "loss": 0.1968, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20506446063518524, |
| "step": 1735, |
| "valid_targets_mean": 1478.6, |
| "valid_targets_min": 861 |
| }, |
| { |
| "epoch": 1.8296529968454258, |
| "grad_norm": 1.02269191180137, |
| "learning_rate": 3.69167246870477e-05, |
| "loss": 0.1904, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18175086379051208, |
| "step": 1740, |
| "valid_targets_mean": 1374.3, |
| "valid_targets_min": 752 |
| }, |
| { |
| "epoch": 1.8349106203995795, |
| "grad_norm": 0.8693649422959702, |
| "learning_rate": 3.6888693620665546e-05, |
| "loss": 0.1988, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20953771471977234, |
| "step": 1745, |
| "valid_targets_mean": 1828.4, |
| "valid_targets_min": 789 |
| }, |
| { |
| "epoch": 1.840168243953733, |
| "grad_norm": 0.7679695979527971, |
| "learning_rate": 3.686054645302598e-05, |
| "loss": 0.177, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1746317595243454, |
| "step": 1750, |
| "valid_targets_mean": 1423.6, |
| "valid_targets_min": 638 |
| }, |
| { |
| "epoch": 1.8454258675078865, |
| "grad_norm": 0.8129646630161029, |
| "learning_rate": 3.6832283377626603e-05, |
| "loss": 0.1919, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21307937800884247, |
| "step": 1755, |
| "valid_targets_mean": 1504.5, |
| "valid_targets_min": 605 |
| }, |
| { |
| "epoch": 1.85068349106204, |
| "grad_norm": 0.7270464458683336, |
| "learning_rate": 3.680390458876182e-05, |
| "loss": 0.1964, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19682200253009796, |
| "step": 1760, |
| "valid_targets_mean": 1852.8, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 1.8559411146161935, |
| "grad_norm": 0.7909843914542467, |
| "learning_rate": 3.67754102815215e-05, |
| "loss": 0.1822, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1827111393213272, |
| "step": 1765, |
| "valid_targets_mean": 1197.2, |
| "valid_targets_min": 723 |
| }, |
| { |
| "epoch": 1.861198738170347, |
| "grad_norm": 0.6951127380664675, |
| "learning_rate": 3.6746800651789636e-05, |
| "loss": 0.2001, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19025492668151855, |
| "step": 1770, |
| "valid_targets_mean": 1528.6, |
| "valid_targets_min": 855 |
| }, |
| { |
| "epoch": 1.8664563617245005, |
| "grad_norm": 0.6650274684528676, |
| "learning_rate": 3.671807589624302e-05, |
| "loss": 0.1928, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18363268673419952, |
| "step": 1775, |
| "valid_targets_mean": 1590.4, |
| "valid_targets_min": 902 |
| }, |
| { |
| "epoch": 1.871713985278654, |
| "grad_norm": 0.7314659087088272, |
| "learning_rate": 3.6689236212349865e-05, |
| "loss": 0.1978, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18726280331611633, |
| "step": 1780, |
| "valid_targets_mean": 1551.3, |
| "valid_targets_min": 803 |
| }, |
| { |
| "epoch": 1.8769716088328074, |
| "grad_norm": 0.7802901129743159, |
| "learning_rate": 3.6660281798368485e-05, |
| "loss": 0.1982, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21072804927825928, |
| "step": 1785, |
| "valid_targets_mean": 1491.0, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 1.882229232386961, |
| "grad_norm": 0.7317197718747478, |
| "learning_rate": 3.663121285334586e-05, |
| "loss": 0.1899, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1848827451467514, |
| "step": 1790, |
| "valid_targets_mean": 1486.4, |
| "valid_targets_min": 1124 |
| }, |
| { |
| "epoch": 1.8874868559411146, |
| "grad_norm": 0.7757656842265135, |
| "learning_rate": 3.660202957711635e-05, |
| "loss": 0.2021, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2078087031841278, |
| "step": 1795, |
| "valid_targets_mean": 1528.4, |
| "valid_targets_min": 655 |
| }, |
| { |
| "epoch": 1.8927444794952681, |
| "grad_norm": 0.7812219293764121, |
| "learning_rate": 3.657273217030026e-05, |
| "loss": 0.1975, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2079935371875763, |
| "step": 1800, |
| "valid_targets_mean": 1507.2, |
| "valid_targets_min": 667 |
| }, |
| { |
| "epoch": 1.8980021030494216, |
| "grad_norm": 0.7515491496035672, |
| "learning_rate": 3.654332083430252e-05, |
| "loss": 0.2025, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2115655392408371, |
| "step": 1805, |
| "valid_targets_mean": 1626.7, |
| "valid_targets_min": 1012 |
| }, |
| { |
| "epoch": 1.9032597266035753, |
| "grad_norm": 0.7848376700855773, |
| "learning_rate": 3.651379577131121e-05, |
| "loss": 0.2005, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2028706669807434, |
| "step": 1810, |
| "valid_targets_mean": 1362.2, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 1.9085173501577288, |
| "grad_norm": 0.8019585509267635, |
| "learning_rate": 3.648415718429629e-05, |
| "loss": 0.1994, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18479974567890167, |
| "step": 1815, |
| "valid_targets_mean": 1613.3, |
| "valid_targets_min": 821 |
| }, |
| { |
| "epoch": 1.9137749737118823, |
| "grad_norm": 0.7471485325109173, |
| "learning_rate": 3.6454405277008087e-05, |
| "loss": 0.188, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17082153260707855, |
| "step": 1820, |
| "valid_targets_mean": 1164.2, |
| "valid_targets_min": 620 |
| }, |
| { |
| "epoch": 1.9190325972660358, |
| "grad_norm": 0.7351089773431005, |
| "learning_rate": 3.6424540253975985e-05, |
| "loss": 0.1982, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2008403092622757, |
| "step": 1825, |
| "valid_targets_mean": 1539.8, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 1.9242902208201893, |
| "grad_norm": 0.7238932187659127, |
| "learning_rate": 3.6394562320506955e-05, |
| "loss": 0.2015, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2348729819059372, |
| "step": 1830, |
| "valid_targets_mean": 1951.9, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 1.9295478443743428, |
| "grad_norm": 0.9954725097034086, |
| "learning_rate": 3.636447168268419e-05, |
| "loss": 0.1883, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18077613413333893, |
| "step": 1835, |
| "valid_targets_mean": 1668.9, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 1.9348054679284963, |
| "grad_norm": 0.7600896665159309, |
| "learning_rate": 3.633426854736566e-05, |
| "loss": 0.19, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18231940269470215, |
| "step": 1840, |
| "valid_targets_mean": 1469.9, |
| "valid_targets_min": 850 |
| }, |
| { |
| "epoch": 1.9400630914826498, |
| "grad_norm": 0.6661381415915304, |
| "learning_rate": 3.6303953122182695e-05, |
| "loss": 0.1882, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1681019514799118, |
| "step": 1845, |
| "valid_targets_mean": 1366.6, |
| "valid_targets_min": 747 |
| }, |
| { |
| "epoch": 1.9453207150368033, |
| "grad_norm": 0.7286880752866821, |
| "learning_rate": 3.6273525615538564e-05, |
| "loss": 0.2066, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18884357810020447, |
| "step": 1850, |
| "valid_targets_mean": 1576.2, |
| "valid_targets_min": 933 |
| }, |
| { |
| "epoch": 1.9505783385909568, |
| "grad_norm": 0.8435658108064998, |
| "learning_rate": 3.6242986236607046e-05, |
| "loss": 0.194, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19223934412002563, |
| "step": 1855, |
| "valid_targets_mean": 1368.4, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 1.9558359621451105, |
| "grad_norm": 0.8496444326573576, |
| "learning_rate": 3.6212335195330976e-05, |
| "loss": 0.1859, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17416611313819885, |
| "step": 1860, |
| "valid_targets_mean": 1435.2, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 1.961093585699264, |
| "grad_norm": 0.6869303661885902, |
| "learning_rate": 3.618157270242082e-05, |
| "loss": 0.187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17237621545791626, |
| "step": 1865, |
| "valid_targets_mean": 1414.9, |
| "valid_targets_min": 639 |
| }, |
| { |
| "epoch": 1.9663512092534174, |
| "grad_norm": 0.7193511315326917, |
| "learning_rate": 3.615069896935321e-05, |
| "loss": 0.1782, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1867102086544037, |
| "step": 1870, |
| "valid_targets_mean": 1274.8, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 1.971608832807571, |
| "grad_norm": 0.8698348477600781, |
| "learning_rate": 3.6119714208369506e-05, |
| "loss": 0.1945, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19367027282714844, |
| "step": 1875, |
| "valid_targets_mean": 1450.4, |
| "valid_targets_min": 610 |
| }, |
| { |
| "epoch": 1.9768664563617246, |
| "grad_norm": 0.7050591182067847, |
| "learning_rate": 3.608861863247432e-05, |
| "loss": 0.1911, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1852041482925415, |
| "step": 1880, |
| "valid_targets_mean": 1527.5, |
| "valid_targets_min": 695 |
| }, |
| { |
| "epoch": 1.9821240799158781, |
| "grad_norm": 0.7546464557552481, |
| "learning_rate": 3.6057412455434075e-05, |
| "loss": 0.1981, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20709413290023804, |
| "step": 1885, |
| "valid_targets_mean": 1575.1, |
| "valid_targets_min": 807 |
| }, |
| { |
| "epoch": 1.9873817034700316, |
| "grad_norm": 0.76980779973052, |
| "learning_rate": 3.6026095891775494e-05, |
| "loss": 0.1929, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1803637146949768, |
| "step": 1890, |
| "valid_targets_mean": 1433.2, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 1.9926393270241851, |
| "grad_norm": 0.7354279088982589, |
| "learning_rate": 3.5994669156784184e-05, |
| "loss": 0.192, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2017996460199356, |
| "step": 1895, |
| "valid_targets_mean": 1380.9, |
| "valid_targets_min": 589 |
| }, |
| { |
| "epoch": 1.9978969505783386, |
| "grad_norm": 0.689374068517502, |
| "learning_rate": 3.5963132466503107e-05, |
| "loss": 0.2006, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20561370253562927, |
| "step": 1900, |
| "valid_targets_mean": 1628.9, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 2.003154574132492, |
| "grad_norm": 0.542940870045068, |
| "learning_rate": 3.593148603773111e-05, |
| "loss": 0.1746, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20123085379600525, |
| "step": 1905, |
| "valid_targets_mean": 2469.9, |
| "valid_targets_min": 333 |
| }, |
| { |
| "epoch": 2.0084121976866456, |
| "grad_norm": 0.4419540251974538, |
| "learning_rate": 3.5899730088021455e-05, |
| "loss": 0.1276, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11125434190034866, |
| "step": 1910, |
| "valid_targets_mean": 3365.8, |
| "valid_targets_min": 589 |
| }, |
| { |
| "epoch": 2.013669821240799, |
| "grad_norm": 0.4574035567884021, |
| "learning_rate": 3.586786483568028e-05, |
| "loss": 0.1142, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12070576846599579, |
| "step": 1915, |
| "valid_targets_mean": 2654.1, |
| "valid_targets_min": 732 |
| }, |
| { |
| "epoch": 2.0189274447949526, |
| "grad_norm": 0.45773077927208944, |
| "learning_rate": 3.583589049976514e-05, |
| "loss": 0.1201, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1785980463027954, |
| "step": 1920, |
| "valid_targets_mean": 2940.4, |
| "valid_targets_min": 803 |
| }, |
| { |
| "epoch": 2.024185068349106, |
| "grad_norm": 0.3723571560691481, |
| "learning_rate": 3.580380730008348e-05, |
| "loss": 0.1056, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09178034961223602, |
| "step": 1925, |
| "valid_targets_mean": 2688.1, |
| "valid_targets_min": 641 |
| }, |
| { |
| "epoch": 2.0294426919032595, |
| "grad_norm": 0.4142851324910883, |
| "learning_rate": 3.577161545719113e-05, |
| "loss": 0.115, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1158660352230072, |
| "step": 1930, |
| "valid_targets_mean": 2836.2, |
| "valid_targets_min": 859 |
| }, |
| { |
| "epoch": 2.034700315457413, |
| "grad_norm": 0.768535775330482, |
| "learning_rate": 3.573931519239079e-05, |
| "loss": 0.1649, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20408882200717926, |
| "step": 1935, |
| "valid_targets_mean": 1436.1, |
| "valid_targets_min": 539 |
| }, |
| { |
| "epoch": 2.039957939011567, |
| "grad_norm": 0.35975117380126753, |
| "learning_rate": 3.5706906727730496e-05, |
| "loss": 0.1262, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12019376456737518, |
| "step": 1940, |
| "valid_targets_mean": 3049.2, |
| "valid_targets_min": 621 |
| }, |
| { |
| "epoch": 2.0452155625657205, |
| "grad_norm": 0.431775338996385, |
| "learning_rate": 3.567439028600211e-05, |
| "loss": 0.1244, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13193655014038086, |
| "step": 1945, |
| "valid_targets_mean": 2847.4, |
| "valid_targets_min": 966 |
| }, |
| { |
| "epoch": 2.050473186119874, |
| "grad_norm": 0.29413558380400784, |
| "learning_rate": 3.564176609073979e-05, |
| "loss": 0.1537, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08345094323158264, |
| "step": 1950, |
| "valid_targets_mean": 3693.9, |
| "valid_targets_min": 738 |
| }, |
| { |
| "epoch": 2.0557308096740274, |
| "grad_norm": 0.3461571050250875, |
| "learning_rate": 3.5609034366218426e-05, |
| "loss": 0.0966, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11638450622558594, |
| "step": 1955, |
| "valid_targets_mean": 3941.9, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 2.060988433228181, |
| "grad_norm": 0.5767856223059593, |
| "learning_rate": 3.5576195337452146e-05, |
| "loss": 0.1084, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11265841126441956, |
| "step": 1960, |
| "valid_targets_mean": 4264.9, |
| "valid_targets_min": 2385 |
| }, |
| { |
| "epoch": 2.0662460567823344, |
| "grad_norm": 0.3265656751998804, |
| "learning_rate": 3.55432492301927e-05, |
| "loss": 0.1103, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10609455406665802, |
| "step": 1965, |
| "valid_targets_mean": 4118.6, |
| "valid_targets_min": 518 |
| }, |
| { |
| "epoch": 2.071503680336488, |
| "grad_norm": 0.47898524103449897, |
| "learning_rate": 3.551019627092799e-05, |
| "loss": 0.1547, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.221329927444458, |
| "step": 1970, |
| "valid_targets_mean": 2231.9, |
| "valid_targets_min": 549 |
| }, |
| { |
| "epoch": 2.0767613038906414, |
| "grad_norm": 0.3449916365819097, |
| "learning_rate": 3.547703668688044e-05, |
| "loss": 0.0997, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09637214243412018, |
| "step": 1975, |
| "valid_targets_mean": 3676.0, |
| "valid_targets_min": 2542 |
| }, |
| { |
| "epoch": 2.082018927444795, |
| "grad_norm": 0.49967309572106877, |
| "learning_rate": 3.544377070600549e-05, |
| "loss": 0.1177, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13243040442466736, |
| "step": 1980, |
| "valid_targets_mean": 2098.3, |
| "valid_targets_min": 518 |
| }, |
| { |
| "epoch": 2.0872765509989484, |
| "grad_norm": 0.8151213576642133, |
| "learning_rate": 3.541039855699e-05, |
| "loss": 0.0956, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08248072862625122, |
| "step": 1985, |
| "valid_targets_mean": 3478.4, |
| "valid_targets_min": 844 |
| }, |
| { |
| "epoch": 2.092534174553102, |
| "grad_norm": 0.4259631434965719, |
| "learning_rate": 3.537692046925065e-05, |
| "loss": 0.1148, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11570675671100616, |
| "step": 1990, |
| "valid_targets_mean": 2926.8, |
| "valid_targets_min": 577 |
| }, |
| { |
| "epoch": 2.0977917981072554, |
| "grad_norm": 0.5756796963529887, |
| "learning_rate": 3.534333667293244e-05, |
| "loss": 0.1271, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1707330346107483, |
| "step": 1995, |
| "valid_targets_mean": 2119.7, |
| "valid_targets_min": 557 |
| }, |
| { |
| "epoch": 2.103049421661409, |
| "grad_norm": 0.48786814608305074, |
| "learning_rate": 3.5309647398907056e-05, |
| "loss": 0.1216, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12323331832885742, |
| "step": 2000, |
| "valid_targets_mean": 2935.3, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 2.108307045215563, |
| "grad_norm": 0.3837130198249333, |
| "learning_rate": 3.527585287877125e-05, |
| "loss": 0.1261, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11236828565597534, |
| "step": 2005, |
| "valid_targets_mean": 2415.7, |
| "valid_targets_min": 615 |
| }, |
| { |
| "epoch": 2.1135646687697163, |
| "grad_norm": 0.47079145732206046, |
| "learning_rate": 3.5241953344845345e-05, |
| "loss": 0.1705, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2168724089860916, |
| "step": 2010, |
| "valid_targets_mean": 3522.3, |
| "valid_targets_min": 2609 |
| }, |
| { |
| "epoch": 2.1188222923238698, |
| "grad_norm": 0.35501141623715066, |
| "learning_rate": 3.520794903017153e-05, |
| "loss": 0.1032, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08434702455997467, |
| "step": 2015, |
| "valid_targets_mean": 3968.2, |
| "valid_targets_min": 1908 |
| }, |
| { |
| "epoch": 2.1240799158780233, |
| "grad_norm": 0.5172834601624194, |
| "learning_rate": 3.517384016851235e-05, |
| "loss": 0.1158, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.126325786113739, |
| "step": 2020, |
| "valid_targets_mean": 1879.2, |
| "valid_targets_min": 714 |
| }, |
| { |
| "epoch": 2.1293375394321767, |
| "grad_norm": 0.4430125491281209, |
| "learning_rate": 3.513962699434903e-05, |
| "loss": 0.1481, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1128813624382019, |
| "step": 2025, |
| "valid_targets_mean": 3275.2, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 2.1345951629863302, |
| "grad_norm": 0.34954179186441253, |
| "learning_rate": 3.5105309742879894e-05, |
| "loss": 0.1351, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1068621426820755, |
| "step": 2030, |
| "valid_targets_mean": 3981.1, |
| "valid_targets_min": 3178 |
| }, |
| { |
| "epoch": 2.1398527865404837, |
| "grad_norm": 0.6993765687380059, |
| "learning_rate": 3.507088865001876e-05, |
| "loss": 0.1543, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28086918592453003, |
| "step": 2035, |
| "valid_targets_mean": 1794.2, |
| "valid_targets_min": 568 |
| }, |
| { |
| "epoch": 2.145110410094637, |
| "grad_norm": 0.4185105641084031, |
| "learning_rate": 3.5036363952393296e-05, |
| "loss": 0.2991, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16000577807426453, |
| "step": 2040, |
| "valid_targets_mean": 3409.7, |
| "valid_targets_min": 1248 |
| }, |
| { |
| "epoch": 2.1503680336487907, |
| "grad_norm": 0.4084098178915287, |
| "learning_rate": 3.500173588734339e-05, |
| "loss": 0.1264, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11279364675283432, |
| "step": 2045, |
| "valid_targets_mean": 3104.0, |
| "valid_targets_min": 833 |
| }, |
| { |
| "epoch": 2.155625657202944, |
| "grad_norm": 0.4730638438776189, |
| "learning_rate": 3.4967004692919555e-05, |
| "loss": 0.1227, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12906594574451447, |
| "step": 2050, |
| "valid_targets_mean": 2711.2, |
| "valid_targets_min": 751 |
| }, |
| { |
| "epoch": 2.1608832807570977, |
| "grad_norm": 0.4112493946337806, |
| "learning_rate": 3.4932170607881226e-05, |
| "loss": 0.2232, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13199396431446075, |
| "step": 2055, |
| "valid_targets_mean": 4013.1, |
| "valid_targets_min": 2594 |
| }, |
| { |
| "epoch": 2.166140904311251, |
| "grad_norm": 0.2374997504606069, |
| "learning_rate": 3.4897233871695205e-05, |
| "loss": 0.0903, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07160152494907379, |
| "step": 2060, |
| "valid_targets_mean": 5072.6, |
| "valid_targets_min": 2664 |
| }, |
| { |
| "epoch": 2.1713985278654047, |
| "grad_norm": 0.33322819897630984, |
| "learning_rate": 3.4862194724533934e-05, |
| "loss": 0.125, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09612695872783661, |
| "step": 2065, |
| "valid_targets_mean": 3613.6, |
| "valid_targets_min": 560 |
| }, |
| { |
| "epoch": 2.176656151419558, |
| "grad_norm": 0.40010571586156196, |
| "learning_rate": 3.4827053407273894e-05, |
| "loss": 0.1235, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13278815150260925, |
| "step": 2070, |
| "valid_targets_mean": 3665.6, |
| "valid_targets_min": 846 |
| }, |
| { |
| "epoch": 2.181913774973712, |
| "grad_norm": 0.35269720467851656, |
| "learning_rate": 3.4791810161493935e-05, |
| "loss": 0.1041, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10680776834487915, |
| "step": 2075, |
| "valid_targets_mean": 3572.8, |
| "valid_targets_min": 1352 |
| }, |
| { |
| "epoch": 2.1871713985278656, |
| "grad_norm": 0.3717577489913566, |
| "learning_rate": 3.47564652294736e-05, |
| "loss": 0.1004, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09458756446838379, |
| "step": 2080, |
| "valid_targets_mean": 2924.1, |
| "valid_targets_min": 533 |
| }, |
| { |
| "epoch": 2.192429022082019, |
| "grad_norm": 0.35094811666033576, |
| "learning_rate": 3.472101885419149e-05, |
| "loss": 0.1061, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10009931772947311, |
| "step": 2085, |
| "valid_targets_mean": 3237.6, |
| "valid_targets_min": 833 |
| }, |
| { |
| "epoch": 2.1976866456361726, |
| "grad_norm": 0.3349162110554798, |
| "learning_rate": 3.468547127932358e-05, |
| "loss": 0.0992, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09597519040107727, |
| "step": 2090, |
| "valid_targets_mean": 3548.4, |
| "valid_targets_min": 820 |
| }, |
| { |
| "epoch": 2.202944269190326, |
| "grad_norm": 0.5542598160258543, |
| "learning_rate": 3.4649822749241525e-05, |
| "loss": 0.1545, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3271830081939697, |
| "step": 2095, |
| "valid_targets_mean": 2446.5, |
| "valid_targets_min": 732 |
| }, |
| { |
| "epoch": 2.2082018927444795, |
| "grad_norm": 0.33183079532234444, |
| "learning_rate": 3.4614073509011e-05, |
| "loss": 0.0958, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0806136280298233, |
| "step": 2100, |
| "valid_targets_mean": 3180.4, |
| "valid_targets_min": 731 |
| }, |
| { |
| "epoch": 2.213459516298633, |
| "grad_norm": 0.6596534677060386, |
| "learning_rate": 3.4578223804390026e-05, |
| "loss": 0.1008, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14313668012619019, |
| "step": 2105, |
| "valid_targets_mean": 1303.2, |
| "valid_targets_min": 699 |
| }, |
| { |
| "epoch": 2.2187171398527865, |
| "grad_norm": 0.3140216907609009, |
| "learning_rate": 3.454227388182725e-05, |
| "loss": 0.0939, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08313123881816864, |
| "step": 2110, |
| "valid_targets_mean": 3714.1, |
| "valid_targets_min": 2353 |
| }, |
| { |
| "epoch": 2.22397476340694, |
| "grad_norm": 0.3586724911370638, |
| "learning_rate": 3.450622398846026e-05, |
| "loss": 0.0968, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09074784815311432, |
| "step": 2115, |
| "valid_targets_mean": 2580.6, |
| "valid_targets_min": 549 |
| }, |
| { |
| "epoch": 2.2292323869610935, |
| "grad_norm": 0.3882621595286078, |
| "learning_rate": 3.447007437211392e-05, |
| "loss": 0.1589, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1036640852689743, |
| "step": 2120, |
| "valid_targets_mean": 3410.4, |
| "valid_targets_min": 908 |
| }, |
| { |
| "epoch": 2.234490010515247, |
| "grad_norm": 0.3650954189123527, |
| "learning_rate": 3.443382528129862e-05, |
| "loss": 0.1278, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1459999680519104, |
| "step": 2125, |
| "valid_targets_mean": 3597.9, |
| "valid_targets_min": 2196 |
| }, |
| { |
| "epoch": 2.2397476340694005, |
| "grad_norm": 0.34573732617092917, |
| "learning_rate": 3.4397476965208604e-05, |
| "loss": 0.1175, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08166644722223282, |
| "step": 2130, |
| "valid_targets_mean": 2547.3, |
| "valid_targets_min": 598 |
| }, |
| { |
| "epoch": 2.245005257623554, |
| "grad_norm": 0.8893621770533435, |
| "learning_rate": 3.43610296737202e-05, |
| "loss": 0.1374, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19288986921310425, |
| "step": 2135, |
| "valid_targets_mean": 1077.8, |
| "valid_targets_min": 578 |
| }, |
| { |
| "epoch": 2.250262881177708, |
| "grad_norm": 0.6296113483255278, |
| "learning_rate": 3.432448365739019e-05, |
| "loss": 0.1612, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1756742000579834, |
| "step": 2140, |
| "valid_targets_mean": 1567.8, |
| "valid_targets_min": 695 |
| }, |
| { |
| "epoch": 2.2555205047318614, |
| "grad_norm": 0.4920335826042508, |
| "learning_rate": 3.4287839167454016e-05, |
| "loss": 0.1115, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1344049721956253, |
| "step": 2145, |
| "valid_targets_mean": 2367.2, |
| "valid_targets_min": 691 |
| }, |
| { |
| "epoch": 2.260778128286015, |
| "grad_norm": 0.3335058788310984, |
| "learning_rate": 3.4251096455824076e-05, |
| "loss": 0.1346, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07991436123847961, |
| "step": 2150, |
| "valid_targets_mean": 2896.5, |
| "valid_targets_min": 728 |
| }, |
| { |
| "epoch": 2.2660357518401684, |
| "grad_norm": 0.566081173021314, |
| "learning_rate": 3.421425577508799e-05, |
| "loss": 0.1179, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14447736740112305, |
| "step": 2155, |
| "valid_targets_mean": 1638.7, |
| "valid_targets_min": 523 |
| }, |
| { |
| "epoch": 2.271293375394322, |
| "grad_norm": 0.29854831308855384, |
| "learning_rate": 3.417731737850687e-05, |
| "loss": 0.1044, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09751242399215698, |
| "step": 2160, |
| "valid_targets_mean": 3837.4, |
| "valid_targets_min": 468 |
| }, |
| { |
| "epoch": 2.2765509989484753, |
| "grad_norm": 0.2768158846593977, |
| "learning_rate": 3.4140281520013595e-05, |
| "loss": 0.1093, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06398525834083557, |
| "step": 2165, |
| "valid_targets_mean": 4283.9, |
| "valid_targets_min": 580 |
| }, |
| { |
| "epoch": 2.281808622502629, |
| "grad_norm": 0.3331129838840239, |
| "learning_rate": 3.4103148454211017e-05, |
| "loss": 0.0987, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08948057889938354, |
| "step": 2170, |
| "valid_targets_mean": 3411.5, |
| "valid_targets_min": 459 |
| }, |
| { |
| "epoch": 2.2870662460567823, |
| "grad_norm": 0.4001155898199451, |
| "learning_rate": 3.4065918436370244e-05, |
| "loss": 0.0986, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10834327340126038, |
| "step": 2175, |
| "valid_targets_mean": 4137.1, |
| "valid_targets_min": 981 |
| }, |
| { |
| "epoch": 2.292323869610936, |
| "grad_norm": 0.42896798476056697, |
| "learning_rate": 3.402859172242889e-05, |
| "loss": 0.111, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14080369472503662, |
| "step": 2180, |
| "valid_targets_mean": 2630.4, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 2.2975814931650893, |
| "grad_norm": 0.3971238184329431, |
| "learning_rate": 3.399116856898931e-05, |
| "loss": 0.1197, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11015994846820831, |
| "step": 2185, |
| "valid_targets_mean": 3410.7, |
| "valid_targets_min": 904 |
| }, |
| { |
| "epoch": 2.302839116719243, |
| "grad_norm": 0.3768949180388663, |
| "learning_rate": 3.395364923331681e-05, |
| "loss": 0.1163, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10609111189842224, |
| "step": 2190, |
| "valid_targets_mean": 3752.4, |
| "valid_targets_min": 2901 |
| }, |
| { |
| "epoch": 2.3080967402733963, |
| "grad_norm": 0.31074637357652146, |
| "learning_rate": 3.391603397333793e-05, |
| "loss": 0.0998, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0925753265619278, |
| "step": 2195, |
| "valid_targets_mean": 3481.4, |
| "valid_targets_min": 1099 |
| }, |
| { |
| "epoch": 2.3133543638275498, |
| "grad_norm": 0.3695913690140418, |
| "learning_rate": 3.387832304763861e-05, |
| "loss": 0.1026, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10796241462230682, |
| "step": 2200, |
| "valid_targets_mean": 2684.7, |
| "valid_targets_min": 502 |
| }, |
| { |
| "epoch": 2.3186119873817033, |
| "grad_norm": 0.3294638432808144, |
| "learning_rate": 3.384051671546247e-05, |
| "loss": 0.1191, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08635441958904266, |
| "step": 2205, |
| "valid_targets_mean": 3121.1, |
| "valid_targets_min": 724 |
| }, |
| { |
| "epoch": 2.3238696109358568, |
| "grad_norm": 0.3183920344447794, |
| "learning_rate": 3.380261523670899e-05, |
| "loss": 0.0883, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08022461831569672, |
| "step": 2210, |
| "valid_targets_mean": 3789.8, |
| "valid_targets_min": 2769 |
| }, |
| { |
| "epoch": 2.3291272344900107, |
| "grad_norm": 0.4463409820485366, |
| "learning_rate": 3.376461887193173e-05, |
| "loss": 0.116, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1165148913860321, |
| "step": 2215, |
| "valid_targets_mean": 2666.1, |
| "valid_targets_min": 591 |
| }, |
| { |
| "epoch": 2.334384858044164, |
| "grad_norm": 0.33844289941983924, |
| "learning_rate": 3.372652788233656e-05, |
| "loss": 0.1085, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09222675114870071, |
| "step": 2220, |
| "valid_targets_mean": 2923.8, |
| "valid_targets_min": 387 |
| }, |
| { |
| "epoch": 2.3396424815983177, |
| "grad_norm": 0.38701104643296635, |
| "learning_rate": 3.368834252977982e-05, |
| "loss": 0.1276, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10978475213050842, |
| "step": 2225, |
| "valid_targets_mean": 3409.1, |
| "valid_targets_min": 872 |
| }, |
| { |
| "epoch": 2.344900105152471, |
| "grad_norm": 0.43395572047048964, |
| "learning_rate": 3.3650063076766586e-05, |
| "loss": 0.1111, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1017407700419426, |
| "step": 2230, |
| "valid_targets_mean": 2262.9, |
| "valid_targets_min": 457 |
| }, |
| { |
| "epoch": 2.3501577287066246, |
| "grad_norm": 0.8425106620660383, |
| "learning_rate": 3.3611689786448786e-05, |
| "loss": 0.1261, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16855454444885254, |
| "step": 2235, |
| "valid_targets_mean": 910.9, |
| "valid_targets_min": 482 |
| }, |
| { |
| "epoch": 2.355415352260778, |
| "grad_norm": 0.5024866854815814, |
| "learning_rate": 3.357322292262346e-05, |
| "loss": 0.1099, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16090843081474304, |
| "step": 2240, |
| "valid_targets_mean": 2117.8, |
| "valid_targets_min": 808 |
| }, |
| { |
| "epoch": 2.3606729758149316, |
| "grad_norm": 0.40285220293779767, |
| "learning_rate": 3.353466274973092e-05, |
| "loss": 0.1247, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10135935246944427, |
| "step": 2245, |
| "valid_targets_mean": 2893.4, |
| "valid_targets_min": 1010 |
| }, |
| { |
| "epoch": 2.365930599369085, |
| "grad_norm": 0.4015051019169806, |
| "learning_rate": 3.3496009532852907e-05, |
| "loss": 0.1097, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10825712978839874, |
| "step": 2250, |
| "valid_targets_mean": 2790.9, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 2.3711882229232386, |
| "grad_norm": 0.6342311432473261, |
| "learning_rate": 3.345726353771082e-05, |
| "loss": 0.1021, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13154293596744537, |
| "step": 2255, |
| "valid_targets_mean": 1478.8, |
| "valid_targets_min": 516 |
| }, |
| { |
| "epoch": 2.376445846477392, |
| "grad_norm": 0.5731636192259716, |
| "learning_rate": 3.341842503066384e-05, |
| "loss": 0.1268, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1623716652393341, |
| "step": 2260, |
| "valid_targets_mean": 1547.9, |
| "valid_targets_min": 342 |
| }, |
| { |
| "epoch": 2.3817034700315456, |
| "grad_norm": 0.30202282063557295, |
| "learning_rate": 3.3379494278707136e-05, |
| "loss": 0.099, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07995246350765228, |
| "step": 2265, |
| "valid_targets_mean": 3624.2, |
| "valid_targets_min": 1440 |
| }, |
| { |
| "epoch": 2.386961093585699, |
| "grad_norm": 0.3468460061447606, |
| "learning_rate": 3.334047154947e-05, |
| "loss": 0.0977, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09549038857221603, |
| "step": 2270, |
| "valid_targets_mean": 3963.6, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 2.392218717139853, |
| "grad_norm": 0.39242180131067933, |
| "learning_rate": 3.330135711121404e-05, |
| "loss": 0.1061, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10692383348941803, |
| "step": 2275, |
| "valid_targets_mean": 3266.2, |
| "valid_targets_min": 762 |
| }, |
| { |
| "epoch": 2.3974763406940065, |
| "grad_norm": 0.3870079009116458, |
| "learning_rate": 3.32621512328313e-05, |
| "loss": 0.0933, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09543338418006897, |
| "step": 2280, |
| "valid_targets_mean": 2855.0, |
| "valid_targets_min": 667 |
| }, |
| { |
| "epoch": 2.40273396424816, |
| "grad_norm": 0.3703157689620131, |
| "learning_rate": 3.3222854183842434e-05, |
| "loss": 0.0883, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10649106651544571, |
| "step": 2285, |
| "valid_targets_mean": 4783.7, |
| "valid_targets_min": 4077 |
| }, |
| { |
| "epoch": 2.4079915878023135, |
| "grad_norm": 0.37296492021660815, |
| "learning_rate": 3.318346623439486e-05, |
| "loss": 0.1122, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10224653780460358, |
| "step": 2290, |
| "valid_targets_mean": 3361.9, |
| "valid_targets_min": 739 |
| }, |
| { |
| "epoch": 2.413249211356467, |
| "grad_norm": 0.613317346389733, |
| "learning_rate": 3.314398765526087e-05, |
| "loss": 0.1255, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18587398529052734, |
| "step": 2295, |
| "valid_targets_mean": 3316.8, |
| "valid_targets_min": 1090 |
| }, |
| { |
| "epoch": 2.4185068349106205, |
| "grad_norm": 0.34799810137644893, |
| "learning_rate": 3.310441871783581e-05, |
| "loss": 0.1041, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11055073142051697, |
| "step": 2300, |
| "valid_targets_mean": 3220.9, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 2.423764458464774, |
| "grad_norm": 0.3474725759294151, |
| "learning_rate": 3.3064759694136165e-05, |
| "loss": 0.1059, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09245841205120087, |
| "step": 2305, |
| "valid_targets_mean": 2798.9, |
| "valid_targets_min": 774 |
| }, |
| { |
| "epoch": 2.4290220820189274, |
| "grad_norm": 0.3211516971377215, |
| "learning_rate": 3.302501085679776e-05, |
| "loss": 0.1292, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07826435565948486, |
| "step": 2310, |
| "valid_targets_mean": 3335.5, |
| "valid_targets_min": 888 |
| }, |
| { |
| "epoch": 2.434279705573081, |
| "grad_norm": 0.37928323445699264, |
| "learning_rate": 3.29851724790738e-05, |
| "loss": 0.1009, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11344511806964874, |
| "step": 2315, |
| "valid_targets_mean": 3528.7, |
| "valid_targets_min": 1048 |
| }, |
| { |
| "epoch": 2.4395373291272344, |
| "grad_norm": 0.3755096564661837, |
| "learning_rate": 3.294524483483306e-05, |
| "loss": 0.1134, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08853697776794434, |
| "step": 2320, |
| "valid_targets_mean": 2785.6, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 2.444794952681388, |
| "grad_norm": 0.4064031142972282, |
| "learning_rate": 3.290522819855799e-05, |
| "loss": 0.1093, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13916510343551636, |
| "step": 2325, |
| "valid_targets_mean": 2386.9, |
| "valid_targets_min": 647 |
| }, |
| { |
| "epoch": 2.4500525762355414, |
| "grad_norm": 0.4737468011342821, |
| "learning_rate": 3.2865122845342776e-05, |
| "loss": 0.1521, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1550787091255188, |
| "step": 2330, |
| "valid_targets_mean": 1867.8, |
| "valid_targets_min": 570 |
| }, |
| { |
| "epoch": 2.455310199789695, |
| "grad_norm": 0.40083887878600755, |
| "learning_rate": 3.282492905089151e-05, |
| "loss": 0.1263, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1032135859131813, |
| "step": 2335, |
| "valid_targets_mean": 2887.5, |
| "valid_targets_min": 665 |
| }, |
| { |
| "epoch": 2.4605678233438484, |
| "grad_norm": 0.448529254155525, |
| "learning_rate": 3.2784647091516285e-05, |
| "loss": 0.1044, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10119682550430298, |
| "step": 2340, |
| "valid_targets_mean": 2616.5, |
| "valid_targets_min": 635 |
| }, |
| { |
| "epoch": 2.465825446898002, |
| "grad_norm": 0.3678578316155038, |
| "learning_rate": 3.274427724413527e-05, |
| "loss": 0.1025, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09730895608663559, |
| "step": 2345, |
| "valid_targets_mean": 3352.6, |
| "valid_targets_min": 1591 |
| }, |
| { |
| "epoch": 2.471083070452156, |
| "grad_norm": 0.37357338465385836, |
| "learning_rate": 3.270381978627081e-05, |
| "loss": 0.1009, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09874648600816727, |
| "step": 2350, |
| "valid_targets_mean": 2663.9, |
| "valid_targets_min": 767 |
| }, |
| { |
| "epoch": 2.4763406940063093, |
| "grad_norm": 0.34497476841737584, |
| "learning_rate": 3.266327499604755e-05, |
| "loss": 0.0938, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08213254809379578, |
| "step": 2355, |
| "valid_targets_mean": 2683.7, |
| "valid_targets_min": 785 |
| }, |
| { |
| "epoch": 2.481598317560463, |
| "grad_norm": 0.47614124747407566, |
| "learning_rate": 3.262264315219049e-05, |
| "loss": 0.1269, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10567892342805862, |
| "step": 2360, |
| "valid_targets_mean": 1866.8, |
| "valid_targets_min": 758 |
| }, |
| { |
| "epoch": 2.4868559411146163, |
| "grad_norm": 0.41276266766239855, |
| "learning_rate": 3.258192453402306e-05, |
| "loss": 0.0894, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09172023832798004, |
| "step": 2365, |
| "valid_targets_mean": 3081.9, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 2.4921135646687698, |
| "grad_norm": 0.4402828465389009, |
| "learning_rate": 3.254111942146526e-05, |
| "loss": 0.1011, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11652339994907379, |
| "step": 2370, |
| "valid_targets_mean": 3014.8, |
| "valid_targets_min": 786 |
| }, |
| { |
| "epoch": 2.4973711882229233, |
| "grad_norm": 0.45876703652725737, |
| "learning_rate": 3.2500228095031677e-05, |
| "loss": 0.1038, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1287243366241455, |
| "step": 2375, |
| "valid_targets_mean": 3246.4, |
| "valid_targets_min": 1825 |
| }, |
| { |
| "epoch": 2.5026288117770767, |
| "grad_norm": 0.330009395243772, |
| "learning_rate": 3.2459250835829553e-05, |
| "loss": 0.1032, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10953538864850998, |
| "step": 2380, |
| "valid_targets_mean": 4573.3, |
| "valid_targets_min": 2274 |
| }, |
| { |
| "epoch": 2.5078864353312302, |
| "grad_norm": 0.38028006305594997, |
| "learning_rate": 3.241818792555692e-05, |
| "loss": 0.091, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1031368225812912, |
| "step": 2385, |
| "valid_targets_mean": 2921.9, |
| "valid_targets_min": 678 |
| }, |
| { |
| "epoch": 2.5131440588853837, |
| "grad_norm": 0.3153215459403795, |
| "learning_rate": 3.2377039646500565e-05, |
| "loss": 0.0989, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08835450559854507, |
| "step": 2390, |
| "valid_targets_mean": 3435.2, |
| "valid_targets_min": 580 |
| }, |
| { |
| "epoch": 2.518401682439537, |
| "grad_norm": 0.5205354367615399, |
| "learning_rate": 3.2335806281534195e-05, |
| "loss": 0.1427, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21413648128509521, |
| "step": 2395, |
| "valid_targets_mean": 2386.3, |
| "valid_targets_min": 709 |
| }, |
| { |
| "epoch": 2.5236593059936907, |
| "grad_norm": 0.3094648425320985, |
| "learning_rate": 3.229448811411639e-05, |
| "loss": 0.1532, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0807393491268158, |
| "step": 2400, |
| "valid_targets_mean": 3576.8, |
| "valid_targets_min": 1097 |
| }, |
| { |
| "epoch": 2.5289169295478446, |
| "grad_norm": 0.34166260473180343, |
| "learning_rate": 3.225308542828874e-05, |
| "loss": 0.1031, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09581205248832703, |
| "step": 2405, |
| "valid_targets_mean": 3323.8, |
| "valid_targets_min": 840 |
| }, |
| { |
| "epoch": 2.534174553101998, |
| "grad_norm": 0.34001978207460315, |
| "learning_rate": 3.221159850867385e-05, |
| "loss": 0.0964, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08724266290664673, |
| "step": 2410, |
| "valid_targets_mean": 3861.2, |
| "valid_targets_min": 2555 |
| }, |
| { |
| "epoch": 2.5394321766561516, |
| "grad_norm": 0.8902490493394284, |
| "learning_rate": 3.217002764047338e-05, |
| "loss": 0.19, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23896415531635284, |
| "step": 2415, |
| "valid_targets_mean": 1816.1, |
| "valid_targets_min": 777 |
| }, |
| { |
| "epoch": 2.544689800210305, |
| "grad_norm": 0.8203150480379091, |
| "learning_rate": 3.212837310946609e-05, |
| "loss": 0.1956, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19169892370700836, |
| "step": 2420, |
| "valid_targets_mean": 1377.1, |
| "valid_targets_min": 705 |
| }, |
| { |
| "epoch": 2.5499474237644586, |
| "grad_norm": 0.6753872059803847, |
| "learning_rate": 3.20866352020059e-05, |
| "loss": 0.187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19078339636325836, |
| "step": 2425, |
| "valid_targets_mean": 1710.3, |
| "valid_targets_min": 914 |
| }, |
| { |
| "epoch": 2.555205047318612, |
| "grad_norm": 0.706638483600412, |
| "learning_rate": 3.204481420501989e-05, |
| "loss": 0.1831, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16516169905662537, |
| "step": 2430, |
| "valid_targets_mean": 1397.1, |
| "valid_targets_min": 680 |
| }, |
| { |
| "epoch": 2.5604626708727656, |
| "grad_norm": 0.6595471125565786, |
| "learning_rate": 3.200291040600632e-05, |
| "loss": 0.1854, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19127607345581055, |
| "step": 2435, |
| "valid_targets_mean": 1962.8, |
| "valid_targets_min": 819 |
| }, |
| { |
| "epoch": 2.565720294426919, |
| "grad_norm": 1.426160309160804, |
| "learning_rate": 3.196092409303272e-05, |
| "loss": 0.1806, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.175967738032341, |
| "step": 2440, |
| "valid_targets_mean": 1393.1, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 2.5709779179810726, |
| "grad_norm": 0.9093678575023609, |
| "learning_rate": 3.1918855554733804e-05, |
| "loss": 0.1926, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17155486345291138, |
| "step": 2445, |
| "valid_targets_mean": 1529.1, |
| "valid_targets_min": 655 |
| }, |
| { |
| "epoch": 2.576235541535226, |
| "grad_norm": 0.7364876180401076, |
| "learning_rate": 3.187670508030959e-05, |
| "loss": 0.1691, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1728055775165558, |
| "step": 2450, |
| "valid_targets_mean": 1443.4, |
| "valid_targets_min": 737 |
| }, |
| { |
| "epoch": 2.5814931650893795, |
| "grad_norm": 0.7257430614438023, |
| "learning_rate": 3.183447295952334e-05, |
| "loss": 0.192, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16965501010417938, |
| "step": 2455, |
| "valid_targets_mean": 1386.6, |
| "valid_targets_min": 759 |
| }, |
| { |
| "epoch": 2.586750788643533, |
| "grad_norm": 0.9481965876284844, |
| "learning_rate": 3.1792159482699606e-05, |
| "loss": 0.1779, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19058646261692047, |
| "step": 2460, |
| "valid_targets_mean": 1630.4, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 2.5920084121976865, |
| "grad_norm": 0.6745196252466795, |
| "learning_rate": 3.174976494072222e-05, |
| "loss": 0.1831, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19411690533161163, |
| "step": 2465, |
| "valid_targets_mean": 1679.1, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 2.59726603575184, |
| "grad_norm": 0.6957842805281405, |
| "learning_rate": 3.170728962503227e-05, |
| "loss": 0.1856, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1874210089445114, |
| "step": 2470, |
| "valid_targets_mean": 1477.2, |
| "valid_targets_min": 679 |
| }, |
| { |
| "epoch": 2.6025236593059935, |
| "grad_norm": 0.7302835064708894, |
| "learning_rate": 3.1664733827626174e-05, |
| "loss": 0.1785, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18315719068050385, |
| "step": 2475, |
| "valid_targets_mean": 1314.2, |
| "valid_targets_min": 771 |
| }, |
| { |
| "epoch": 2.607781282860147, |
| "grad_norm": 0.6771269395041604, |
| "learning_rate": 3.1622097841053574e-05, |
| "loss": 0.1679, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17343896627426147, |
| "step": 2480, |
| "valid_targets_mean": 1557.2, |
| "valid_targets_min": 878 |
| }, |
| { |
| "epoch": 2.6130389064143005, |
| "grad_norm": 0.7236310093579447, |
| "learning_rate": 3.15793819584154e-05, |
| "loss": 0.1666, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16601906716823578, |
| "step": 2485, |
| "valid_targets_mean": 1591.2, |
| "valid_targets_min": 942 |
| }, |
| { |
| "epoch": 2.6182965299684544, |
| "grad_norm": 0.7213200178259118, |
| "learning_rate": 3.1536586473361815e-05, |
| "loss": 0.1749, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18070757389068604, |
| "step": 2490, |
| "valid_targets_mean": 1555.7, |
| "valid_targets_min": 675 |
| }, |
| { |
| "epoch": 2.623554153522608, |
| "grad_norm": 0.7396190616215501, |
| "learning_rate": 3.149371168009022e-05, |
| "loss": 0.1804, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19092756509780884, |
| "step": 2495, |
| "valid_targets_mean": 1650.1, |
| "valid_targets_min": 892 |
| }, |
| { |
| "epoch": 2.6288117770767614, |
| "grad_norm": 0.7750187458534707, |
| "learning_rate": 3.145075787334319e-05, |
| "loss": 0.1823, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17495709657669067, |
| "step": 2500, |
| "valid_targets_mean": 1602.0, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 2.634069400630915, |
| "grad_norm": 0.7329970218405842, |
| "learning_rate": 3.140772534840652e-05, |
| "loss": 0.1784, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1599145382642746, |
| "step": 2505, |
| "valid_targets_mean": 1368.2, |
| "valid_targets_min": 706 |
| }, |
| { |
| "epoch": 2.6393270241850684, |
| "grad_norm": 0.7142078193526387, |
| "learning_rate": 3.1364614401107126e-05, |
| "loss": 0.1832, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17636436223983765, |
| "step": 2510, |
| "valid_targets_mean": 1528.6, |
| "valid_targets_min": 548 |
| }, |
| { |
| "epoch": 2.644584647739222, |
| "grad_norm": 0.7378142813335541, |
| "learning_rate": 3.1321425327811044e-05, |
| "loss": 0.1757, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1682058572769165, |
| "step": 2515, |
| "valid_targets_mean": 1268.9, |
| "valid_targets_min": 658 |
| }, |
| { |
| "epoch": 2.6498422712933754, |
| "grad_norm": 0.8128386369892511, |
| "learning_rate": 3.127815842542138e-05, |
| "loss": 0.1822, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1758577823638916, |
| "step": 2520, |
| "valid_targets_mean": 1439.2, |
| "valid_targets_min": 650 |
| }, |
| { |
| "epoch": 2.655099894847529, |
| "grad_norm": 0.6819316448947391, |
| "learning_rate": 3.1234813991376296e-05, |
| "loss": 0.1815, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.178232803940773, |
| "step": 2525, |
| "valid_targets_mean": 1575.0, |
| "valid_targets_min": 859 |
| }, |
| { |
| "epoch": 2.6603575184016823, |
| "grad_norm": 0.7946871625400562, |
| "learning_rate": 3.119139232364693e-05, |
| "loss": 0.1629, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17829295992851257, |
| "step": 2530, |
| "valid_targets_mean": 1416.3, |
| "valid_targets_min": 728 |
| }, |
| { |
| "epoch": 2.665615141955836, |
| "grad_norm": 0.6986836916108511, |
| "learning_rate": 3.1147893720735356e-05, |
| "loss": 0.1746, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16103705763816833, |
| "step": 2535, |
| "valid_targets_mean": 1523.5, |
| "valid_targets_min": 686 |
| }, |
| { |
| "epoch": 2.6708727655099898, |
| "grad_norm": 0.7246250341804357, |
| "learning_rate": 3.110431848167255e-05, |
| "loss": 0.1729, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18969683349132538, |
| "step": 2540, |
| "valid_targets_mean": 1661.9, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 2.6761303890641432, |
| "grad_norm": 0.7382038136062588, |
| "learning_rate": 3.106066690601633e-05, |
| "loss": 0.169, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15889039635658264, |
| "step": 2545, |
| "valid_targets_mean": 1399.0, |
| "valid_targets_min": 779 |
| }, |
| { |
| "epoch": 2.6813880126182967, |
| "grad_norm": 0.7547568720929694, |
| "learning_rate": 3.101693929384927e-05, |
| "loss": 0.1832, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18250948190689087, |
| "step": 2550, |
| "valid_targets_mean": 1434.1, |
| "valid_targets_min": 729 |
| }, |
| { |
| "epoch": 2.6866456361724502, |
| "grad_norm": 0.6893158272637044, |
| "learning_rate": 3.097313594577667e-05, |
| "loss": 0.1643, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15573960542678833, |
| "step": 2555, |
| "valid_targets_mean": 1447.7, |
| "valid_targets_min": 868 |
| }, |
| { |
| "epoch": 2.6919032597266037, |
| "grad_norm": 0.7387192808250229, |
| "learning_rate": 3.092925716292447e-05, |
| "loss": 0.173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1606055051088333, |
| "step": 2560, |
| "valid_targets_mean": 1375.8, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 2.697160883280757, |
| "grad_norm": 0.7735403511546811, |
| "learning_rate": 3.088530324693719e-05, |
| "loss": 0.1738, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17704743146896362, |
| "step": 2565, |
| "valid_targets_mean": 1483.0, |
| "valid_targets_min": 793 |
| }, |
| { |
| "epoch": 2.7024185068349107, |
| "grad_norm": 0.7484459012703679, |
| "learning_rate": 3.0841274499975855e-05, |
| "loss": 0.1769, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1768781542778015, |
| "step": 2570, |
| "valid_targets_mean": 1448.5, |
| "valid_targets_min": 806 |
| }, |
| { |
| "epoch": 2.707676130389064, |
| "grad_norm": 0.6794360677514358, |
| "learning_rate": 3.079717122471591e-05, |
| "loss": 0.165, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15198001265525818, |
| "step": 2575, |
| "valid_targets_mean": 1447.2, |
| "valid_targets_min": 803 |
| }, |
| { |
| "epoch": 2.7129337539432177, |
| "grad_norm": 0.7103379285860478, |
| "learning_rate": 3.075299372434515e-05, |
| "loss": 0.1686, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16421151161193848, |
| "step": 2580, |
| "valid_targets_mean": 1570.9, |
| "valid_targets_min": 660 |
| }, |
| { |
| "epoch": 2.718191377497371, |
| "grad_norm": 0.7506927457105123, |
| "learning_rate": 3.0708742302561606e-05, |
| "loss": 0.1565, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.164239764213562, |
| "step": 2585, |
| "valid_targets_mean": 1630.4, |
| "valid_targets_min": 837 |
| }, |
| { |
| "epoch": 2.7234490010515247, |
| "grad_norm": 0.6386773921981006, |
| "learning_rate": 3.066441726357153e-05, |
| "loss": 0.1753, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16314128041267395, |
| "step": 2590, |
| "valid_targets_mean": 1617.9, |
| "valid_targets_min": 719 |
| }, |
| { |
| "epoch": 2.728706624605678, |
| "grad_norm": 0.7158515374905577, |
| "learning_rate": 3.062001891208721e-05, |
| "loss": 0.1725, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18148285150527954, |
| "step": 2595, |
| "valid_targets_mean": 1683.0, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 2.7339642481598316, |
| "grad_norm": 0.7186144055992262, |
| "learning_rate": 3.0575547553324944e-05, |
| "loss": 0.1688, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17265230417251587, |
| "step": 2600, |
| "valid_targets_mean": 1421.1, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 2.739221871713985, |
| "grad_norm": 0.7440662806077852, |
| "learning_rate": 3.053100349300291e-05, |
| "loss": 0.1667, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14547862112522125, |
| "step": 2605, |
| "valid_targets_mean": 1201.9, |
| "valid_targets_min": 655 |
| }, |
| { |
| "epoch": 2.7444794952681386, |
| "grad_norm": 0.7784488748328007, |
| "learning_rate": 3.0486387037339074e-05, |
| "loss": 0.1741, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1674884855747223, |
| "step": 2610, |
| "valid_targets_mean": 1548.8, |
| "valid_targets_min": 669 |
| }, |
| { |
| "epoch": 2.749737118822292, |
| "grad_norm": 0.7557133030957722, |
| "learning_rate": 3.0441698493049078e-05, |
| "loss": 0.1627, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1641567349433899, |
| "step": 2615, |
| "valid_targets_mean": 1451.5, |
| "valid_targets_min": 1046 |
| }, |
| { |
| "epoch": 2.7549947423764456, |
| "grad_norm": 0.7410764944434184, |
| "learning_rate": 3.0396938167344153e-05, |
| "loss": 0.1796, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18922118842601776, |
| "step": 2620, |
| "valid_targets_mean": 1700.8, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 2.7602523659305995, |
| "grad_norm": 0.7605801430873814, |
| "learning_rate": 3.0352106367928974e-05, |
| "loss": 0.1756, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17325884103775024, |
| "step": 2625, |
| "valid_targets_mean": 1699.1, |
| "valid_targets_min": 846 |
| }, |
| { |
| "epoch": 2.765509989484753, |
| "grad_norm": 0.8725228877145639, |
| "learning_rate": 3.030720340299957e-05, |
| "loss": 0.1836, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17487359046936035, |
| "step": 2630, |
| "valid_targets_mean": 1531.2, |
| "valid_targets_min": 764 |
| }, |
| { |
| "epoch": 2.7707676130389065, |
| "grad_norm": 0.6826666138018487, |
| "learning_rate": 3.0262229581241197e-05, |
| "loss": 0.163, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15830162167549133, |
| "step": 2635, |
| "valid_targets_mean": 1539.4, |
| "valid_targets_min": 822 |
| }, |
| { |
| "epoch": 2.77602523659306, |
| "grad_norm": 0.7411025839288775, |
| "learning_rate": 3.0217185211826218e-05, |
| "loss": 0.1658, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.172267884016037, |
| "step": 2640, |
| "valid_targets_mean": 1595.1, |
| "valid_targets_min": 982 |
| }, |
| { |
| "epoch": 2.7812828601472135, |
| "grad_norm": 0.6710496334883137, |
| "learning_rate": 3.0172070604411957e-05, |
| "loss": 0.1755, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16107648611068726, |
| "step": 2645, |
| "valid_targets_mean": 1443.9, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 2.786540483701367, |
| "grad_norm": 0.6758683595199071, |
| "learning_rate": 3.0126886069138623e-05, |
| "loss": 0.1658, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.156482994556427, |
| "step": 2650, |
| "valid_targets_mean": 1529.7, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 2.7917981072555205, |
| "grad_norm": 0.724592426027824, |
| "learning_rate": 3.0081631916627114e-05, |
| "loss": 0.1631, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1636800765991211, |
| "step": 2655, |
| "valid_targets_mean": 1394.7, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 2.797055730809674, |
| "grad_norm": 0.7080037251210684, |
| "learning_rate": 3.003630845797693e-05, |
| "loss": 0.1663, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1821160465478897, |
| "step": 2660, |
| "valid_targets_mean": 1693.2, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 2.8023133543638274, |
| "grad_norm": 0.6470876274014894, |
| "learning_rate": 2.9990916004763996e-05, |
| "loss": 0.1784, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17179813981056213, |
| "step": 2665, |
| "valid_targets_mean": 1675.6, |
| "valid_targets_min": 744 |
| }, |
| { |
| "epoch": 2.807570977917981, |
| "grad_norm": 0.6793283565416525, |
| "learning_rate": 2.9945454869038562e-05, |
| "loss": 0.1719, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17891114950180054, |
| "step": 2670, |
| "valid_targets_mean": 1613.5, |
| "valid_targets_min": 620 |
| }, |
| { |
| "epoch": 2.812828601472135, |
| "grad_norm": 0.7133998889044233, |
| "learning_rate": 2.9899925363323022e-05, |
| "loss": 0.1638, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16359588503837585, |
| "step": 2675, |
| "valid_targets_mean": 1419.7, |
| "valid_targets_min": 622 |
| }, |
| { |
| "epoch": 2.8180862250262884, |
| "grad_norm": 0.7225195655382499, |
| "learning_rate": 2.9854327800609775e-05, |
| "loss": 0.1735, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19478288292884827, |
| "step": 2680, |
| "valid_targets_mean": 1880.9, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 2.823343848580442, |
| "grad_norm": 0.7231916205818729, |
| "learning_rate": 2.98086624943591e-05, |
| "loss": 0.1663, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15764358639717102, |
| "step": 2685, |
| "valid_targets_mean": 1379.8, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 2.8286014721345953, |
| "grad_norm": 0.6562050600985719, |
| "learning_rate": 2.976292975849696e-05, |
| "loss": 0.1697, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16331803798675537, |
| "step": 2690, |
| "valid_targets_mean": 1691.7, |
| "valid_targets_min": 902 |
| }, |
| { |
| "epoch": 2.833859095688749, |
| "grad_norm": 0.8510035305404722, |
| "learning_rate": 2.9717129907412857e-05, |
| "loss": 0.1681, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1594816893339157, |
| "step": 2695, |
| "valid_targets_mean": 1446.9, |
| "valid_targets_min": 674 |
| }, |
| { |
| "epoch": 2.8391167192429023, |
| "grad_norm": 0.691671902637164, |
| "learning_rate": 2.9671263255957697e-05, |
| "loss": 0.1604, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14799946546554565, |
| "step": 2700, |
| "valid_targets_mean": 1252.9, |
| "valid_targets_min": 567 |
| }, |
| { |
| "epoch": 2.844374342797056, |
| "grad_norm": 0.7378873246640367, |
| "learning_rate": 2.9625330119441584e-05, |
| "loss": 0.1579, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17044302821159363, |
| "step": 2705, |
| "valid_targets_mean": 1609.3, |
| "valid_targets_min": 912 |
| }, |
| { |
| "epoch": 2.8496319663512093, |
| "grad_norm": 0.7998017274571173, |
| "learning_rate": 2.957933081363169e-05, |
| "loss": 0.1766, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1837320774793625, |
| "step": 2710, |
| "valid_targets_mean": 1729.2, |
| "valid_targets_min": 1181 |
| }, |
| { |
| "epoch": 2.854889589905363, |
| "grad_norm": 0.7805127379463831, |
| "learning_rate": 2.953326565475006e-05, |
| "loss": 0.1608, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1533714234828949, |
| "step": 2715, |
| "valid_targets_mean": 1333.9, |
| "valid_targets_min": 773 |
| }, |
| { |
| "epoch": 2.8601472134595163, |
| "grad_norm": 0.7199663789517207, |
| "learning_rate": 2.9487134959471445e-05, |
| "loss": 0.1716, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.164058119058609, |
| "step": 2720, |
| "valid_targets_mean": 1399.3, |
| "valid_targets_min": 679 |
| }, |
| { |
| "epoch": 2.8654048370136698, |
| "grad_norm": 0.7055036362874301, |
| "learning_rate": 2.944093904492113e-05, |
| "loss": 0.1685, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17372094094753265, |
| "step": 2725, |
| "valid_targets_mean": 1636.9, |
| "valid_targets_min": 818 |
| }, |
| { |
| "epoch": 2.8706624605678233, |
| "grad_norm": 0.7240927225149444, |
| "learning_rate": 2.9394678228672737e-05, |
| "loss": 0.1695, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15705692768096924, |
| "step": 2730, |
| "valid_targets_mean": 1466.2, |
| "valid_targets_min": 635 |
| }, |
| { |
| "epoch": 2.8759200841219767, |
| "grad_norm": 0.697968243512, |
| "learning_rate": 2.9348352828746076e-05, |
| "loss": 0.1687, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16323170065879822, |
| "step": 2735, |
| "valid_targets_mean": 1587.8, |
| "valid_targets_min": 592 |
| }, |
| { |
| "epoch": 2.8811777076761302, |
| "grad_norm": 0.7734054606250315, |
| "learning_rate": 2.9301963163604916e-05, |
| "loss": 0.1733, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20132026076316833, |
| "step": 2740, |
| "valid_targets_mean": 1555.1, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 2.8864353312302837, |
| "grad_norm": 0.7326620478455544, |
| "learning_rate": 2.925550955215483e-05, |
| "loss": 0.1684, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16971275210380554, |
| "step": 2745, |
| "valid_targets_mean": 1444.0, |
| "valid_targets_min": 622 |
| }, |
| { |
| "epoch": 2.891692954784437, |
| "grad_norm": 0.762268565306597, |
| "learning_rate": 2.9208992313740993e-05, |
| "loss": 0.1704, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17945335805416107, |
| "step": 2750, |
| "valid_targets_mean": 1487.4, |
| "valid_targets_min": 625 |
| }, |
| { |
| "epoch": 2.8969505783385907, |
| "grad_norm": 0.8636088215521381, |
| "learning_rate": 2.916241176814596e-05, |
| "loss": 0.1753, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18224063515663147, |
| "step": 2755, |
| "valid_targets_mean": 1779.5, |
| "valid_targets_min": 888 |
| }, |
| { |
| "epoch": 2.9022082018927446, |
| "grad_norm": 0.7167941039962984, |
| "learning_rate": 2.9115768235587526e-05, |
| "loss": 0.1749, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1802193820476532, |
| "step": 2760, |
| "valid_targets_mean": 1764.4, |
| "valid_targets_min": 635 |
| }, |
| { |
| "epoch": 2.907465825446898, |
| "grad_norm": 0.7355150012300485, |
| "learning_rate": 2.9069062036716454e-05, |
| "loss": 0.1739, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1942647099494934, |
| "step": 2765, |
| "valid_targets_mean": 1668.6, |
| "valid_targets_min": 522 |
| }, |
| { |
| "epoch": 2.9127234490010516, |
| "grad_norm": 0.7056003259372422, |
| "learning_rate": 2.9022293492614334e-05, |
| "loss": 0.1655, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15577737987041473, |
| "step": 2770, |
| "valid_targets_mean": 1324.4, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 2.917981072555205, |
| "grad_norm": 0.7560500384705311, |
| "learning_rate": 2.8975462924791334e-05, |
| "loss": 0.1634, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1751575767993927, |
| "step": 2775, |
| "valid_targets_mean": 1607.7, |
| "valid_targets_min": 868 |
| }, |
| { |
| "epoch": 2.9232386961093586, |
| "grad_norm": 0.7911429850053685, |
| "learning_rate": 2.892857065518401e-05, |
| "loss": 0.1676, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1767704337835312, |
| "step": 2780, |
| "valid_targets_mean": 1528.9, |
| "valid_targets_min": 769 |
| }, |
| { |
| "epoch": 2.928496319663512, |
| "grad_norm": 0.801135279225843, |
| "learning_rate": 2.8881617006153072e-05, |
| "loss": 0.1737, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19087477028369904, |
| "step": 2785, |
| "valid_targets_mean": 1453.0, |
| "valid_targets_min": 745 |
| }, |
| { |
| "epoch": 2.9337539432176656, |
| "grad_norm": 0.7446369931681006, |
| "learning_rate": 2.8834602300481207e-05, |
| "loss": 0.1657, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17077264189720154, |
| "step": 2790, |
| "valid_targets_mean": 1379.4, |
| "valid_targets_min": 680 |
| }, |
| { |
| "epoch": 2.939011566771819, |
| "grad_norm": 0.7315171743238089, |
| "learning_rate": 2.878752686137082e-05, |
| "loss": 0.1664, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1826205849647522, |
| "step": 2795, |
| "valid_targets_mean": 1813.8, |
| "valid_targets_min": 964 |
| }, |
| { |
| "epoch": 2.9442691903259726, |
| "grad_norm": 0.805565046245444, |
| "learning_rate": 2.874039101244183e-05, |
| "loss": 0.1798, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22795671224594116, |
| "step": 2800, |
| "valid_targets_mean": 1656.2, |
| "valid_targets_min": 851 |
| }, |
| { |
| "epoch": 2.949526813880126, |
| "grad_norm": 0.6673400481702775, |
| "learning_rate": 2.869319507772944e-05, |
| "loss": 0.1662, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15091487765312195, |
| "step": 2805, |
| "valid_targets_mean": 1483.2, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 2.9547844374342795, |
| "grad_norm": 0.6466788920453029, |
| "learning_rate": 2.864593938168192e-05, |
| "loss": 0.1653, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16105708479881287, |
| "step": 2810, |
| "valid_targets_mean": 1464.4, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 2.9600420609884335, |
| "grad_norm": 0.5165730982062974, |
| "learning_rate": 2.8598624249158367e-05, |
| "loss": 0.1621, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12236955761909485, |
| "step": 2815, |
| "valid_targets_mean": 2121.1, |
| "valid_targets_min": 702 |
| }, |
| { |
| "epoch": 2.965299684542587, |
| "grad_norm": 0.6852878654958156, |
| "learning_rate": 2.855125000542647e-05, |
| "loss": 0.1507, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15275967121124268, |
| "step": 2820, |
| "valid_targets_mean": 1543.9, |
| "valid_targets_min": 930 |
| }, |
| { |
| "epoch": 2.9705573080967405, |
| "grad_norm": 0.7083606652510992, |
| "learning_rate": 2.8503816976160278e-05, |
| "loss": 0.1681, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16899517178535461, |
| "step": 2825, |
| "valid_targets_mean": 1603.1, |
| "valid_targets_min": 570 |
| }, |
| { |
| "epoch": 2.975814931650894, |
| "grad_norm": 0.7483848333180418, |
| "learning_rate": 2.8456325487437966e-05, |
| "loss": 0.1664, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17572671175003052, |
| "step": 2830, |
| "valid_targets_mean": 1672.6, |
| "valid_targets_min": 870 |
| }, |
| { |
| "epoch": 2.9810725552050474, |
| "grad_norm": 0.6887776688547632, |
| "learning_rate": 2.8408775865739578e-05, |
| "loss": 0.1705, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17223665118217468, |
| "step": 2835, |
| "valid_targets_mean": 1623.1, |
| "valid_targets_min": 822 |
| }, |
| { |
| "epoch": 2.986330178759201, |
| "grad_norm": 0.7000779962193426, |
| "learning_rate": 2.8361168437944817e-05, |
| "loss": 0.1737, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1977711319923401, |
| "step": 2840, |
| "valid_targets_mean": 1630.5, |
| "valid_targets_min": 626 |
| }, |
| { |
| "epoch": 2.9915878023133544, |
| "grad_norm": 0.7608625024081402, |
| "learning_rate": 2.8313503531330738e-05, |
| "loss": 0.1632, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16275346279144287, |
| "step": 2845, |
| "valid_targets_mean": 1483.1, |
| "valid_targets_min": 591 |
| }, |
| { |
| "epoch": 2.996845425867508, |
| "grad_norm": 0.7748031519882468, |
| "learning_rate": 2.826578147356956e-05, |
| "loss": 0.1729, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16352367401123047, |
| "step": 2850, |
| "valid_targets_mean": 1302.1, |
| "valid_targets_min": 646 |
| }, |
| { |
| "epoch": 3.0021030494216614, |
| "grad_norm": 0.5466222076999223, |
| "learning_rate": 2.8218002592726384e-05, |
| "loss": 0.1512, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12446707487106323, |
| "step": 2855, |
| "valid_targets_mean": 2746.6, |
| "valid_targets_min": 876 |
| }, |
| { |
| "epoch": 3.007360672975815, |
| "grad_norm": 0.521033324722458, |
| "learning_rate": 2.8170167217256934e-05, |
| "loss": 0.1278, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13182267546653748, |
| "step": 2860, |
| "valid_targets_mean": 2116.5, |
| "valid_targets_min": 324 |
| }, |
| { |
| "epoch": 3.0126182965299684, |
| "grad_norm": 0.338373329057547, |
| "learning_rate": 2.8122275676005304e-05, |
| "loss": 0.0988, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10079587996006012, |
| "step": 2865, |
| "valid_targets_mean": 3281.1, |
| "valid_targets_min": 1064 |
| }, |
| { |
| "epoch": 3.017875920084122, |
| "grad_norm": 0.37994597855088297, |
| "learning_rate": 2.807432829820171e-05, |
| "loss": 0.0956, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10244813561439514, |
| "step": 2870, |
| "valid_targets_mean": 3268.5, |
| "valid_targets_min": 710 |
| }, |
| { |
| "epoch": 3.0231335436382754, |
| "grad_norm": 0.33730921505091843, |
| "learning_rate": 2.8026325413460215e-05, |
| "loss": 0.1093, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06904646009206772, |
| "step": 2875, |
| "valid_targets_mean": 3468.9, |
| "valid_targets_min": 1223 |
| }, |
| { |
| "epoch": 3.028391167192429, |
| "grad_norm": 0.3843288226709204, |
| "learning_rate": 2.7978267351776448e-05, |
| "loss": 0.0966, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09345643222332001, |
| "step": 2880, |
| "valid_targets_mean": 2931.2, |
| "valid_targets_min": 889 |
| }, |
| { |
| "epoch": 3.0336487907465823, |
| "grad_norm": 0.6380628691857361, |
| "learning_rate": 2.7930154443525377e-05, |
| "loss": 0.1326, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14252786338329315, |
| "step": 2885, |
| "valid_targets_mean": 1523.7, |
| "valid_targets_min": 559 |
| }, |
| { |
| "epoch": 3.0389064143007363, |
| "grad_norm": 0.3318356464318728, |
| "learning_rate": 2.7881987019458992e-05, |
| "loss": 0.1267, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09030725806951523, |
| "step": 2890, |
| "valid_targets_mean": 3525.1, |
| "valid_targets_min": 1013 |
| }, |
| { |
| "epoch": 3.0441640378548898, |
| "grad_norm": 0.38097964579858057, |
| "learning_rate": 2.7833765410704062e-05, |
| "loss": 0.108, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10663875192403793, |
| "step": 2895, |
| "valid_targets_mean": 3351.7, |
| "valid_targets_min": 846 |
| }, |
| { |
| "epoch": 3.0494216614090432, |
| "grad_norm": 0.63473958615383, |
| "learning_rate": 2.778548994875984e-05, |
| "loss": 0.1464, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1719827950000763, |
| "step": 2900, |
| "valid_targets_mean": 3273.1, |
| "valid_targets_min": 246 |
| }, |
| { |
| "epoch": 3.0546792849631967, |
| "grad_norm": 0.3232383401726629, |
| "learning_rate": 2.7737160965495794e-05, |
| "loss": 0.0794, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0961248129606247, |
| "step": 2905, |
| "valid_targets_mean": 4083.9, |
| "valid_targets_min": 764 |
| }, |
| { |
| "epoch": 3.0599369085173502, |
| "grad_norm": 0.4030969389053521, |
| "learning_rate": 2.768877879314935e-05, |
| "loss": 0.0958, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09496355801820755, |
| "step": 2910, |
| "valid_targets_mean": 2203.9, |
| "valid_targets_min": 447 |
| }, |
| { |
| "epoch": 3.0651945320715037, |
| "grad_norm": 0.4294860925313067, |
| "learning_rate": 2.7640343764323535e-05, |
| "loss": 0.0995, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11138342320919037, |
| "step": 2915, |
| "valid_targets_mean": 3162.2, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 3.070452155625657, |
| "grad_norm": 0.4453853252160343, |
| "learning_rate": 2.7591856211984783e-05, |
| "loss": 0.1175, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12396380305290222, |
| "step": 2920, |
| "valid_targets_mean": 2070.8, |
| "valid_targets_min": 604 |
| }, |
| { |
| "epoch": 3.0757097791798107, |
| "grad_norm": 0.7900559641665492, |
| "learning_rate": 2.7543316469460565e-05, |
| "loss": 0.1111, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10014769434928894, |
| "step": 2925, |
| "valid_targets_mean": 3348.2, |
| "valid_targets_min": 1743 |
| }, |
| { |
| "epoch": 3.080967402733964, |
| "grad_norm": 0.37525754758104163, |
| "learning_rate": 2.7494724870437147e-05, |
| "loss": 0.097, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09732868522405624, |
| "step": 2930, |
| "valid_targets_mean": 2746.6, |
| "valid_targets_min": 574 |
| }, |
| { |
| "epoch": 3.0862250262881177, |
| "grad_norm": 0.405552883970436, |
| "learning_rate": 2.7446081748957306e-05, |
| "loss": 0.0939, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11305394768714905, |
| "step": 2935, |
| "valid_targets_mean": 2807.6, |
| "valid_targets_min": 523 |
| }, |
| { |
| "epoch": 3.091482649842271, |
| "grad_norm": 0.39390305494009464, |
| "learning_rate": 2.7397387439417963e-05, |
| "loss": 0.0961, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1115940511226654, |
| "step": 2940, |
| "valid_targets_mean": 3306.1, |
| "valid_targets_min": 812 |
| }, |
| { |
| "epoch": 3.0967402733964247, |
| "grad_norm": 0.31902790094323685, |
| "learning_rate": 2.7348642276567973e-05, |
| "loss": 0.1019, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07373203337192535, |
| "step": 2945, |
| "valid_targets_mean": 2966.1, |
| "valid_targets_min": 493 |
| }, |
| { |
| "epoch": 3.101997896950578, |
| "grad_norm": 0.4311137083664932, |
| "learning_rate": 2.729984659550576e-05, |
| "loss": 0.1154, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11428984254598618, |
| "step": 2950, |
| "valid_targets_mean": 2645.6, |
| "valid_targets_min": 597 |
| }, |
| { |
| "epoch": 3.107255520504732, |
| "grad_norm": 0.49175093000351583, |
| "learning_rate": 2.7251000731677035e-05, |
| "loss": 0.1118, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11849726736545563, |
| "step": 2955, |
| "valid_targets_mean": 2493.6, |
| "valid_targets_min": 701 |
| }, |
| { |
| "epoch": 3.1125131440588856, |
| "grad_norm": 0.4604109686567695, |
| "learning_rate": 2.72021050208725e-05, |
| "loss": 0.1335, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20338056981563568, |
| "step": 2960, |
| "valid_targets_mean": 2864.6, |
| "valid_targets_min": 1297 |
| }, |
| { |
| "epoch": 3.117770767613039, |
| "grad_norm": 0.37799843509486336, |
| "learning_rate": 2.715315979922552e-05, |
| "loss": 0.1137, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09397638589143753, |
| "step": 2965, |
| "valid_targets_mean": 2596.0, |
| "valid_targets_min": 786 |
| }, |
| { |
| "epoch": 3.1230283911671926, |
| "grad_norm": 0.5189145881268659, |
| "learning_rate": 2.7104165403209843e-05, |
| "loss": 0.0958, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10702703148126602, |
| "step": 2970, |
| "valid_targets_mean": 2067.4, |
| "valid_targets_min": 550 |
| }, |
| { |
| "epoch": 3.128286014721346, |
| "grad_norm": 0.41140517046560815, |
| "learning_rate": 2.7055122169637224e-05, |
| "loss": 0.133, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09518980979919434, |
| "step": 2975, |
| "valid_targets_mean": 3358.8, |
| "valid_targets_min": 1304 |
| }, |
| { |
| "epoch": 3.1335436382754995, |
| "grad_norm": 0.37779945541074017, |
| "learning_rate": 2.7006030435655205e-05, |
| "loss": 0.1209, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09813253581523895, |
| "step": 2980, |
| "valid_targets_mean": 2746.4, |
| "valid_targets_min": 753 |
| }, |
| { |
| "epoch": 3.138801261829653, |
| "grad_norm": 0.4942296111137624, |
| "learning_rate": 2.6956890538744703e-05, |
| "loss": 0.1057, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11558189988136292, |
| "step": 2985, |
| "valid_targets_mean": 1980.6, |
| "valid_targets_min": 619 |
| }, |
| { |
| "epoch": 3.1440588853838065, |
| "grad_norm": 0.49825957897184714, |
| "learning_rate": 2.6907702816717742e-05, |
| "loss": 0.3, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23753009736537933, |
| "step": 2990, |
| "valid_targets_mean": 2497.7, |
| "valid_targets_min": 807 |
| }, |
| { |
| "epoch": 3.14931650893796, |
| "grad_norm": 0.5358736446407174, |
| "learning_rate": 2.685846760771513e-05, |
| "loss": 0.1211, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.148935005068779, |
| "step": 2995, |
| "valid_targets_mean": 1759.0, |
| "valid_targets_min": 329 |
| }, |
| { |
| "epoch": 3.1545741324921135, |
| "grad_norm": 0.43141437063840454, |
| "learning_rate": 2.6809185250204113e-05, |
| "loss": 0.1069, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0980694591999054, |
| "step": 3000, |
| "valid_targets_mean": 1902.4, |
| "valid_targets_min": 608 |
| }, |
| { |
| "epoch": 3.159831756046267, |
| "grad_norm": 0.4945291811340282, |
| "learning_rate": 2.6759856082976066e-05, |
| "loss": 0.2031, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11495549231767654, |
| "step": 3005, |
| "valid_targets_mean": 2912.9, |
| "valid_targets_min": 666 |
| }, |
| { |
| "epoch": 3.1650893796004205, |
| "grad_norm": 0.28517083163497425, |
| "learning_rate": 2.6710480445144145e-05, |
| "loss": 0.0914, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07156188040971756, |
| "step": 3010, |
| "valid_targets_mean": 5008.8, |
| "valid_targets_min": 3529 |
| }, |
| { |
| "epoch": 3.170347003154574, |
| "grad_norm": 0.38747073824557854, |
| "learning_rate": 2.666105867614099e-05, |
| "loss": 0.1067, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11048409342765808, |
| "step": 3015, |
| "valid_targets_mean": 4143.1, |
| "valid_targets_min": 1746 |
| }, |
| { |
| "epoch": 3.1756046267087275, |
| "grad_norm": 0.37449023233086515, |
| "learning_rate": 2.6611591115716345e-05, |
| "loss": 0.1033, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1028931587934494, |
| "step": 3020, |
| "valid_targets_mean": 3618.5, |
| "valid_targets_min": 1226 |
| }, |
| { |
| "epoch": 3.1808622502628814, |
| "grad_norm": 0.36116914085591356, |
| "learning_rate": 2.6562078103934755e-05, |
| "loss": 0.0958, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1023268923163414, |
| "step": 3025, |
| "valid_targets_mean": 3846.1, |
| "valid_targets_min": 798 |
| }, |
| { |
| "epoch": 3.186119873817035, |
| "grad_norm": 0.38592045301513195, |
| "learning_rate": 2.6512519981173238e-05, |
| "loss": 0.0912, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08848783373832703, |
| "step": 3030, |
| "valid_targets_mean": 2512.2, |
| "valid_targets_min": 687 |
| }, |
| { |
| "epoch": 3.1913774973711884, |
| "grad_norm": 0.3961718456981798, |
| "learning_rate": 2.64629170881189e-05, |
| "loss": 0.0926, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10466080904006958, |
| "step": 3035, |
| "valid_targets_mean": 3475.7, |
| "valid_targets_min": 898 |
| }, |
| { |
| "epoch": 3.196635120925342, |
| "grad_norm": 0.3106930366801356, |
| "learning_rate": 2.641326976576664e-05, |
| "loss": 0.0882, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06668621301651001, |
| "step": 3040, |
| "valid_targets_mean": 3755.8, |
| "valid_targets_min": 1421 |
| }, |
| { |
| "epoch": 3.2018927444794953, |
| "grad_norm": 0.4221301460518302, |
| "learning_rate": 2.6363578355416772e-05, |
| "loss": 0.0943, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10672241449356079, |
| "step": 3045, |
| "valid_targets_mean": 2536.6, |
| "valid_targets_min": 739 |
| }, |
| { |
| "epoch": 3.207150368033649, |
| "grad_norm": 0.5149633330728174, |
| "learning_rate": 2.6313843198672712e-05, |
| "loss": 0.1297, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09203119575977325, |
| "step": 3050, |
| "valid_targets_mean": 1594.4, |
| "valid_targets_min": 535 |
| }, |
| { |
| "epoch": 3.2124079915878023, |
| "grad_norm": 0.35594784901316856, |
| "learning_rate": 2.6264064637438585e-05, |
| "loss": 0.0768, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06688378751277924, |
| "step": 3055, |
| "valid_targets_mean": 2209.4, |
| "valid_targets_min": 585 |
| }, |
| { |
| "epoch": 3.217665615141956, |
| "grad_norm": 0.4630229114458132, |
| "learning_rate": 2.6214243013916915e-05, |
| "loss": 0.0933, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10203917324542999, |
| "step": 3060, |
| "valid_targets_mean": 2656.9, |
| "valid_targets_min": 582 |
| }, |
| { |
| "epoch": 3.2229232386961093, |
| "grad_norm": 0.4252733834393226, |
| "learning_rate": 2.616437867060627e-05, |
| "loss": 0.0839, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09619317948818207, |
| "step": 3065, |
| "valid_targets_mean": 3110.2, |
| "valid_targets_min": 516 |
| }, |
| { |
| "epoch": 3.228180862250263, |
| "grad_norm": 0.39522589716693973, |
| "learning_rate": 2.6114471950298853e-05, |
| "loss": 0.1392, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09734763205051422, |
| "step": 3070, |
| "valid_targets_mean": 3165.1, |
| "valid_targets_min": 647 |
| }, |
| { |
| "epoch": 3.2334384858044163, |
| "grad_norm": 0.4642871840249189, |
| "learning_rate": 2.6064523196078248e-05, |
| "loss": 0.1069, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16460002958774567, |
| "step": 3075, |
| "valid_targets_mean": 2261.0, |
| "valid_targets_min": 696 |
| }, |
| { |
| "epoch": 3.2386961093585698, |
| "grad_norm": 0.3814020577347577, |
| "learning_rate": 2.6014532751316937e-05, |
| "loss": 0.1145, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08565057069063187, |
| "step": 3080, |
| "valid_targets_mean": 2811.5, |
| "valid_targets_min": 635 |
| }, |
| { |
| "epoch": 3.2439537329127233, |
| "grad_norm": 0.4451511598456373, |
| "learning_rate": 2.5964500959674057e-05, |
| "loss": 0.0995, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09862557798624039, |
| "step": 3085, |
| "valid_targets_mean": 2445.8, |
| "valid_targets_min": 536 |
| }, |
| { |
| "epoch": 3.249211356466877, |
| "grad_norm": 0.48137190435019367, |
| "learning_rate": 2.5914428165092956e-05, |
| "loss": 0.1458, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20742422342300415, |
| "step": 3090, |
| "valid_targets_mean": 2535.8, |
| "valid_targets_min": 949 |
| }, |
| { |
| "epoch": 3.2544689800210307, |
| "grad_norm": 0.4042235353079657, |
| "learning_rate": 2.5864314711798856e-05, |
| "loss": 0.1064, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10464179515838623, |
| "step": 3095, |
| "valid_targets_mean": 3448.2, |
| "valid_targets_min": 2201 |
| }, |
| { |
| "epoch": 3.259726603575184, |
| "grad_norm": 0.5301526259442012, |
| "learning_rate": 2.5814160944296495e-05, |
| "loss": 0.1294, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12064434587955475, |
| "step": 3100, |
| "valid_targets_mean": 1526.4, |
| "valid_targets_min": 649 |
| }, |
| { |
| "epoch": 3.2649842271293377, |
| "grad_norm": 0.5015079508563632, |
| "learning_rate": 2.5763967207367752e-05, |
| "loss": 0.0934, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10426744818687439, |
| "step": 3105, |
| "valid_targets_mean": 2170.0, |
| "valid_targets_min": 449 |
| }, |
| { |
| "epoch": 3.270241850683491, |
| "grad_norm": 0.34692324671633057, |
| "learning_rate": 2.5713733846069272e-05, |
| "loss": 0.0994, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08536946028470993, |
| "step": 3110, |
| "valid_targets_mean": 3172.5, |
| "valid_targets_min": 658 |
| }, |
| { |
| "epoch": 3.2754994742376446, |
| "grad_norm": 0.5817428268839887, |
| "learning_rate": 2.56634612057301e-05, |
| "loss": 0.1035, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10349592566490173, |
| "step": 3115, |
| "valid_targets_mean": 1570.4, |
| "valid_targets_min": 516 |
| }, |
| { |
| "epoch": 3.280757097791798, |
| "grad_norm": 0.3467753466515313, |
| "learning_rate": 2.561314963194929e-05, |
| "loss": 0.0833, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09726609289646149, |
| "step": 3120, |
| "valid_targets_mean": 3943.2, |
| "valid_targets_min": 726 |
| }, |
| { |
| "epoch": 3.2860147213459516, |
| "grad_norm": 0.3698412199716944, |
| "learning_rate": 2.556279947059358e-05, |
| "loss": 0.0838, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10808682441711426, |
| "step": 3125, |
| "valid_targets_mean": 3758.2, |
| "valid_targets_min": 2036 |
| }, |
| { |
| "epoch": 3.291272344900105, |
| "grad_norm": 0.40667287615291386, |
| "learning_rate": 2.551241106779494e-05, |
| "loss": 0.0929, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10029004514217377, |
| "step": 3130, |
| "valid_targets_mean": 2494.0, |
| "valid_targets_min": 531 |
| }, |
| { |
| "epoch": 3.2965299684542586, |
| "grad_norm": 0.4275002343456192, |
| "learning_rate": 2.5461984769948244e-05, |
| "loss": 0.1121, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10097934305667877, |
| "step": 3135, |
| "valid_targets_mean": 2782.7, |
| "valid_targets_min": 744 |
| }, |
| { |
| "epoch": 3.301787592008412, |
| "grad_norm": 0.4260689893165757, |
| "learning_rate": 2.5411520923708874e-05, |
| "loss": 0.1046, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10482053458690643, |
| "step": 3140, |
| "valid_targets_mean": 3118.3, |
| "valid_targets_min": 891 |
| }, |
| { |
| "epoch": 3.3070452155625656, |
| "grad_norm": 0.30311426948810755, |
| "learning_rate": 2.536101987599036e-05, |
| "loss": 0.0917, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07310104370117188, |
| "step": 3145, |
| "valid_targets_mean": 3637.3, |
| "valid_targets_min": 2366 |
| }, |
| { |
| "epoch": 3.312302839116719, |
| "grad_norm": 0.3812389555372934, |
| "learning_rate": 2.5310481973961935e-05, |
| "loss": 0.0879, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08005480468273163, |
| "step": 3150, |
| "valid_targets_mean": 2363.1, |
| "valid_targets_min": 669 |
| }, |
| { |
| "epoch": 3.3175604626708726, |
| "grad_norm": 0.4063403424084052, |
| "learning_rate": 2.5259907565046217e-05, |
| "loss": 0.109, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1166294664144516, |
| "step": 3155, |
| "valid_targets_mean": 3721.6, |
| "valid_targets_min": 1785 |
| }, |
| { |
| "epoch": 3.322818086225026, |
| "grad_norm": 0.29744737763100537, |
| "learning_rate": 2.5209296996916774e-05, |
| "loss": 0.0783, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0791168063879013, |
| "step": 3160, |
| "valid_targets_mean": 3911.1, |
| "valid_targets_min": 2848 |
| }, |
| { |
| "epoch": 3.32807570977918, |
| "grad_norm": 0.3892043209014928, |
| "learning_rate": 2.5158650617495753e-05, |
| "loss": 0.0955, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08098890632390976, |
| "step": 3165, |
| "valid_targets_mean": 2296.6, |
| "valid_targets_min": 539 |
| }, |
| { |
| "epoch": 3.3333333333333335, |
| "grad_norm": 0.42339632408381894, |
| "learning_rate": 2.5107968774951504e-05, |
| "loss": 0.0991, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10028016567230225, |
| "step": 3170, |
| "valid_targets_mean": 2896.5, |
| "valid_targets_min": 1016 |
| }, |
| { |
| "epoch": 3.338590956887487, |
| "grad_norm": 0.6887447355394017, |
| "learning_rate": 2.5057251817696138e-05, |
| "loss": 0.1103, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17232894897460938, |
| "step": 3175, |
| "valid_targets_mean": 1443.4, |
| "valid_targets_min": 811 |
| }, |
| { |
| "epoch": 3.3438485804416405, |
| "grad_norm": 0.45470800054544114, |
| "learning_rate": 2.5006500094383176e-05, |
| "loss": 0.099, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09778797626495361, |
| "step": 3180, |
| "valid_targets_mean": 2288.8, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 3.349106203995794, |
| "grad_norm": 0.5734145517972797, |
| "learning_rate": 2.4955713953905155e-05, |
| "loss": 0.0981, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11736759543418884, |
| "step": 3185, |
| "valid_targets_mean": 1566.6, |
| "valid_targets_min": 605 |
| }, |
| { |
| "epoch": 3.3543638275499474, |
| "grad_norm": 0.4258986637578229, |
| "learning_rate": 2.490489374539118e-05, |
| "loss": 0.0984, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08142179995775223, |
| "step": 3190, |
| "valid_targets_mean": 2678.6, |
| "valid_targets_min": 804 |
| }, |
| { |
| "epoch": 3.359621451104101, |
| "grad_norm": 0.44732484153742635, |
| "learning_rate": 2.4854039818204577e-05, |
| "loss": 0.1227, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08386355638504028, |
| "step": 3195, |
| "valid_targets_mean": 3416.7, |
| "valid_targets_min": 1018 |
| }, |
| { |
| "epoch": 3.3648790746582544, |
| "grad_norm": 0.3720578537553386, |
| "learning_rate": 2.480315252194047e-05, |
| "loss": 0.0962, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08612213283777237, |
| "step": 3200, |
| "valid_targets_mean": 2990.4, |
| "valid_targets_min": 524 |
| }, |
| { |
| "epoch": 3.370136698212408, |
| "grad_norm": 0.44673676067830237, |
| "learning_rate": 2.4752232206423387e-05, |
| "loss": 0.086, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.094891756772995, |
| "step": 3205, |
| "valid_targets_mean": 2421.8, |
| "valid_targets_min": 690 |
| }, |
| { |
| "epoch": 3.3753943217665614, |
| "grad_norm": 0.505487731435433, |
| "learning_rate": 2.4701279221704812e-05, |
| "loss": 0.1079, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1321258842945099, |
| "step": 3210, |
| "valid_targets_mean": 2558.6, |
| "valid_targets_min": 877 |
| }, |
| { |
| "epoch": 3.380651945320715, |
| "grad_norm": 0.36909294639464546, |
| "learning_rate": 2.4650293918060845e-05, |
| "loss": 0.1032, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08483578264713287, |
| "step": 3215, |
| "valid_targets_mean": 3632.8, |
| "valid_targets_min": 2346 |
| }, |
| { |
| "epoch": 3.3859095688748684, |
| "grad_norm": 0.5519706094992273, |
| "learning_rate": 2.4599276645989763e-05, |
| "loss": 0.0826, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11972440034151077, |
| "step": 3220, |
| "valid_targets_mean": 2203.8, |
| "valid_targets_min": 564 |
| }, |
| { |
| "epoch": 3.3911671924290223, |
| "grad_norm": 0.3428223361432121, |
| "learning_rate": 2.4548227756209593e-05, |
| "loss": 0.0928, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09329237043857574, |
| "step": 3225, |
| "valid_targets_mean": 4414.9, |
| "valid_targets_min": 2555 |
| }, |
| { |
| "epoch": 3.396424815983176, |
| "grad_norm": 0.3107495473025833, |
| "learning_rate": 2.4497147599655726e-05, |
| "loss": 0.0845, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07768009603023529, |
| "step": 3230, |
| "valid_targets_mean": 4187.8, |
| "valid_targets_min": 1731 |
| }, |
| { |
| "epoch": 3.4016824395373293, |
| "grad_norm": 0.3865073890727283, |
| "learning_rate": 2.44460365274785e-05, |
| "loss": 0.076, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0749867781996727, |
| "step": 3235, |
| "valid_targets_mean": 2469.8, |
| "valid_targets_min": 618 |
| }, |
| { |
| "epoch": 3.406940063091483, |
| "grad_norm": 0.31260333559826636, |
| "learning_rate": 2.4394894891040774e-05, |
| "loss": 0.1011, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07776013016700745, |
| "step": 3240, |
| "valid_targets_mean": 3974.0, |
| "valid_targets_min": 2944 |
| }, |
| { |
| "epoch": 3.4121976866456363, |
| "grad_norm": 0.35668126808948614, |
| "learning_rate": 2.434372304191553e-05, |
| "loss": 0.0972, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13149991631507874, |
| "step": 3245, |
| "valid_targets_mean": 3446.2, |
| "valid_targets_min": 1539 |
| }, |
| { |
| "epoch": 3.4174553101997898, |
| "grad_norm": 0.353482849500868, |
| "learning_rate": 2.4292521331883432e-05, |
| "loss": 0.1069, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07315802574157715, |
| "step": 3250, |
| "valid_targets_mean": 3172.9, |
| "valid_targets_min": 509 |
| }, |
| { |
| "epoch": 3.4227129337539433, |
| "grad_norm": 0.3127457471763909, |
| "learning_rate": 2.4241290112930448e-05, |
| "loss": 0.0988, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.062242090702056885, |
| "step": 3255, |
| "valid_targets_mean": 2809.9, |
| "valid_targets_min": 629 |
| }, |
| { |
| "epoch": 3.4279705573080967, |
| "grad_norm": 0.41511881465912187, |
| "learning_rate": 2.4190029737245368e-05, |
| "loss": 0.1176, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1011495590209961, |
| "step": 3260, |
| "valid_targets_mean": 2980.1, |
| "valid_targets_min": 737 |
| }, |
| { |
| "epoch": 3.4332281808622502, |
| "grad_norm": 0.34357501486462483, |
| "learning_rate": 2.4138740557217462e-05, |
| "loss": 0.0822, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08056190609931946, |
| "step": 3265, |
| "valid_targets_mean": 3209.1, |
| "valid_targets_min": 492 |
| }, |
| { |
| "epoch": 3.4384858044164037, |
| "grad_norm": 0.5494595490178701, |
| "learning_rate": 2.4087422925433988e-05, |
| "loss": 0.105, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11445383727550507, |
| "step": 3270, |
| "valid_targets_mean": 1736.8, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 3.443743427970557, |
| "grad_norm": 0.34336146250245775, |
| "learning_rate": 2.4036077194677803e-05, |
| "loss": 0.0869, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07678385078907013, |
| "step": 3275, |
| "valid_targets_mean": 3708.5, |
| "valid_targets_min": 923 |
| }, |
| { |
| "epoch": 3.4490010515247107, |
| "grad_norm": 0.6741890325544422, |
| "learning_rate": 2.3984703717924932e-05, |
| "loss": 0.1314, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13014402985572815, |
| "step": 3280, |
| "valid_targets_mean": 1246.6, |
| "valid_targets_min": 458 |
| }, |
| { |
| "epoch": 3.454258675078864, |
| "grad_norm": 0.5047602662118091, |
| "learning_rate": 2.3933302848342127e-05, |
| "loss": 0.1222, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12619143724441528, |
| "step": 3285, |
| "valid_targets_mean": 1850.8, |
| "valid_targets_min": 459 |
| }, |
| { |
| "epoch": 3.4595162986330177, |
| "grad_norm": 0.424738453472895, |
| "learning_rate": 2.388187493928447e-05, |
| "loss": 0.0927, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10029537230730057, |
| "step": 3290, |
| "valid_targets_mean": 3529.3, |
| "valid_targets_min": 1694 |
| }, |
| { |
| "epoch": 3.464773922187171, |
| "grad_norm": 0.35411830004027156, |
| "learning_rate": 2.3830420344292922e-05, |
| "loss": 0.0908, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08716071397066116, |
| "step": 3295, |
| "valid_targets_mean": 3589.6, |
| "valid_targets_min": 2490 |
| }, |
| { |
| "epoch": 3.470031545741325, |
| "grad_norm": 0.3418023573892603, |
| "learning_rate": 2.377893941709189e-05, |
| "loss": 0.0887, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07180380076169968, |
| "step": 3300, |
| "valid_targets_mean": 2891.9, |
| "valid_targets_min": 970 |
| }, |
| { |
| "epoch": 3.4752891692954786, |
| "grad_norm": 0.45248442268337263, |
| "learning_rate": 2.3727432511586802e-05, |
| "loss": 0.0848, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08174464106559753, |
| "step": 3305, |
| "valid_targets_mean": 1893.4, |
| "valid_targets_min": 729 |
| }, |
| { |
| "epoch": 3.480546792849632, |
| "grad_norm": 0.742214468129363, |
| "learning_rate": 2.3675899981861675e-05, |
| "loss": 0.1085, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14365407824516296, |
| "step": 3310, |
| "valid_targets_mean": 1164.2, |
| "valid_targets_min": 637 |
| }, |
| { |
| "epoch": 3.4858044164037856, |
| "grad_norm": 0.39353361242747475, |
| "learning_rate": 2.362434218217668e-05, |
| "loss": 0.0809, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0775720551609993, |
| "step": 3315, |
| "valid_targets_mean": 2904.2, |
| "valid_targets_min": 701 |
| }, |
| { |
| "epoch": 3.491062039957939, |
| "grad_norm": 0.3601303488243885, |
| "learning_rate": 2.3572759466965706e-05, |
| "loss": 0.0853, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07890958338975906, |
| "step": 3320, |
| "valid_targets_mean": 3281.8, |
| "valid_targets_min": 1606 |
| }, |
| { |
| "epoch": 3.4963196635120926, |
| "grad_norm": 0.39509822138673245, |
| "learning_rate": 2.3521152190833934e-05, |
| "loss": 0.0885, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08546141535043716, |
| "step": 3325, |
| "valid_targets_mean": 3052.1, |
| "valid_targets_min": 678 |
| }, |
| { |
| "epoch": 3.501577287066246, |
| "grad_norm": 0.31671460002836604, |
| "learning_rate": 2.346952070855537e-05, |
| "loss": 0.0954, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0849844440817833, |
| "step": 3330, |
| "valid_targets_mean": 3768.0, |
| "valid_targets_min": 350 |
| }, |
| { |
| "epoch": 3.5068349106203995, |
| "grad_norm": 0.3090278061566263, |
| "learning_rate": 2.3417865375070433e-05, |
| "loss": 0.082, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08871947228908539, |
| "step": 3335, |
| "valid_targets_mean": 4112.0, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 3.512092534174553, |
| "grad_norm": 0.4460989669300572, |
| "learning_rate": 2.336618654548352e-05, |
| "loss": 0.0892, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09572702646255493, |
| "step": 3340, |
| "valid_targets_mean": 2046.9, |
| "valid_targets_min": 507 |
| }, |
| { |
| "epoch": 3.5173501577287065, |
| "grad_norm": 0.5471827601886656, |
| "learning_rate": 2.331448457506053e-05, |
| "loss": 0.1058, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1673205941915512, |
| "step": 3345, |
| "valid_targets_mean": 2938.8, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 3.52260778128286, |
| "grad_norm": 0.3382786063306754, |
| "learning_rate": 2.326275981922645e-05, |
| "loss": 0.1641, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08271795511245728, |
| "step": 3350, |
| "valid_targets_mean": 3854.1, |
| "valid_targets_min": 2347 |
| }, |
| { |
| "epoch": 3.527865404837014, |
| "grad_norm": 0.44456261597851254, |
| "learning_rate": 2.3211012633562923e-05, |
| "loss": 0.0884, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09423861652612686, |
| "step": 3355, |
| "valid_targets_mean": 2795.6, |
| "valid_targets_min": 716 |
| }, |
| { |
| "epoch": 3.5331230283911674, |
| "grad_norm": 0.36089701655793555, |
| "learning_rate": 2.3159243373805764e-05, |
| "loss": 0.086, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08504271507263184, |
| "step": 3360, |
| "valid_targets_mean": 3502.3, |
| "valid_targets_min": 2245 |
| }, |
| { |
| "epoch": 3.538380651945321, |
| "grad_norm": 1.0104813147285636, |
| "learning_rate": 2.3107452395842542e-05, |
| "loss": 0.143, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1977672576904297, |
| "step": 3365, |
| "valid_targets_mean": 1521.4, |
| "valid_targets_min": 544 |
| }, |
| { |
| "epoch": 3.5436382754994744, |
| "grad_norm": 0.7476753325688632, |
| "learning_rate": 2.3055640055710132e-05, |
| "loss": 0.1813, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1685527265071869, |
| "step": 3370, |
| "valid_targets_mean": 1463.8, |
| "valid_targets_min": 632 |
| }, |
| { |
| "epoch": 3.548895899053628, |
| "grad_norm": 0.7049824023388825, |
| "learning_rate": 2.3003806709592268e-05, |
| "loss": 0.1634, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1504194587469101, |
| "step": 3375, |
| "valid_targets_mean": 1399.4, |
| "valid_targets_min": 514 |
| }, |
| { |
| "epoch": 3.5541535226077814, |
| "grad_norm": 0.8532699459063282, |
| "learning_rate": 2.295195271381707e-05, |
| "loss": 0.1665, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17392781376838684, |
| "step": 3380, |
| "valid_targets_mean": 1316.6, |
| "valid_targets_min": 701 |
| }, |
| { |
| "epoch": 3.559411146161935, |
| "grad_norm": 0.6893415976424345, |
| "learning_rate": 2.290007842485463e-05, |
| "loss": 0.1557, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17594726383686066, |
| "step": 3385, |
| "valid_targets_mean": 1798.9, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 3.5646687697160884, |
| "grad_norm": 0.7323589947092218, |
| "learning_rate": 2.2848184199314546e-05, |
| "loss": 0.1597, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14350740611553192, |
| "step": 3390, |
| "valid_targets_mean": 1302.9, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 3.569926393270242, |
| "grad_norm": 0.7685104995392101, |
| "learning_rate": 2.2796270393943472e-05, |
| "loss": 0.1698, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16896271705627441, |
| "step": 3395, |
| "valid_targets_mean": 1624.1, |
| "valid_targets_min": 774 |
| }, |
| { |
| "epoch": 3.5751840168243953, |
| "grad_norm": 0.7419295482210282, |
| "learning_rate": 2.274433736562264e-05, |
| "loss": 0.1464, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1500275731086731, |
| "step": 3400, |
| "valid_targets_mean": 1371.6, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 3.580441640378549, |
| "grad_norm": 0.7635824196621789, |
| "learning_rate": 2.2692385471365465e-05, |
| "loss": 0.1684, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15286250412464142, |
| "step": 3405, |
| "valid_targets_mean": 1490.3, |
| "valid_targets_min": 708 |
| }, |
| { |
| "epoch": 3.5856992639327023, |
| "grad_norm": 0.7208409226139617, |
| "learning_rate": 2.264041506831503e-05, |
| "loss": 0.15, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1389751434326172, |
| "step": 3410, |
| "valid_targets_mean": 1482.0, |
| "valid_targets_min": 770 |
| }, |
| { |
| "epoch": 3.590956887486856, |
| "grad_norm": 0.7336459663977433, |
| "learning_rate": 2.258842651374166e-05, |
| "loss": 0.1603, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13388162851333618, |
| "step": 3415, |
| "valid_targets_mean": 1201.6, |
| "valid_targets_min": 572 |
| }, |
| { |
| "epoch": 3.5962145110410093, |
| "grad_norm": 0.7339521194447971, |
| "learning_rate": 2.2536420165040478e-05, |
| "loss": 0.1604, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1521379053592682, |
| "step": 3420, |
| "valid_targets_mean": 1506.8, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 3.601472134595163, |
| "grad_norm": 0.7725775694226406, |
| "learning_rate": 2.248439637972892e-05, |
| "loss": 0.154, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.160357266664505, |
| "step": 3425, |
| "valid_targets_mean": 1451.6, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 3.6067297581493163, |
| "grad_norm": 0.7183691089962678, |
| "learning_rate": 2.2432355515444284e-05, |
| "loss": 0.145, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14932133257389069, |
| "step": 3430, |
| "valid_targets_mean": 1457.6, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 3.61198738170347, |
| "grad_norm": 0.712281040019326, |
| "learning_rate": 2.2380297929941296e-05, |
| "loss": 0.1443, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14289280772209167, |
| "step": 3435, |
| "valid_targets_mean": 1512.8, |
| "valid_targets_min": 821 |
| }, |
| { |
| "epoch": 3.6172450052576237, |
| "grad_norm": 0.7858994711032667, |
| "learning_rate": 2.2328223981089613e-05, |
| "loss": 0.1471, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16713649034500122, |
| "step": 3440, |
| "valid_targets_mean": 1730.6, |
| "valid_targets_min": 691 |
| }, |
| { |
| "epoch": 3.622502628811777, |
| "grad_norm": 0.7101516962409145, |
| "learning_rate": 2.2276134026871393e-05, |
| "loss": 0.1533, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1352025270462036, |
| "step": 3445, |
| "valid_targets_mean": 1252.6, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 3.6277602523659307, |
| "grad_norm": 0.7137846897634569, |
| "learning_rate": 2.222402842537882e-05, |
| "loss": 0.1584, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14950649440288544, |
| "step": 3450, |
| "valid_targets_mean": 1462.4, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 3.633017875920084, |
| "grad_norm": 0.676752748047653, |
| "learning_rate": 2.2171907534811652e-05, |
| "loss": 0.1552, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1426226794719696, |
| "step": 3455, |
| "valid_targets_mean": 1440.3, |
| "valid_targets_min": 681 |
| }, |
| { |
| "epoch": 3.6382754994742377, |
| "grad_norm": 0.7526584864977061, |
| "learning_rate": 2.2119771713474732e-05, |
| "loss": 0.1559, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16186939179897308, |
| "step": 3460, |
| "valid_targets_mean": 1622.9, |
| "valid_targets_min": 814 |
| }, |
| { |
| "epoch": 3.643533123028391, |
| "grad_norm": 0.7073239156473662, |
| "learning_rate": 2.2067621319775564e-05, |
| "loss": 0.1533, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16528892517089844, |
| "step": 3465, |
| "valid_targets_mean": 1817.0, |
| "valid_targets_min": 832 |
| }, |
| { |
| "epoch": 3.6487907465825447, |
| "grad_norm": 0.6771018812111878, |
| "learning_rate": 2.201545671222183e-05, |
| "loss": 0.154, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14223238825798035, |
| "step": 3470, |
| "valid_targets_mean": 1605.8, |
| "valid_targets_min": 891 |
| }, |
| { |
| "epoch": 3.654048370136698, |
| "grad_norm": 0.8884046377617928, |
| "learning_rate": 2.1963278249418894e-05, |
| "loss": 0.1539, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16173222661018372, |
| "step": 3475, |
| "valid_targets_mean": 1352.1, |
| "valid_targets_min": 621 |
| }, |
| { |
| "epoch": 3.6593059936908516, |
| "grad_norm": 0.7585262697924833, |
| "learning_rate": 2.191108629006742e-05, |
| "loss": 0.1384, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1297926902770996, |
| "step": 3480, |
| "valid_targets_mean": 1315.7, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 3.664563617245005, |
| "grad_norm": 0.7540927774084125, |
| "learning_rate": 2.1858881192960814e-05, |
| "loss": 0.1522, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16202481091022491, |
| "step": 3485, |
| "valid_targets_mean": 1641.8, |
| "valid_targets_min": 872 |
| }, |
| { |
| "epoch": 3.669821240799159, |
| "grad_norm": 0.8159633219097113, |
| "learning_rate": 2.180666331698281e-05, |
| "loss": 0.1436, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13622817397117615, |
| "step": 3490, |
| "valid_targets_mean": 1323.2, |
| "valid_targets_min": 584 |
| }, |
| { |
| "epoch": 3.6750788643533125, |
| "grad_norm": 0.692052692751461, |
| "learning_rate": 2.1754433021104985e-05, |
| "loss": 0.1512, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1466284990310669, |
| "step": 3495, |
| "valid_targets_mean": 1830.9, |
| "valid_targets_min": 999 |
| }, |
| { |
| "epoch": 3.680336487907466, |
| "grad_norm": 0.6870543005005051, |
| "learning_rate": 2.170219066438431e-05, |
| "loss": 0.1547, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16461580991744995, |
| "step": 3500, |
| "valid_targets_mean": 1830.8, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 3.6855941114616195, |
| "grad_norm": 0.7708982306994941, |
| "learning_rate": 2.164993660596065e-05, |
| "loss": 0.1462, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13875049352645874, |
| "step": 3505, |
| "valid_targets_mean": 1344.1, |
| "valid_targets_min": 613 |
| }, |
| { |
| "epoch": 3.690851735015773, |
| "grad_norm": 0.7099231871496336, |
| "learning_rate": 2.1597671205054326e-05, |
| "loss": 0.1486, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14559851586818695, |
| "step": 3510, |
| "valid_targets_mean": 1668.8, |
| "valid_targets_min": 768 |
| }, |
| { |
| "epoch": 3.6961093585699265, |
| "grad_norm": 0.8060373598979466, |
| "learning_rate": 2.1545394820963637e-05, |
| "loss": 0.1454, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13935421407222748, |
| "step": 3515, |
| "valid_targets_mean": 1340.0, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 3.70136698212408, |
| "grad_norm": 0.7607109285681598, |
| "learning_rate": 2.149310781306237e-05, |
| "loss": 0.1523, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13217228651046753, |
| "step": 3520, |
| "valid_targets_mean": 1266.8, |
| "valid_targets_min": 800 |
| }, |
| { |
| "epoch": 3.7066246056782335, |
| "grad_norm": 0.8758953703245033, |
| "learning_rate": 2.1440810540797354e-05, |
| "loss": 0.1459, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16291630268096924, |
| "step": 3525, |
| "valid_targets_mean": 1674.1, |
| "valid_targets_min": 843 |
| }, |
| { |
| "epoch": 3.711882229232387, |
| "grad_norm": 0.8661060100226162, |
| "learning_rate": 2.1388503363685985e-05, |
| "loss": 0.1423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14035390317440033, |
| "step": 3530, |
| "valid_targets_mean": 1169.9, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 3.7171398527865405, |
| "grad_norm": 0.7610300863679027, |
| "learning_rate": 2.133618664131374e-05, |
| "loss": 0.1326, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13772127032279968, |
| "step": 3535, |
| "valid_targets_mean": 1315.5, |
| "valid_targets_min": 772 |
| }, |
| { |
| "epoch": 3.722397476340694, |
| "grad_norm": 0.7794403945443821, |
| "learning_rate": 2.1283860733331722e-05, |
| "loss": 0.1506, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14407244324684143, |
| "step": 3540, |
| "valid_targets_mean": 1417.9, |
| "valid_targets_min": 619 |
| }, |
| { |
| "epoch": 3.7276550998948474, |
| "grad_norm": 0.7766648700042907, |
| "learning_rate": 2.123152599945417e-05, |
| "loss": 0.1424, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1390763223171234, |
| "step": 3545, |
| "valid_targets_mean": 1407.2, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 3.732912723449001, |
| "grad_norm": 0.713784090941053, |
| "learning_rate": 2.1179182799456024e-05, |
| "loss": 0.1459, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14825764298439026, |
| "step": 3550, |
| "valid_targets_mean": 1538.9, |
| "valid_targets_min": 799 |
| }, |
| { |
| "epoch": 3.7381703470031544, |
| "grad_norm": 0.8587832147941542, |
| "learning_rate": 2.112683149317039e-05, |
| "loss": 0.1495, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1628817617893219, |
| "step": 3555, |
| "valid_targets_mean": 1469.2, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 3.743427970557308, |
| "grad_norm": 0.7424728210631139, |
| "learning_rate": 2.1074472440486118e-05, |
| "loss": 0.1457, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14450980722904205, |
| "step": 3560, |
| "valid_targets_mean": 1341.0, |
| "valid_targets_min": 711 |
| }, |
| { |
| "epoch": 3.7486855941114614, |
| "grad_norm": 0.6974899257322207, |
| "learning_rate": 2.102210600134531e-05, |
| "loss": 0.1394, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13589932024478912, |
| "step": 3565, |
| "valid_targets_mean": 1472.0, |
| "valid_targets_min": 733 |
| }, |
| { |
| "epoch": 3.753943217665615, |
| "grad_norm": 0.792834948827596, |
| "learning_rate": 2.096973253574084e-05, |
| "loss": 0.1501, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1514257788658142, |
| "step": 3570, |
| "valid_targets_mean": 1493.6, |
| "valid_targets_min": 931 |
| }, |
| { |
| "epoch": 3.759200841219769, |
| "grad_norm": 0.6874037953722771, |
| "learning_rate": 2.09173524037139e-05, |
| "loss": 0.1548, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1504008024930954, |
| "step": 3575, |
| "valid_targets_mean": 1773.1, |
| "valid_targets_min": 1011 |
| }, |
| { |
| "epoch": 3.7644584647739223, |
| "grad_norm": 0.7837520816337542, |
| "learning_rate": 2.0864965965351495e-05, |
| "loss": 0.157, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14988698065280914, |
| "step": 3580, |
| "valid_targets_mean": 1372.2, |
| "valid_targets_min": 748 |
| }, |
| { |
| "epoch": 3.769716088328076, |
| "grad_norm": 0.8081712809437585, |
| "learning_rate": 2.081257358078398e-05, |
| "loss": 0.1427, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14466381072998047, |
| "step": 3585, |
| "valid_targets_mean": 1519.7, |
| "valid_targets_min": 699 |
| }, |
| { |
| "epoch": 3.7749737118822293, |
| "grad_norm": 0.7760159006917432, |
| "learning_rate": 2.0760175610182613e-05, |
| "loss": 0.1388, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12998421490192413, |
| "step": 3590, |
| "valid_targets_mean": 1243.5, |
| "valid_targets_min": 534 |
| }, |
| { |
| "epoch": 3.780231335436383, |
| "grad_norm": 0.7584560177318204, |
| "learning_rate": 2.0707772413757016e-05, |
| "loss": 0.1531, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14621761441230774, |
| "step": 3595, |
| "valid_targets_mean": 1522.9, |
| "valid_targets_min": 687 |
| }, |
| { |
| "epoch": 3.7854889589905363, |
| "grad_norm": 1.7509432609069835, |
| "learning_rate": 2.0655364351752763e-05, |
| "loss": 0.1401, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13551291823387146, |
| "step": 3600, |
| "valid_targets_mean": 1458.9, |
| "valid_targets_min": 549 |
| }, |
| { |
| "epoch": 3.7907465825446898, |
| "grad_norm": 0.7384715666894996, |
| "learning_rate": 2.060295178444887e-05, |
| "loss": 0.1367, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1364159733057022, |
| "step": 3605, |
| "valid_targets_mean": 1378.8, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 3.7960042060988433, |
| "grad_norm": 0.7992737455040028, |
| "learning_rate": 2.055053507215533e-05, |
| "loss": 0.1379, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15726029872894287, |
| "step": 3610, |
| "valid_targets_mean": 1706.8, |
| "valid_targets_min": 852 |
| }, |
| { |
| "epoch": 3.8012618296529967, |
| "grad_norm": 0.749232690670078, |
| "learning_rate": 2.049811457521061e-05, |
| "loss": 0.1545, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1454424262046814, |
| "step": 3615, |
| "valid_targets_mean": 1576.4, |
| "valid_targets_min": 1010 |
| }, |
| { |
| "epoch": 3.8065194532071502, |
| "grad_norm": 0.7663104938841124, |
| "learning_rate": 2.0445690653979216e-05, |
| "loss": 0.148, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13865984976291656, |
| "step": 3620, |
| "valid_targets_mean": 1387.0, |
| "valid_targets_min": 545 |
| }, |
| { |
| "epoch": 3.8117770767613037, |
| "grad_norm": 0.7120351730447476, |
| "learning_rate": 2.039326366884919e-05, |
| "loss": 0.1419, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14631116390228271, |
| "step": 3625, |
| "valid_targets_mean": 1451.8, |
| "valid_targets_min": 843 |
| }, |
| { |
| "epoch": 3.8170347003154577, |
| "grad_norm": 0.7188936868893969, |
| "learning_rate": 2.034083398022963e-05, |
| "loss": 0.1434, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15240274369716644, |
| "step": 3630, |
| "valid_targets_mean": 1780.8, |
| "valid_targets_min": 802 |
| }, |
| { |
| "epoch": 3.822292323869611, |
| "grad_norm": 0.7833295571858446, |
| "learning_rate": 2.028840194854822e-05, |
| "loss": 0.1478, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1410003900527954, |
| "step": 3635, |
| "valid_targets_mean": 1409.9, |
| "valid_targets_min": 612 |
| }, |
| { |
| "epoch": 3.8275499474237646, |
| "grad_norm": 0.7944585877780198, |
| "learning_rate": 2.0235967934248756e-05, |
| "loss": 0.1445, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13537245988845825, |
| "step": 3640, |
| "valid_targets_mean": 1425.5, |
| "valid_targets_min": 673 |
| }, |
| { |
| "epoch": 3.832807570977918, |
| "grad_norm": 0.8094967702366247, |
| "learning_rate": 2.018353229778867e-05, |
| "loss": 0.1443, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1483570635318756, |
| "step": 3645, |
| "valid_targets_mean": 1347.2, |
| "valid_targets_min": 705 |
| }, |
| { |
| "epoch": 3.8380651945320716, |
| "grad_norm": 0.6993189624925312, |
| "learning_rate": 2.0131095399636522e-05, |
| "loss": 0.1414, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13212630152702332, |
| "step": 3650, |
| "valid_targets_mean": 1416.8, |
| "valid_targets_min": 672 |
| }, |
| { |
| "epoch": 3.843322818086225, |
| "grad_norm": 0.6928415473664703, |
| "learning_rate": 2.0078657600269573e-05, |
| "loss": 0.1316, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11715187877416611, |
| "step": 3655, |
| "valid_targets_mean": 1418.4, |
| "valid_targets_min": 604 |
| }, |
| { |
| "epoch": 3.8485804416403786, |
| "grad_norm": 0.7501917663236193, |
| "learning_rate": 2.0026219260171262e-05, |
| "loss": 0.1518, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14008289575576782, |
| "step": 3660, |
| "valid_targets_mean": 1467.6, |
| "valid_targets_min": 647 |
| }, |
| { |
| "epoch": 3.853838065194532, |
| "grad_norm": 0.7446691316933927, |
| "learning_rate": 1.9973780739828748e-05, |
| "loss": 0.1448, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12458867579698563, |
| "step": 3665, |
| "valid_targets_mean": 1283.6, |
| "valid_targets_min": 613 |
| }, |
| { |
| "epoch": 3.8590956887486856, |
| "grad_norm": 0.8358295545742249, |
| "learning_rate": 1.9921342399730433e-05, |
| "loss": 0.1462, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14649547636508942, |
| "step": 3670, |
| "valid_targets_mean": 1288.4, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 3.864353312302839, |
| "grad_norm": 0.7509432896311811, |
| "learning_rate": 1.9868904600363485e-05, |
| "loss": 0.1437, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13095489144325256, |
| "step": 3675, |
| "valid_targets_mean": 1554.5, |
| "valid_targets_min": 892 |
| }, |
| { |
| "epoch": 3.8696109358569926, |
| "grad_norm": 0.792107584005417, |
| "learning_rate": 1.9816467702211342e-05, |
| "loss": 0.1474, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.150422140955925, |
| "step": 3680, |
| "valid_targets_mean": 1424.2, |
| "valid_targets_min": 772 |
| }, |
| { |
| "epoch": 3.874868559411146, |
| "grad_norm": 0.7493648214407846, |
| "learning_rate": 1.9764032065751248e-05, |
| "loss": 0.144, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1561586856842041, |
| "step": 3685, |
| "valid_targets_mean": 1646.6, |
| "valid_targets_min": 636 |
| }, |
| { |
| "epoch": 3.8801261829652995, |
| "grad_norm": 0.7680634147152421, |
| "learning_rate": 1.971159805145178e-05, |
| "loss": 0.1422, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13870960474014282, |
| "step": 3690, |
| "valid_targets_mean": 1366.1, |
| "valid_targets_min": 641 |
| }, |
| { |
| "epoch": 3.885383806519453, |
| "grad_norm": 0.7670436903492326, |
| "learning_rate": 1.965916601977038e-05, |
| "loss": 0.1488, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14888067543506622, |
| "step": 3695, |
| "valid_targets_mean": 1482.4, |
| "valid_targets_min": 766 |
| }, |
| { |
| "epoch": 3.8906414300736065, |
| "grad_norm": 0.7970428978319392, |
| "learning_rate": 1.9606736331150812e-05, |
| "loss": 0.1423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13972023129463196, |
| "step": 3700, |
| "valid_targets_mean": 1346.4, |
| "valid_targets_min": 729 |
| }, |
| { |
| "epoch": 3.89589905362776, |
| "grad_norm": 0.7866111704363837, |
| "learning_rate": 1.9554309346020784e-05, |
| "loss": 0.1502, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15238693356513977, |
| "step": 3705, |
| "valid_targets_mean": 1471.1, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 3.9011566771819135, |
| "grad_norm": 0.8179110532896274, |
| "learning_rate": 1.9501885424789394e-05, |
| "loss": 0.1511, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14223146438598633, |
| "step": 3710, |
| "valid_targets_mean": 1593.8, |
| "valid_targets_min": 738 |
| }, |
| { |
| "epoch": 3.9064143007360674, |
| "grad_norm": 0.7874291856747577, |
| "learning_rate": 1.9449464927844677e-05, |
| "loss": 0.1463, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14259304106235504, |
| "step": 3715, |
| "valid_targets_mean": 1298.9, |
| "valid_targets_min": 731 |
| }, |
| { |
| "epoch": 3.911671924290221, |
| "grad_norm": 0.7550522004516413, |
| "learning_rate": 1.939704821555113e-05, |
| "loss": 0.149, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16015680134296417, |
| "step": 3720, |
| "valid_targets_mean": 1543.5, |
| "valid_targets_min": 801 |
| }, |
| { |
| "epoch": 3.9169295478443744, |
| "grad_norm": 0.7334582520816827, |
| "learning_rate": 1.9344635648247244e-05, |
| "loss": 0.1351, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13253885507583618, |
| "step": 3725, |
| "valid_targets_mean": 1396.4, |
| "valid_targets_min": 564 |
| }, |
| { |
| "epoch": 3.922187171398528, |
| "grad_norm": 0.7417014536963873, |
| "learning_rate": 1.9292227586242994e-05, |
| "loss": 0.142, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14190204441547394, |
| "step": 3730, |
| "valid_targets_mean": 1543.1, |
| "valid_targets_min": 651 |
| }, |
| { |
| "epoch": 3.9274447949526814, |
| "grad_norm": 0.7610265869958812, |
| "learning_rate": 1.9239824389817397e-05, |
| "loss": 0.1455, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1278257519006729, |
| "step": 3735, |
| "valid_targets_mean": 1331.9, |
| "valid_targets_min": 716 |
| }, |
| { |
| "epoch": 3.932702418506835, |
| "grad_norm": 0.7518368918699934, |
| "learning_rate": 1.9187426419216026e-05, |
| "loss": 0.1451, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12716713547706604, |
| "step": 3740, |
| "valid_targets_mean": 1321.7, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 3.9379600420609884, |
| "grad_norm": 0.7369801637124225, |
| "learning_rate": 1.9135034034648515e-05, |
| "loss": 0.1397, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13780197501182556, |
| "step": 3745, |
| "valid_targets_mean": 1445.0, |
| "valid_targets_min": 1195 |
| }, |
| { |
| "epoch": 3.943217665615142, |
| "grad_norm": 0.9560172569065368, |
| "learning_rate": 1.90826475962861e-05, |
| "loss": 0.1487, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17044293880462646, |
| "step": 3750, |
| "valid_targets_mean": 1594.3, |
| "valid_targets_min": 764 |
| }, |
| { |
| "epoch": 3.9484752891692954, |
| "grad_norm": 0.7569817592758459, |
| "learning_rate": 1.9030267464259164e-05, |
| "loss": 0.1567, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15231093764305115, |
| "step": 3755, |
| "valid_targets_mean": 1516.2, |
| "valid_targets_min": 812 |
| }, |
| { |
| "epoch": 3.953732912723449, |
| "grad_norm": 0.7422459936180924, |
| "learning_rate": 1.8977893998654692e-05, |
| "loss": 0.1406, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15256305038928986, |
| "step": 3760, |
| "valid_targets_mean": 1679.4, |
| "valid_targets_min": 979 |
| }, |
| { |
| "epoch": 3.958990536277603, |
| "grad_norm": 0.7151323665713769, |
| "learning_rate": 1.8925527559513886e-05, |
| "loss": 0.1488, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15546274185180664, |
| "step": 3765, |
| "valid_targets_mean": 1684.2, |
| "valid_targets_min": 823 |
| }, |
| { |
| "epoch": 3.9642481598317563, |
| "grad_norm": 0.6718585422156108, |
| "learning_rate": 1.8873168506829614e-05, |
| "loss": 0.1247, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1253662109375, |
| "step": 3770, |
| "valid_targets_mean": 1546.6, |
| "valid_targets_min": 595 |
| }, |
| { |
| "epoch": 3.9695057833859098, |
| "grad_norm": 0.7900464709650304, |
| "learning_rate": 1.882081720054398e-05, |
| "loss": 0.1414, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1423221230506897, |
| "step": 3775, |
| "valid_targets_mean": 1372.4, |
| "valid_targets_min": 693 |
| }, |
| { |
| "epoch": 3.9747634069400632, |
| "grad_norm": 0.7631080488938405, |
| "learning_rate": 1.876847400054583e-05, |
| "loss": 0.141, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13596129417419434, |
| "step": 3780, |
| "valid_targets_mean": 1407.7, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 3.9800210304942167, |
| "grad_norm": 0.748150989006652, |
| "learning_rate": 1.8716139266668288e-05, |
| "loss": 0.1492, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15752890706062317, |
| "step": 3785, |
| "valid_targets_mean": 1762.1, |
| "valid_targets_min": 685 |
| }, |
| { |
| "epoch": 3.9852786540483702, |
| "grad_norm": 0.6798309275501556, |
| "learning_rate": 1.8663813358686267e-05, |
| "loss": 0.1444, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14607755839824677, |
| "step": 3790, |
| "valid_targets_mean": 1592.1, |
| "valid_targets_min": 658 |
| }, |
| { |
| "epoch": 3.9905362776025237, |
| "grad_norm": 0.7875602049898909, |
| "learning_rate": 1.8611496636314025e-05, |
| "loss": 0.1463, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1496124118566513, |
| "step": 3795, |
| "valid_targets_mean": 1514.8, |
| "valid_targets_min": 1018 |
| }, |
| { |
| "epoch": 3.995793901156677, |
| "grad_norm": 0.7751342330294595, |
| "learning_rate": 1.8559189459202653e-05, |
| "loss": 0.1471, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14422816038131714, |
| "step": 3800, |
| "valid_targets_mean": 1507.4, |
| "valid_targets_min": 897 |
| }, |
| { |
| "epoch": 4.001051524710831, |
| "grad_norm": 0.687150716302613, |
| "learning_rate": 1.8506892186937636e-05, |
| "loss": 0.1344, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12322714924812317, |
| "step": 3805, |
| "valid_targets_mean": 1699.4, |
| "valid_targets_min": 393 |
| }, |
| { |
| "epoch": 4.006309148264984, |
| "grad_norm": 0.42864035629677005, |
| "learning_rate": 1.845460517903637e-05, |
| "loss": 0.1117, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08149848878383636, |
| "step": 3810, |
| "valid_targets_mean": 2954.8, |
| "valid_targets_min": 834 |
| }, |
| { |
| "epoch": 4.011566771819138, |
| "grad_norm": 0.36298963794579575, |
| "learning_rate": 1.8402328794945678e-05, |
| "loss": 0.0926, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0827195793390274, |
| "step": 3815, |
| "valid_targets_mean": 3410.2, |
| "valid_targets_min": 2790 |
| }, |
| { |
| "epoch": 4.016824395373291, |
| "grad_norm": 0.3914164890824438, |
| "learning_rate": 1.8350063394039352e-05, |
| "loss": 0.0841, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09019855409860611, |
| "step": 3820, |
| "valid_targets_mean": 3594.9, |
| "valid_targets_min": 2133 |
| }, |
| { |
| "epoch": 4.022082018927445, |
| "grad_norm": 0.4163328603662043, |
| "learning_rate": 1.82978093356157e-05, |
| "loss": 0.105, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08957859873771667, |
| "step": 3825, |
| "valid_targets_mean": 2853.9, |
| "valid_targets_min": 526 |
| }, |
| { |
| "epoch": 4.027339642481598, |
| "grad_norm": 0.41682147967247024, |
| "learning_rate": 1.824556697889502e-05, |
| "loss": 0.0819, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08536089211702347, |
| "step": 3830, |
| "valid_targets_mean": 2827.7, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 4.032597266035752, |
| "grad_norm": 0.9758457355351812, |
| "learning_rate": 1.8193336683017197e-05, |
| "loss": 0.1121, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14917269349098206, |
| "step": 3835, |
| "valid_targets_mean": 1010.2, |
| "valid_targets_min": 525 |
| }, |
| { |
| "epoch": 4.037854889589905, |
| "grad_norm": 0.420354371106784, |
| "learning_rate": 1.8141118807039193e-05, |
| "loss": 0.1233, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08612798154354095, |
| "step": 3840, |
| "valid_targets_mean": 2922.9, |
| "valid_targets_min": 647 |
| }, |
| { |
| "epoch": 4.043112513144059, |
| "grad_norm": 0.40812370482751553, |
| "learning_rate": 1.8088913709932582e-05, |
| "loss": 0.0937, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09145452827215195, |
| "step": 3845, |
| "valid_targets_mean": 2800.7, |
| "valid_targets_min": 718 |
| }, |
| { |
| "epoch": 4.048370136698212, |
| "grad_norm": 0.5811669690772227, |
| "learning_rate": 1.8036721750581106e-05, |
| "loss": 0.1197, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18292278051376343, |
| "step": 3850, |
| "valid_targets_mean": 2503.3, |
| "valid_targets_min": 540 |
| }, |
| { |
| "epoch": 4.053627760252366, |
| "grad_norm": 0.28305317037901473, |
| "learning_rate": 1.7984543287778185e-05, |
| "loss": 0.0853, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07100999355316162, |
| "step": 3855, |
| "valid_targets_mean": 5138.8, |
| "valid_targets_min": 636 |
| }, |
| { |
| "epoch": 4.058885383806519, |
| "grad_norm": 0.36506802248945247, |
| "learning_rate": 1.7932378680224443e-05, |
| "loss": 0.0848, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09302988648414612, |
| "step": 3860, |
| "valid_targets_mean": 2786.8, |
| "valid_targets_min": 818 |
| }, |
| { |
| "epoch": 4.064143007360673, |
| "grad_norm": 0.3681864800332117, |
| "learning_rate": 1.7880228286525275e-05, |
| "loss": 0.0854, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07192498445510864, |
| "step": 3865, |
| "valid_targets_mean": 3787.4, |
| "valid_targets_min": 1006 |
| }, |
| { |
| "epoch": 4.069400630914826, |
| "grad_norm": 0.44709526344713, |
| "learning_rate": 1.782809246518836e-05, |
| "loss": 0.1035, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13080145418643951, |
| "step": 3870, |
| "valid_targets_mean": 2526.6, |
| "valid_targets_min": 688 |
| }, |
| { |
| "epoch": 4.0746582544689804, |
| "grad_norm": 0.379123899973497, |
| "learning_rate": 1.7775971574621186e-05, |
| "loss": 0.1034, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07068104296922684, |
| "step": 3875, |
| "valid_targets_mean": 2956.9, |
| "valid_targets_min": 553 |
| }, |
| { |
| "epoch": 4.079915878023134, |
| "grad_norm": 0.43246617716881486, |
| "learning_rate": 1.772386597312861e-05, |
| "loss": 0.0871, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08573436737060547, |
| "step": 3880, |
| "valid_targets_mean": 2154.8, |
| "valid_targets_min": 566 |
| }, |
| { |
| "epoch": 4.085173501577287, |
| "grad_norm": 0.3018078384691382, |
| "learning_rate": 1.7671776018910397e-05, |
| "loss": 0.0797, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06644061207771301, |
| "step": 3885, |
| "valid_targets_mean": 3934.6, |
| "valid_targets_min": 1111 |
| }, |
| { |
| "epoch": 4.090431125131441, |
| "grad_norm": 0.4293151652745935, |
| "learning_rate": 1.761970207005871e-05, |
| "loss": 0.0854, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10549415647983551, |
| "step": 3890, |
| "valid_targets_mean": 2306.4, |
| "valid_targets_min": 622 |
| }, |
| { |
| "epoch": 4.095688748685594, |
| "grad_norm": 0.5331904265794647, |
| "learning_rate": 1.756764448455572e-05, |
| "loss": 0.0971, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10992026329040527, |
| "step": 3895, |
| "valid_targets_mean": 2033.1, |
| "valid_targets_min": 696 |
| }, |
| { |
| "epoch": 4.100946372239748, |
| "grad_norm": 0.47516133096290825, |
| "learning_rate": 1.7515603620271087e-05, |
| "loss": 0.0952, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10050627589225769, |
| "step": 3900, |
| "valid_targets_mean": 3010.1, |
| "valid_targets_min": 893 |
| }, |
| { |
| "epoch": 4.106203995793901, |
| "grad_norm": 0.4534494965348713, |
| "learning_rate": 1.7463579834959525e-05, |
| "loss": 0.0974, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09654377400875092, |
| "step": 3905, |
| "valid_targets_mean": 2633.4, |
| "valid_targets_min": 802 |
| }, |
| { |
| "epoch": 4.111461619348055, |
| "grad_norm": 0.5367991008352612, |
| "learning_rate": 1.7411573486258343e-05, |
| "loss": 0.1037, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12864451110363007, |
| "step": 3910, |
| "valid_targets_mean": 2308.9, |
| "valid_targets_min": 957 |
| }, |
| { |
| "epoch": 4.116719242902208, |
| "grad_norm": 0.4290677081931766, |
| "learning_rate": 1.735958493168498e-05, |
| "loss": 0.1213, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09149613976478577, |
| "step": 3915, |
| "valid_targets_mean": 3071.3, |
| "valid_targets_min": 641 |
| }, |
| { |
| "epoch": 4.121976866456362, |
| "grad_norm": 0.4280175203325265, |
| "learning_rate": 1.730761452863454e-05, |
| "loss": 0.0819, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09220650792121887, |
| "step": 3920, |
| "valid_targets_mean": 2525.9, |
| "valid_targets_min": 711 |
| }, |
| { |
| "epoch": 4.127234490010515, |
| "grad_norm": 0.4826209997511778, |
| "learning_rate": 1.7255662634377365e-05, |
| "loss": 0.121, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14056621491909027, |
| "step": 3925, |
| "valid_targets_mean": 2187.0, |
| "valid_targets_min": 643 |
| }, |
| { |
| "epoch": 4.132492113564669, |
| "grad_norm": 0.4860783578289778, |
| "learning_rate": 1.720372960605654e-05, |
| "loss": 0.1061, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10677383840084076, |
| "step": 3930, |
| "valid_targets_mean": 2253.0, |
| "valid_targets_min": 538 |
| }, |
| { |
| "epoch": 4.137749737118822, |
| "grad_norm": 0.5167962163863851, |
| "learning_rate": 1.715181580068546e-05, |
| "loss": 0.0908, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11996076256036758, |
| "step": 3935, |
| "valid_targets_mean": 2365.9, |
| "valid_targets_min": 664 |
| }, |
| { |
| "epoch": 4.143007360672976, |
| "grad_norm": 0.6195321805055407, |
| "learning_rate": 1.7099921575145372e-05, |
| "loss": 0.2572, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38817277550697327, |
| "step": 3940, |
| "valid_targets_mean": 2509.2, |
| "valid_targets_min": 922 |
| }, |
| { |
| "epoch": 4.148264984227129, |
| "grad_norm": 0.4838160894790163, |
| "learning_rate": 1.7048047286182945e-05, |
| "loss": 0.127, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0898803174495697, |
| "step": 3945, |
| "valid_targets_mean": 2140.8, |
| "valid_targets_min": 507 |
| }, |
| { |
| "epoch": 4.153522607781283, |
| "grad_norm": 0.3856936107770497, |
| "learning_rate": 1.6996193290407742e-05, |
| "loss": 0.1048, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10756798833608627, |
| "step": 3950, |
| "valid_targets_mean": 3023.5, |
| "valid_targets_min": 615 |
| }, |
| { |
| "epoch": 4.158780231335436, |
| "grad_norm": 0.44570525600863437, |
| "learning_rate": 1.694435994428987e-05, |
| "loss": 0.1846, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19231784343719482, |
| "step": 3955, |
| "valid_targets_mean": 2874.2, |
| "valid_targets_min": 826 |
| }, |
| { |
| "epoch": 4.16403785488959, |
| "grad_norm": 0.4088175170718333, |
| "learning_rate": 1.6892547604157464e-05, |
| "loss": 0.0889, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09553523361682892, |
| "step": 3960, |
| "valid_targets_mean": 3176.8, |
| "valid_targets_min": 830 |
| }, |
| { |
| "epoch": 4.169295478443743, |
| "grad_norm": 0.4082272081827545, |
| "learning_rate": 1.6840756626194242e-05, |
| "loss": 0.089, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10171765834093094, |
| "step": 3965, |
| "valid_targets_mean": 4479.9, |
| "valid_targets_min": 2665 |
| }, |
| { |
| "epoch": 4.174553101997897, |
| "grad_norm": 0.3419247532155441, |
| "learning_rate": 1.678898736643708e-05, |
| "loss": 0.0935, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0854925662279129, |
| "step": 3970, |
| "valid_targets_mean": 3246.1, |
| "valid_targets_min": 595 |
| }, |
| { |
| "epoch": 4.17981072555205, |
| "grad_norm": 0.42938395652567896, |
| "learning_rate": 1.6737240180773554e-05, |
| "loss": 0.0847, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08609820902347565, |
| "step": 3975, |
| "valid_targets_mean": 2390.4, |
| "valid_targets_min": 779 |
| }, |
| { |
| "epoch": 4.185068349106204, |
| "grad_norm": 0.5480139294102536, |
| "learning_rate": 1.6685515424939478e-05, |
| "loss": 0.0843, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07699918001890182, |
| "step": 3980, |
| "valid_targets_mean": 2643.6, |
| "valid_targets_min": 672 |
| }, |
| { |
| "epoch": 4.190325972660357, |
| "grad_norm": 0.3398786560781086, |
| "learning_rate": 1.6633813454516486e-05, |
| "loss": 0.0783, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06625483185052872, |
| "step": 3985, |
| "valid_targets_mean": 2986.9, |
| "valid_targets_min": 1027 |
| }, |
| { |
| "epoch": 4.195583596214511, |
| "grad_norm": 0.3919954362376148, |
| "learning_rate": 1.658213462492957e-05, |
| "loss": 0.0863, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0802190750837326, |
| "step": 3990, |
| "valid_targets_mean": 3580.1, |
| "valid_targets_min": 2540 |
| }, |
| { |
| "epoch": 4.200841219768664, |
| "grad_norm": 0.4205464998194999, |
| "learning_rate": 1.6530479291444636e-05, |
| "loss": 0.0755, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09197942167520523, |
| "step": 3995, |
| "valid_targets_mean": 2893.3, |
| "valid_targets_min": 576 |
| }, |
| { |
| "epoch": 4.206098843322818, |
| "grad_norm": 0.2808905744460822, |
| "learning_rate": 1.6478847809166066e-05, |
| "loss": 0.1183, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.048266805708408356, |
| "step": 4000, |
| "valid_targets_mean": 3497.9, |
| "valid_targets_min": 623 |
| }, |
| { |
| "epoch": 4.211356466876971, |
| "grad_norm": 0.38695326267770913, |
| "learning_rate": 1.64272405330343e-05, |
| "loss": 0.0716, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07455742359161377, |
| "step": 4005, |
| "valid_targets_mean": 2850.4, |
| "valid_targets_min": 583 |
| }, |
| { |
| "epoch": 4.216614090431126, |
| "grad_norm": 0.35771383205774226, |
| "learning_rate": 1.6375657817823323e-05, |
| "loss": 0.0754, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07963775843381882, |
| "step": 4010, |
| "valid_targets_mean": 3863.2, |
| "valid_targets_min": 3230 |
| }, |
| { |
| "epoch": 4.221871713985279, |
| "grad_norm": 0.40347603356414613, |
| "learning_rate": 1.6324100018138328e-05, |
| "loss": 0.0748, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0651107057929039, |
| "step": 4015, |
| "valid_targets_mean": 2461.8, |
| "valid_targets_min": 526 |
| }, |
| { |
| "epoch": 4.2271293375394325, |
| "grad_norm": 0.725077259640492, |
| "learning_rate": 1.6272567488413204e-05, |
| "loss": 0.1256, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21477793157100677, |
| "step": 4020, |
| "valid_targets_mean": 1658.2, |
| "valid_targets_min": 195 |
| }, |
| { |
| "epoch": 4.232386961093586, |
| "grad_norm": 0.3538915023393407, |
| "learning_rate": 1.6221060582908115e-05, |
| "loss": 0.0832, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09245728701353073, |
| "step": 4025, |
| "valid_targets_mean": 3706.3, |
| "valid_targets_min": 2624 |
| }, |
| { |
| "epoch": 4.2376445846477395, |
| "grad_norm": 0.5000611339552574, |
| "learning_rate": 1.616957965570708e-05, |
| "loss": 0.1158, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1068650484085083, |
| "step": 4030, |
| "valid_targets_mean": 1733.1, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 4.242902208201893, |
| "grad_norm": 0.3703886251011038, |
| "learning_rate": 1.6118125060715534e-05, |
| "loss": 0.0837, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07927380502223969, |
| "step": 4035, |
| "valid_targets_mean": 3413.1, |
| "valid_targets_min": 847 |
| }, |
| { |
| "epoch": 4.2481598317560465, |
| "grad_norm": 0.5669430744333894, |
| "learning_rate": 1.6066697151657876e-05, |
| "loss": 0.1098, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10927321016788483, |
| "step": 4040, |
| "valid_targets_mean": 2039.8, |
| "valid_targets_min": 824 |
| }, |
| { |
| "epoch": 4.2534174553102, |
| "grad_norm": 0.4546239854389364, |
| "learning_rate": 1.601529628207508e-05, |
| "loss": 0.1147, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08450181037187576, |
| "step": 4045, |
| "valid_targets_mean": 2160.5, |
| "valid_targets_min": 809 |
| }, |
| { |
| "epoch": 4.2586750788643535, |
| "grad_norm": 0.6286036765331103, |
| "learning_rate": 1.5963922805322204e-05, |
| "loss": 0.1136, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20327050983905792, |
| "step": 4050, |
| "valid_targets_mean": 1854.1, |
| "valid_targets_min": 771 |
| }, |
| { |
| "epoch": 4.263932702418507, |
| "grad_norm": 0.4125196051152265, |
| "learning_rate": 1.5912577074566016e-05, |
| "loss": 0.0862, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08141230791807175, |
| "step": 4055, |
| "valid_targets_mean": 3094.5, |
| "valid_targets_min": 707 |
| }, |
| { |
| "epoch": 4.2691903259726605, |
| "grad_norm": 0.35720837148962503, |
| "learning_rate": 1.5861259442782548e-05, |
| "loss": 0.0915, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0740450918674469, |
| "step": 4060, |
| "valid_targets_mean": 3806.2, |
| "valid_targets_min": 2850 |
| }, |
| { |
| "epoch": 4.274447949526814, |
| "grad_norm": 0.40358758473977735, |
| "learning_rate": 1.580997026275464e-05, |
| "loss": 0.0889, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09053555130958557, |
| "step": 4065, |
| "valid_targets_mean": 3537.8, |
| "valid_targets_min": 749 |
| }, |
| { |
| "epoch": 4.279705573080967, |
| "grad_norm": 0.34333954811248674, |
| "learning_rate": 1.5758709887069562e-05, |
| "loss": 0.0746, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0822061225771904, |
| "step": 4070, |
| "valid_targets_mean": 4453.0, |
| "valid_targets_min": 1052 |
| }, |
| { |
| "epoch": 4.284963196635121, |
| "grad_norm": 0.36136388061308067, |
| "learning_rate": 1.570747866811658e-05, |
| "loss": 0.0725, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06539871543645859, |
| "step": 4075, |
| "valid_targets_mean": 4073.1, |
| "valid_targets_min": 896 |
| }, |
| { |
| "epoch": 4.290220820189274, |
| "grad_norm": 0.3385238493016099, |
| "learning_rate": 1.5656276958084478e-05, |
| "loss": 0.0849, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07738714665174484, |
| "step": 4080, |
| "valid_targets_mean": 3921.4, |
| "valid_targets_min": 1859 |
| }, |
| { |
| "epoch": 4.295478443743428, |
| "grad_norm": 0.3523885200042189, |
| "learning_rate": 1.560510510895923e-05, |
| "loss": 0.1003, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06382683664560318, |
| "step": 4085, |
| "valid_targets_mean": 2804.2, |
| "valid_targets_min": 893 |
| }, |
| { |
| "epoch": 4.300736067297581, |
| "grad_norm": 0.464356647875685, |
| "learning_rate": 1.5553963472521506e-05, |
| "loss": 0.0937, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10442212969064713, |
| "step": 4090, |
| "valid_targets_mean": 2879.6, |
| "valid_targets_min": 753 |
| }, |
| { |
| "epoch": 4.305993690851735, |
| "grad_norm": 0.3001537750054545, |
| "learning_rate": 1.5502852400344277e-05, |
| "loss": 0.088, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.05652359127998352, |
| "step": 4095, |
| "valid_targets_mean": 3441.2, |
| "valid_targets_min": 995 |
| }, |
| { |
| "epoch": 4.311251314405888, |
| "grad_norm": 0.4144103671249372, |
| "learning_rate": 1.545177224379041e-05, |
| "loss": 0.0773, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09758152812719345, |
| "step": 4100, |
| "valid_targets_mean": 3682.8, |
| "valid_targets_min": 1576 |
| }, |
| { |
| "epoch": 4.316508937960042, |
| "grad_norm": 0.4657016413112488, |
| "learning_rate": 1.5400723354010244e-05, |
| "loss": 0.0901, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09643582999706268, |
| "step": 4105, |
| "valid_targets_mean": 3230.6, |
| "valid_targets_min": 907 |
| }, |
| { |
| "epoch": 4.321766561514195, |
| "grad_norm": 0.30299818623468733, |
| "learning_rate": 1.5349706081939158e-05, |
| "loss": 0.0756, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.05721421167254448, |
| "step": 4110, |
| "valid_targets_mean": 3664.4, |
| "valid_targets_min": 980 |
| }, |
| { |
| "epoch": 4.327024185068349, |
| "grad_norm": 0.564066101410305, |
| "learning_rate": 1.5298720778295195e-05, |
| "loss": 0.084, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1053677424788475, |
| "step": 4115, |
| "valid_targets_mean": 1743.9, |
| "valid_targets_min": 478 |
| }, |
| { |
| "epoch": 4.332281808622502, |
| "grad_norm": 0.5201688078000634, |
| "learning_rate": 1.5247767793576625e-05, |
| "loss": 0.0833, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10424987971782684, |
| "step": 4120, |
| "valid_targets_mean": 2762.8, |
| "valid_targets_min": 955 |
| }, |
| { |
| "epoch": 4.337539432176656, |
| "grad_norm": 0.5146583332580208, |
| "learning_rate": 1.519684747805953e-05, |
| "loss": 0.0842, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09465573728084564, |
| "step": 4125, |
| "valid_targets_mean": 2030.4, |
| "valid_targets_min": 680 |
| }, |
| { |
| "epoch": 4.342797055730809, |
| "grad_norm": 0.4331588081741131, |
| "learning_rate": 1.5145960181795421e-05, |
| "loss": 0.1012, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09902848303318024, |
| "step": 4130, |
| "valid_targets_mean": 2521.4, |
| "valid_targets_min": 748 |
| }, |
| { |
| "epoch": 4.348054679284963, |
| "grad_norm": 0.589163336741105, |
| "learning_rate": 1.509510625460883e-05, |
| "loss": 0.0823, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09778404980897903, |
| "step": 4135, |
| "valid_targets_mean": 1524.1, |
| "valid_targets_min": 495 |
| }, |
| { |
| "epoch": 4.353312302839116, |
| "grad_norm": 0.3670017348685696, |
| "learning_rate": 1.5044286046094851e-05, |
| "loss": 0.0923, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.059174373745918274, |
| "step": 4140, |
| "valid_targets_mean": 2627.4, |
| "valid_targets_min": 622 |
| }, |
| { |
| "epoch": 4.358569926393271, |
| "grad_norm": 0.48446578892537395, |
| "learning_rate": 1.4993499905616823e-05, |
| "loss": 0.1088, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08301905542612076, |
| "step": 4145, |
| "valid_targets_mean": 3506.1, |
| "valid_targets_min": 1322 |
| }, |
| { |
| "epoch": 4.363827549947424, |
| "grad_norm": 0.38820467984517865, |
| "learning_rate": 1.494274818230387e-05, |
| "loss": 0.0844, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07928691059350967, |
| "step": 4150, |
| "valid_targets_mean": 3012.4, |
| "valid_targets_min": 814 |
| }, |
| { |
| "epoch": 4.369085173501578, |
| "grad_norm": 0.5483956191034934, |
| "learning_rate": 1.4892031225048503e-05, |
| "loss": 0.0742, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09606194496154785, |
| "step": 4155, |
| "valid_targets_mean": 3277.6, |
| "valid_targets_min": 841 |
| }, |
| { |
| "epoch": 4.374342797055731, |
| "grad_norm": 0.45645022712120253, |
| "learning_rate": 1.4841349382504247e-05, |
| "loss": 0.0891, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13126420974731445, |
| "step": 4160, |
| "valid_targets_mean": 3064.9, |
| "valid_targets_min": 1420 |
| }, |
| { |
| "epoch": 4.379600420609885, |
| "grad_norm": 0.44479202991000844, |
| "learning_rate": 1.4790703003083236e-05, |
| "loss": 0.1005, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08161349594593048, |
| "step": 4165, |
| "valid_targets_mean": 3118.6, |
| "valid_targets_min": 1109 |
| }, |
| { |
| "epoch": 4.384858044164038, |
| "grad_norm": 0.3939183122895328, |
| "learning_rate": 1.4740092434953793e-05, |
| "loss": 0.0661, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06900782883167267, |
| "step": 4170, |
| "valid_targets_mean": 2832.8, |
| "valid_targets_min": 619 |
| }, |
| { |
| "epoch": 4.390115667718192, |
| "grad_norm": 0.4395002196837855, |
| "learning_rate": 1.4689518026038065e-05, |
| "loss": 0.0879, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08298580348491669, |
| "step": 4175, |
| "valid_targets_mean": 2430.6, |
| "valid_targets_min": 486 |
| }, |
| { |
| "epoch": 4.395373291272345, |
| "grad_norm": 0.34186551874414745, |
| "learning_rate": 1.4638980124009649e-05, |
| "loss": 0.0774, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07223881781101227, |
| "step": 4180, |
| "valid_targets_mean": 4219.3, |
| "valid_targets_min": 1057 |
| }, |
| { |
| "epoch": 4.400630914826499, |
| "grad_norm": 0.3928156509702832, |
| "learning_rate": 1.458847907629113e-05, |
| "loss": 0.0677, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0738736093044281, |
| "step": 4185, |
| "valid_targets_mean": 4225.4, |
| "valid_targets_min": 1243 |
| }, |
| { |
| "epoch": 4.405888538380652, |
| "grad_norm": 0.3642115953222497, |
| "learning_rate": 1.4538015230051761e-05, |
| "loss": 0.0913, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07985761761665344, |
| "step": 4190, |
| "valid_targets_mean": 4028.9, |
| "valid_targets_min": 3172 |
| }, |
| { |
| "epoch": 4.411146161934806, |
| "grad_norm": 0.5022606162803077, |
| "learning_rate": 1.4487588932205072e-05, |
| "loss": 0.0766, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09595610201358795, |
| "step": 4195, |
| "valid_targets_mean": 1704.1, |
| "valid_targets_min": 660 |
| }, |
| { |
| "epoch": 4.416403785488959, |
| "grad_norm": 0.4345122992348086, |
| "learning_rate": 1.4437200529406425e-05, |
| "loss": 0.1067, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0982901006937027, |
| "step": 4200, |
| "valid_targets_mean": 2431.8, |
| "valid_targets_min": 564 |
| }, |
| { |
| "epoch": 4.421661409043113, |
| "grad_norm": 0.314203606139644, |
| "learning_rate": 1.4386850368050706e-05, |
| "loss": 0.0919, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.04750623181462288, |
| "step": 4205, |
| "valid_targets_mean": 3308.2, |
| "valid_targets_min": 929 |
| }, |
| { |
| "epoch": 4.426919032597266, |
| "grad_norm": 0.5640866700139815, |
| "learning_rate": 1.433653879426991e-05, |
| "loss": 0.0972, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18529458343982697, |
| "step": 4210, |
| "valid_targets_mean": 2929.4, |
| "valid_targets_min": 1301 |
| }, |
| { |
| "epoch": 4.4321766561514195, |
| "grad_norm": 0.36515961212609865, |
| "learning_rate": 1.4286266153930733e-05, |
| "loss": 0.0757, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07569369673728943, |
| "step": 4215, |
| "valid_targets_mean": 3690.6, |
| "valid_targets_min": 2619 |
| }, |
| { |
| "epoch": 4.437434279705573, |
| "grad_norm": 0.6230958647827156, |
| "learning_rate": 1.4236032792632251e-05, |
| "loss": 0.0863, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11252903193235397, |
| "step": 4220, |
| "valid_targets_mean": 1490.4, |
| "valid_targets_min": 559 |
| }, |
| { |
| "epoch": 4.4426919032597265, |
| "grad_norm": 0.38713085150221327, |
| "learning_rate": 1.4185839055703511e-05, |
| "loss": 0.0816, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07943620532751083, |
| "step": 4225, |
| "valid_targets_mean": 3594.6, |
| "valid_targets_min": 953 |
| }, |
| { |
| "epoch": 4.44794952681388, |
| "grad_norm": 0.6564390407327888, |
| "learning_rate": 1.4135685288201151e-05, |
| "loss": 0.1075, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10501672327518463, |
| "step": 4230, |
| "valid_targets_mean": 1447.7, |
| "valid_targets_min": 337 |
| }, |
| { |
| "epoch": 4.4532071503680335, |
| "grad_norm": 0.48223080610365265, |
| "learning_rate": 1.4085571834907046e-05, |
| "loss": 0.1099, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09758482873439789, |
| "step": 4235, |
| "valid_targets_mean": 2567.4, |
| "valid_targets_min": 503 |
| }, |
| { |
| "epoch": 4.458464773922187, |
| "grad_norm": 0.49714117568515587, |
| "learning_rate": 1.4035499040325946e-05, |
| "loss": 0.0866, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10407310724258423, |
| "step": 4240, |
| "valid_targets_mean": 2465.7, |
| "valid_targets_min": 529 |
| }, |
| { |
| "epoch": 4.4637223974763405, |
| "grad_norm": 0.42666048962566805, |
| "learning_rate": 1.3985467248683064e-05, |
| "loss": 0.0826, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0782807245850563, |
| "step": 4245, |
| "valid_targets_mean": 3539.2, |
| "valid_targets_min": 2556 |
| }, |
| { |
| "epoch": 4.468980021030494, |
| "grad_norm": 0.41848352102911673, |
| "learning_rate": 1.3935476803921755e-05, |
| "loss": 0.0808, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08888020366430283, |
| "step": 4250, |
| "valid_targets_mean": 3619.9, |
| "valid_targets_min": 2651 |
| }, |
| { |
| "epoch": 4.4742376445846475, |
| "grad_norm": 0.3516479297759341, |
| "learning_rate": 1.3885528049701148e-05, |
| "loss": 0.0722, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.061628080904483795, |
| "step": 4255, |
| "valid_targets_mean": 2919.1, |
| "valid_targets_min": 856 |
| }, |
| { |
| "epoch": 4.479495268138801, |
| "grad_norm": 0.9349437067749011, |
| "learning_rate": 1.3835621329393738e-05, |
| "loss": 0.0855, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11120863258838654, |
| "step": 4260, |
| "valid_targets_mean": 986.9, |
| "valid_targets_min": 563 |
| }, |
| { |
| "epoch": 4.484752891692954, |
| "grad_norm": 0.4242881723909972, |
| "learning_rate": 1.3785756986083091e-05, |
| "loss": 0.0835, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07287145406007767, |
| "step": 4265, |
| "valid_targets_mean": 2897.8, |
| "valid_targets_min": 719 |
| }, |
| { |
| "epoch": 4.490010515247108, |
| "grad_norm": 0.5127270491401, |
| "learning_rate": 1.3735935362561419e-05, |
| "loss": 0.0748, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0772905945777893, |
| "step": 4270, |
| "valid_targets_mean": 2242.0, |
| "valid_targets_min": 779 |
| }, |
| { |
| "epoch": 4.495268138801261, |
| "grad_norm": 0.4443005590319916, |
| "learning_rate": 1.3686156801327293e-05, |
| "loss": 0.0759, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08193336427211761, |
| "step": 4275, |
| "valid_targets_mean": 3736.4, |
| "valid_targets_min": 2538 |
| }, |
| { |
| "epoch": 4.500525762355416, |
| "grad_norm": 0.3143235531193856, |
| "learning_rate": 1.3636421644583231e-05, |
| "loss": 0.0854, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.05727476254105568, |
| "step": 4280, |
| "valid_targets_mean": 3932.6, |
| "valid_targets_min": 485 |
| }, |
| { |
| "epoch": 4.505783385909568, |
| "grad_norm": 0.2808451740638086, |
| "learning_rate": 1.3586730234233367e-05, |
| "loss": 0.0723, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06968601047992706, |
| "step": 4285, |
| "valid_targets_mean": 5130.1, |
| "valid_targets_min": 2551 |
| }, |
| { |
| "epoch": 4.511041009463723, |
| "grad_norm": 0.344999502670709, |
| "learning_rate": 1.3537082911881106e-05, |
| "loss": 0.0769, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07305177301168442, |
| "step": 4290, |
| "valid_targets_mean": 4516.9, |
| "valid_targets_min": 1320 |
| }, |
| { |
| "epoch": 4.516298633017876, |
| "grad_norm": 0.4689853049134904, |
| "learning_rate": 1.3487480018826772e-05, |
| "loss": 0.0815, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11492998898029327, |
| "step": 4295, |
| "valid_targets_mean": 3007.9, |
| "valid_targets_min": 872 |
| }, |
| { |
| "epoch": 4.52155625657203, |
| "grad_norm": 0.39631399060938494, |
| "learning_rate": 1.343792189606525e-05, |
| "loss": 0.1695, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07661318778991699, |
| "step": 4300, |
| "valid_targets_mean": 3173.8, |
| "valid_targets_min": 1015 |
| }, |
| { |
| "epoch": 4.526813880126183, |
| "grad_norm": 0.40943284951665426, |
| "learning_rate": 1.338840888428366e-05, |
| "loss": 0.0764, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.098414346575737, |
| "step": 4305, |
| "valid_targets_mean": 2640.1, |
| "valid_targets_min": 967 |
| }, |
| { |
| "epoch": 4.532071503680337, |
| "grad_norm": 0.35710688427983905, |
| "learning_rate": 1.3338941323859023e-05, |
| "loss": 0.0775, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06632598489522934, |
| "step": 4310, |
| "valid_targets_mean": 3444.8, |
| "valid_targets_min": 886 |
| }, |
| { |
| "epoch": 4.53732912723449, |
| "grad_norm": 0.3830759877809827, |
| "learning_rate": 1.3289519554855858e-05, |
| "loss": 0.1086, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08790523558855057, |
| "step": 4315, |
| "valid_targets_mean": 3194.1, |
| "valid_targets_min": 791 |
| }, |
| { |
| "epoch": 4.542586750788644, |
| "grad_norm": 0.7945478753892914, |
| "learning_rate": 1.3240143917023938e-05, |
| "loss": 0.166, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14951461553573608, |
| "step": 4320, |
| "valid_targets_mean": 1444.9, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 4.547844374342797, |
| "grad_norm": 0.8159241018273632, |
| "learning_rate": 1.3190814749795893e-05, |
| "loss": 0.1472, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1459198147058487, |
| "step": 4325, |
| "valid_targets_mean": 1505.5, |
| "valid_targets_min": 612 |
| }, |
| { |
| "epoch": 4.553101997896951, |
| "grad_norm": 0.7303639064389034, |
| "learning_rate": 1.3141532392284873e-05, |
| "loss": 0.1417, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15061330795288086, |
| "step": 4330, |
| "valid_targets_mean": 1533.9, |
| "valid_targets_min": 826 |
| }, |
| { |
| "epoch": 4.558359621451104, |
| "grad_norm": 0.740829826680204, |
| "learning_rate": 1.3092297183282261e-05, |
| "loss": 0.1345, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1273009181022644, |
| "step": 4335, |
| "valid_targets_mean": 1432.6, |
| "valid_targets_min": 742 |
| }, |
| { |
| "epoch": 4.563617245005258, |
| "grad_norm": 0.8158007699745509, |
| "learning_rate": 1.3043109461255305e-05, |
| "loss": 0.1455, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13618069887161255, |
| "step": 4340, |
| "valid_targets_mean": 1454.2, |
| "valid_targets_min": 718 |
| }, |
| { |
| "epoch": 4.568874868559411, |
| "grad_norm": 0.8071721059423621, |
| "learning_rate": 1.29939695643448e-05, |
| "loss": 0.1436, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14438077807426453, |
| "step": 4345, |
| "valid_targets_mean": 1536.6, |
| "valid_targets_min": 764 |
| }, |
| { |
| "epoch": 4.574132492113565, |
| "grad_norm": 0.7059567228513929, |
| "learning_rate": 1.2944877830362777e-05, |
| "loss": 0.13, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12112382799386978, |
| "step": 4350, |
| "valid_targets_mean": 1463.9, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 4.579390115667718, |
| "grad_norm": 0.7544977448865129, |
| "learning_rate": 1.289583459679017e-05, |
| "loss": 0.1466, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12211626023054123, |
| "step": 4355, |
| "valid_targets_mean": 1309.9, |
| "valid_targets_min": 610 |
| }, |
| { |
| "epoch": 4.584647739221872, |
| "grad_norm": 0.7973666318874467, |
| "learning_rate": 1.2846840200774484e-05, |
| "loss": 0.1319, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12944859266281128, |
| "step": 4360, |
| "valid_targets_mean": 1572.1, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 4.589905362776025, |
| "grad_norm": 0.7767630256039642, |
| "learning_rate": 1.2797894979127503e-05, |
| "loss": 0.1418, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1361657977104187, |
| "step": 4365, |
| "valid_targets_mean": 1453.9, |
| "valid_targets_min": 615 |
| }, |
| { |
| "epoch": 4.595162986330179, |
| "grad_norm": 0.8626282580061343, |
| "learning_rate": 1.2748999268322977e-05, |
| "loss": 0.1348, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14767375588417053, |
| "step": 4370, |
| "valid_targets_mean": 1378.6, |
| "valid_targets_min": 593 |
| }, |
| { |
| "epoch": 4.600420609884332, |
| "grad_norm": 0.7316399237208097, |
| "learning_rate": 1.2700153404494247e-05, |
| "loss": 0.1313, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12457281351089478, |
| "step": 4375, |
| "valid_targets_mean": 1543.1, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 4.605678233438486, |
| "grad_norm": 0.7013736108475105, |
| "learning_rate": 1.2651357723432027e-05, |
| "loss": 0.1264, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1074436604976654, |
| "step": 4380, |
| "valid_targets_mean": 1324.4, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 4.610935856992639, |
| "grad_norm": 0.7946982474845229, |
| "learning_rate": 1.2602612560582044e-05, |
| "loss": 0.1246, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12796643376350403, |
| "step": 4385, |
| "valid_targets_mean": 1525.5, |
| "valid_targets_min": 642 |
| }, |
| { |
| "epoch": 4.616193480546793, |
| "grad_norm": 0.836488544545557, |
| "learning_rate": 1.2553918251042701e-05, |
| "loss": 0.1227, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1317048966884613, |
| "step": 4390, |
| "valid_targets_mean": 1533.2, |
| "valid_targets_min": 518 |
| }, |
| { |
| "epoch": 4.621451104100946, |
| "grad_norm": 0.8514380451001026, |
| "learning_rate": 1.2505275129562851e-05, |
| "loss": 0.1387, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14332294464111328, |
| "step": 4395, |
| "valid_targets_mean": 1576.4, |
| "valid_targets_min": 728 |
| }, |
| { |
| "epoch": 4.6267087276550996, |
| "grad_norm": 1.208697841106686, |
| "learning_rate": 1.2456683530539446e-05, |
| "loss": 0.1329, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1436920166015625, |
| "step": 4400, |
| "valid_targets_mean": 1655.1, |
| "valid_targets_min": 764 |
| }, |
| { |
| "epoch": 4.631966351209253, |
| "grad_norm": 0.897663013325341, |
| "learning_rate": 1.2408143788015225e-05, |
| "loss": 0.1347, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14613816142082214, |
| "step": 4405, |
| "valid_targets_mean": 1437.8, |
| "valid_targets_min": 818 |
| }, |
| { |
| "epoch": 4.6372239747634065, |
| "grad_norm": 0.8310040544135672, |
| "learning_rate": 1.2359656235676468e-05, |
| "loss": 0.132, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.135333850979805, |
| "step": 4410, |
| "valid_targets_mean": 1445.7, |
| "valid_targets_min": 625 |
| }, |
| { |
| "epoch": 4.642481598317561, |
| "grad_norm": 0.7604022833256503, |
| "learning_rate": 1.231122120685066e-05, |
| "loss": 0.132, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14971643686294556, |
| "step": 4415, |
| "valid_targets_mean": 2116.2, |
| "valid_targets_min": 790 |
| }, |
| { |
| "epoch": 4.6477392218717135, |
| "grad_norm": 0.8552001064677958, |
| "learning_rate": 1.2262839034504208e-05, |
| "loss": 0.1364, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15442204475402832, |
| "step": 4420, |
| "valid_targets_mean": 1961.3, |
| "valid_targets_min": 891 |
| }, |
| { |
| "epoch": 4.652996845425868, |
| "grad_norm": 0.7378301844476287, |
| "learning_rate": 1.2214510051240164e-05, |
| "loss": 0.1279, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12409693002700806, |
| "step": 4425, |
| "valid_targets_mean": 1613.9, |
| "valid_targets_min": 719 |
| }, |
| { |
| "epoch": 4.658254468980021, |
| "grad_norm": 0.7693945857058191, |
| "learning_rate": 1.2166234589295951e-05, |
| "loss": 0.1244, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11707378923892975, |
| "step": 4430, |
| "valid_targets_mean": 1345.7, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 4.663512092534175, |
| "grad_norm": 0.8570609478621783, |
| "learning_rate": 1.2118012980541013e-05, |
| "loss": 0.123, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12476906180381775, |
| "step": 4435, |
| "valid_targets_mean": 1342.1, |
| "valid_targets_min": 783 |
| }, |
| { |
| "epoch": 4.668769716088328, |
| "grad_norm": 0.9049593410924867, |
| "learning_rate": 1.2069845556474626e-05, |
| "loss": 0.1317, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13999861478805542, |
| "step": 4440, |
| "valid_targets_mean": 1577.7, |
| "valid_targets_min": 629 |
| }, |
| { |
| "epoch": 4.674027339642482, |
| "grad_norm": 0.8151535597306059, |
| "learning_rate": 1.2021732648223553e-05, |
| "loss": 0.1286, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13140058517456055, |
| "step": 4445, |
| "valid_targets_mean": 1555.2, |
| "valid_targets_min": 678 |
| }, |
| { |
| "epoch": 4.679284963196635, |
| "grad_norm": 0.8326871207162568, |
| "learning_rate": 1.1973674586539791e-05, |
| "loss": 0.1318, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13513578474521637, |
| "step": 4450, |
| "valid_targets_mean": 1872.7, |
| "valid_targets_min": 1075 |
| }, |
| { |
| "epoch": 4.684542586750789, |
| "grad_norm": 0.7298449021906107, |
| "learning_rate": 1.1925671701798292e-05, |
| "loss": 0.1308, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13214683532714844, |
| "step": 4455, |
| "valid_targets_mean": 1689.4, |
| "valid_targets_min": 816 |
| }, |
| { |
| "epoch": 4.689800210304942, |
| "grad_norm": 0.732212063887265, |
| "learning_rate": 1.1877724323994704e-05, |
| "loss": 0.1265, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1377766877412796, |
| "step": 4460, |
| "valid_targets_mean": 1590.6, |
| "valid_targets_min": 957 |
| }, |
| { |
| "epoch": 4.695057833859096, |
| "grad_norm": 0.7988303959515105, |
| "learning_rate": 1.1829832782743074e-05, |
| "loss": 0.126, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11175388097763062, |
| "step": 4465, |
| "valid_targets_mean": 1282.1, |
| "valid_targets_min": 643 |
| }, |
| { |
| "epoch": 4.700315457413249, |
| "grad_norm": 1.2617076920205101, |
| "learning_rate": 1.178199740727362e-05, |
| "loss": 0.1326, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12699368596076965, |
| "step": 4470, |
| "valid_targets_mean": 1499.7, |
| "valid_targets_min": 726 |
| }, |
| { |
| "epoch": 4.705573080967403, |
| "grad_norm": 0.785573476623652, |
| "learning_rate": 1.1734218526430446e-05, |
| "loss": 0.1196, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12680059671401978, |
| "step": 4475, |
| "valid_targets_mean": 1661.6, |
| "valid_targets_min": 705 |
| }, |
| { |
| "epoch": 4.710830704521556, |
| "grad_norm": 0.7920478719928555, |
| "learning_rate": 1.1686496468669269e-05, |
| "loss": 0.1259, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.129095658659935, |
| "step": 4480, |
| "valid_targets_mean": 1541.8, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 4.71608832807571, |
| "grad_norm": 0.8046030564615865, |
| "learning_rate": 1.1638831562055191e-05, |
| "loss": 0.1144, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1118820309638977, |
| "step": 4485, |
| "valid_targets_mean": 1254.4, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 4.721345951629863, |
| "grad_norm": 0.8216827190777027, |
| "learning_rate": 1.1591224134260425e-05, |
| "loss": 0.1291, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12793757021427155, |
| "step": 4490, |
| "valid_targets_mean": 1480.7, |
| "valid_targets_min": 817 |
| }, |
| { |
| "epoch": 4.726603575184017, |
| "grad_norm": 0.7664188966315137, |
| "learning_rate": 1.1543674512562037e-05, |
| "loss": 0.1221, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11799920350313187, |
| "step": 4495, |
| "valid_targets_mean": 1500.8, |
| "valid_targets_min": 859 |
| }, |
| { |
| "epoch": 4.73186119873817, |
| "grad_norm": 0.8143892390058612, |
| "learning_rate": 1.1496183023839729e-05, |
| "loss": 0.1228, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12582817673683167, |
| "step": 4500, |
| "valid_targets_mean": 1444.4, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 4.737118822292324, |
| "grad_norm": 0.8079274500118241, |
| "learning_rate": 1.144874999457354e-05, |
| "loss": 0.127, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1219254806637764, |
| "step": 4505, |
| "valid_targets_mean": 1543.0, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 4.742376445846477, |
| "grad_norm": 1.015280520568438, |
| "learning_rate": 1.1401375750841637e-05, |
| "loss": 0.1278, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14074096083641052, |
| "step": 4510, |
| "valid_targets_mean": 1537.0, |
| "valid_targets_min": 739 |
| }, |
| { |
| "epoch": 4.747634069400631, |
| "grad_norm": 0.7962125243018413, |
| "learning_rate": 1.1354060618318086e-05, |
| "loss": 0.1201, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11099829524755478, |
| "step": 4515, |
| "valid_targets_mean": 1405.6, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 4.752891692954784, |
| "grad_norm": 0.8283255518293589, |
| "learning_rate": 1.1306804922270568e-05, |
| "loss": 0.1273, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12911732494831085, |
| "step": 4520, |
| "valid_targets_mean": 1288.9, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 4.758149316508938, |
| "grad_norm": 0.8385770475579886, |
| "learning_rate": 1.1259608987558175e-05, |
| "loss": 0.1326, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1268160194158554, |
| "step": 4525, |
| "valid_targets_mean": 1417.9, |
| "valid_targets_min": 864 |
| }, |
| { |
| "epoch": 4.763406940063091, |
| "grad_norm": 0.7967087061254764, |
| "learning_rate": 1.1212473138629187e-05, |
| "loss": 0.1357, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15874139964580536, |
| "step": 4530, |
| "valid_targets_mean": 1802.4, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 4.768664563617245, |
| "grad_norm": 0.7687312421179785, |
| "learning_rate": 1.1165397699518797e-05, |
| "loss": 0.122, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12358520925045013, |
| "step": 4535, |
| "valid_targets_mean": 1598.1, |
| "valid_targets_min": 607 |
| }, |
| { |
| "epoch": 4.773922187171398, |
| "grad_norm": 0.7880613162003823, |
| "learning_rate": 1.1118382993846933e-05, |
| "loss": 0.123, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1260160207748413, |
| "step": 4540, |
| "valid_targets_mean": 1596.9, |
| "valid_targets_min": 551 |
| }, |
| { |
| "epoch": 4.779179810725552, |
| "grad_norm": 0.9236915829620165, |
| "learning_rate": 1.1071429344816003e-05, |
| "loss": 0.1283, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13443315029144287, |
| "step": 4545, |
| "valid_targets_mean": 1560.6, |
| "valid_targets_min": 676 |
| }, |
| { |
| "epoch": 4.784437434279706, |
| "grad_norm": 0.7743973423226425, |
| "learning_rate": 1.102453707520867e-05, |
| "loss": 0.121, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11765165627002716, |
| "step": 4550, |
| "valid_targets_mean": 1433.0, |
| "valid_targets_min": 904 |
| }, |
| { |
| "epoch": 4.789695057833859, |
| "grad_norm": 0.8071992905794766, |
| "learning_rate": 1.0977706507385673e-05, |
| "loss": 0.1183, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1253742277622223, |
| "step": 4555, |
| "valid_targets_mean": 1579.9, |
| "valid_targets_min": 859 |
| }, |
| { |
| "epoch": 4.794952681388013, |
| "grad_norm": 0.868862346119955, |
| "learning_rate": 1.0930937963283554e-05, |
| "loss": 0.1139, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1047426164150238, |
| "step": 4560, |
| "valid_targets_mean": 1260.7, |
| "valid_targets_min": 737 |
| }, |
| { |
| "epoch": 4.8002103049421665, |
| "grad_norm": 1.0201634985518764, |
| "learning_rate": 1.088423176441248e-05, |
| "loss": 0.1372, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1578216701745987, |
| "step": 4565, |
| "valid_targets_mean": 1363.2, |
| "valid_targets_min": 791 |
| }, |
| { |
| "epoch": 4.80546792849632, |
| "grad_norm": 1.3970164039340136, |
| "learning_rate": 1.0837588231854044e-05, |
| "loss": 0.1273, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12821730971336365, |
| "step": 4570, |
| "valid_targets_mean": 1556.6, |
| "valid_targets_min": 786 |
| }, |
| { |
| "epoch": 4.8107255520504735, |
| "grad_norm": 0.7615654323398265, |
| "learning_rate": 1.0791007686259019e-05, |
| "loss": 0.1212, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12050158530473709, |
| "step": 4575, |
| "valid_targets_mean": 1497.9, |
| "valid_targets_min": 944 |
| }, |
| { |
| "epoch": 4.815983175604627, |
| "grad_norm": 0.7560936854789975, |
| "learning_rate": 1.0744490447845172e-05, |
| "loss": 0.1212, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11557275056838989, |
| "step": 4580, |
| "valid_targets_mean": 1512.4, |
| "valid_targets_min": 1075 |
| }, |
| { |
| "epoch": 4.8212407991587805, |
| "grad_norm": 0.76464313423748, |
| "learning_rate": 1.0698036836395084e-05, |
| "loss": 0.1298, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11230018734931946, |
| "step": 4585, |
| "valid_targets_mean": 1369.5, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 4.826498422712934, |
| "grad_norm": 0.754682059107476, |
| "learning_rate": 1.0651647171253936e-05, |
| "loss": 0.1258, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13564129173755646, |
| "step": 4590, |
| "valid_targets_mean": 1787.8, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 4.831756046267087, |
| "grad_norm": 0.8308300539524623, |
| "learning_rate": 1.0605321771327267e-05, |
| "loss": 0.1214, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12371359765529633, |
| "step": 4595, |
| "valid_targets_mean": 1276.7, |
| "valid_targets_min": 636 |
| }, |
| { |
| "epoch": 4.837013669821241, |
| "grad_norm": 0.7805308522905999, |
| "learning_rate": 1.0559060955078873e-05, |
| "loss": 0.1241, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1222592443227768, |
| "step": 4600, |
| "valid_targets_mean": 1357.9, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 4.842271293375394, |
| "grad_norm": 0.7912110021336274, |
| "learning_rate": 1.0512865040528558e-05, |
| "loss": 0.1151, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11543069779872894, |
| "step": 4605, |
| "valid_targets_mean": 1406.5, |
| "valid_targets_min": 798 |
| }, |
| { |
| "epoch": 4.847528916929548, |
| "grad_norm": 0.8003234420781086, |
| "learning_rate": 1.0466734345249946e-05, |
| "loss": 0.1261, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12565967440605164, |
| "step": 4610, |
| "valid_targets_mean": 1440.1, |
| "valid_targets_min": 661 |
| }, |
| { |
| "epoch": 4.852786540483701, |
| "grad_norm": 0.7882384000400848, |
| "learning_rate": 1.0420669186368311e-05, |
| "loss": 0.1276, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.120156429708004, |
| "step": 4615, |
| "valid_targets_mean": 1596.6, |
| "valid_targets_min": 665 |
| }, |
| { |
| "epoch": 4.858044164037855, |
| "grad_norm": 0.8009284309186396, |
| "learning_rate": 1.0374669880558419e-05, |
| "loss": 0.1223, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1342923641204834, |
| "step": 4620, |
| "valid_targets_mean": 1530.6, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 4.863301787592008, |
| "grad_norm": 1.7711500546802992, |
| "learning_rate": 1.0328736744042311e-05, |
| "loss": 0.1248, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13028481602668762, |
| "step": 4625, |
| "valid_targets_mean": 1283.8, |
| "valid_targets_min": 632 |
| }, |
| { |
| "epoch": 4.868559411146162, |
| "grad_norm": 0.8468071375182229, |
| "learning_rate": 1.0282870092587144e-05, |
| "loss": 0.1232, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1261577606201172, |
| "step": 4630, |
| "valid_targets_mean": 1624.0, |
| "valid_targets_min": 922 |
| }, |
| { |
| "epoch": 4.873817034700315, |
| "grad_norm": 0.8198781196743831, |
| "learning_rate": 1.023707024150305e-05, |
| "loss": 0.1215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1221533939242363, |
| "step": 4635, |
| "valid_targets_mean": 1669.9, |
| "valid_targets_min": 710 |
| }, |
| { |
| "epoch": 4.879074658254469, |
| "grad_norm": 0.8275894146719602, |
| "learning_rate": 1.0191337505640905e-05, |
| "loss": 0.1247, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12306816130876541, |
| "step": 4640, |
| "valid_targets_mean": 1442.4, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 4.884332281808622, |
| "grad_norm": 0.9384229870980241, |
| "learning_rate": 1.0145672199390226e-05, |
| "loss": 0.1266, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13839933276176453, |
| "step": 4645, |
| "valid_targets_mean": 1527.7, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 4.889589905362776, |
| "grad_norm": 0.8101343521882212, |
| "learning_rate": 1.010007463667699e-05, |
| "loss": 0.1213, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10069465637207031, |
| "step": 4650, |
| "valid_targets_mean": 1314.2, |
| "valid_targets_min": 748 |
| }, |
| { |
| "epoch": 4.894847528916929, |
| "grad_norm": 0.8541728633286423, |
| "learning_rate": 1.0054545130961441e-05, |
| "loss": 0.1266, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13769134879112244, |
| "step": 4655, |
| "valid_targets_mean": 1612.8, |
| "valid_targets_min": 729 |
| }, |
| { |
| "epoch": 4.900105152471083, |
| "grad_norm": 0.7799175937067486, |
| "learning_rate": 1.0009083995236009e-05, |
| "loss": 0.1326, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1174919605255127, |
| "step": 4660, |
| "valid_targets_mean": 1687.0, |
| "valid_targets_min": 1219 |
| }, |
| { |
| "epoch": 4.905362776025236, |
| "grad_norm": 1.3613215932621778, |
| "learning_rate": 9.963691542023079e-06, |
| "loss": 0.1269, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13345009088516235, |
| "step": 4665, |
| "valid_targets_mean": 1607.8, |
| "valid_targets_min": 782 |
| }, |
| { |
| "epoch": 4.91062039957939, |
| "grad_norm": 0.8126163300119403, |
| "learning_rate": 9.918368083372884e-06, |
| "loss": 0.1279, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12136229872703552, |
| "step": 4670, |
| "valid_targets_mean": 1379.3, |
| "valid_targets_min": 646 |
| }, |
| { |
| "epoch": 4.915878023133543, |
| "grad_norm": 0.8639388638908597, |
| "learning_rate": 9.87311393086138e-06, |
| "loss": 0.1196, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10908423364162445, |
| "step": 4675, |
| "valid_targets_mean": 1256.9, |
| "valid_targets_min": 723 |
| }, |
| { |
| "epoch": 4.921135646687697, |
| "grad_norm": 0.7963428047425778, |
| "learning_rate": 9.827929395588048e-06, |
| "loss": 0.1188, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11582878232002258, |
| "step": 4680, |
| "valid_targets_mean": 1459.7, |
| "valid_targets_min": 808 |
| }, |
| { |
| "epoch": 4.926393270241851, |
| "grad_norm": 0.8657933451916608, |
| "learning_rate": 9.782814788173787e-06, |
| "loss": 0.1268, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11620990931987762, |
| "step": 4685, |
| "valid_targets_mean": 1199.5, |
| "valid_targets_min": 687 |
| }, |
| { |
| "epoch": 4.931650893796004, |
| "grad_norm": 0.9637532954258561, |
| "learning_rate": 9.737770418758808e-06, |
| "loss": 0.1275, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13756226003170013, |
| "step": 4690, |
| "valid_targets_mean": 1432.8, |
| "valid_targets_min": 821 |
| }, |
| { |
| "epoch": 4.936908517350158, |
| "grad_norm": 0.7850173702703062, |
| "learning_rate": 9.692796597000438e-06, |
| "loss": 0.1165, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1191292256116867, |
| "step": 4695, |
| "valid_targets_mean": 1396.9, |
| "valid_targets_min": 849 |
| }, |
| { |
| "epoch": 4.942166140904312, |
| "grad_norm": 0.7210857731252445, |
| "learning_rate": 9.64789363207103e-06, |
| "loss": 0.1232, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11677803844213486, |
| "step": 4700, |
| "valid_targets_mean": 1501.5, |
| "valid_targets_min": 781 |
| }, |
| { |
| "epoch": 4.947423764458465, |
| "grad_norm": 1.0059628711103958, |
| "learning_rate": 9.603061832655847e-06, |
| "loss": 0.1393, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12605084478855133, |
| "step": 4705, |
| "valid_targets_mean": 1288.9, |
| "valid_targets_min": 522 |
| }, |
| { |
| "epoch": 4.952681388012619, |
| "grad_norm": 0.7556576345689628, |
| "learning_rate": 9.55830150695093e-06, |
| "loss": 0.1203, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11564737558364868, |
| "step": 4710, |
| "valid_targets_mean": 1319.4, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 4.957939011566772, |
| "grad_norm": 0.7452979604008588, |
| "learning_rate": 9.513612962660935e-06, |
| "loss": 0.1283, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1319214403629303, |
| "step": 4715, |
| "valid_targets_mean": 1891.6, |
| "valid_targets_min": 868 |
| }, |
| { |
| "epoch": 4.963196635120926, |
| "grad_norm": 0.7258473263248048, |
| "learning_rate": 9.468996506997093e-06, |
| "loss": 0.1132, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10901002585887909, |
| "step": 4720, |
| "valid_targets_mean": 1526.8, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 4.968454258675079, |
| "grad_norm": 1.2246128753791785, |
| "learning_rate": 9.424452446675059e-06, |
| "loss": 0.1205, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1299336850643158, |
| "step": 4725, |
| "valid_targets_mean": 1459.1, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 4.9737118822292326, |
| "grad_norm": 0.7683030748729777, |
| "learning_rate": 9.379981087912795e-06, |
| "loss": 0.1217, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1210971400141716, |
| "step": 4730, |
| "valid_targets_mean": 1645.1, |
| "valid_targets_min": 639 |
| }, |
| { |
| "epoch": 4.978969505783386, |
| "grad_norm": 0.8315456582596747, |
| "learning_rate": 9.33558273642848e-06, |
| "loss": 0.1238, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1232328936457634, |
| "step": 4735, |
| "valid_targets_mean": 1465.1, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 4.9842271293375395, |
| "grad_norm": 0.7864143724400168, |
| "learning_rate": 9.291257697438393e-06, |
| "loss": 0.1259, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11987664550542831, |
| "step": 4740, |
| "valid_targets_mean": 1330.8, |
| "valid_targets_min": 874 |
| }, |
| { |
| "epoch": 4.989484752891693, |
| "grad_norm": 0.7133269460670625, |
| "learning_rate": 9.247006275654861e-06, |
| "loss": 0.1257, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11359377950429916, |
| "step": 4745, |
| "valid_targets_mean": 1435.4, |
| "valid_targets_min": 557 |
| }, |
| { |
| "epoch": 4.9947423764458465, |
| "grad_norm": 0.7784602365116468, |
| "learning_rate": 9.202828775284101e-06, |
| "loss": 0.1272, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1337217092514038, |
| "step": 4750, |
| "valid_targets_mean": 1512.6, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 5.0, |
| "grad_norm": 1.6038131287991952, |
| "learning_rate": 9.158725500024148e-06, |
| "loss": 0.1169, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09238367527723312, |
| "step": 4755, |
| "valid_targets_mean": 1517.8, |
| "valid_targets_min": 393 |
| }, |
| { |
| "epoch": 5.0052576235541535, |
| "grad_norm": 0.6514182119046302, |
| "learning_rate": 9.114696753062816e-06, |
| "loss": 0.1084, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10457351058721542, |
| "step": 4760, |
| "valid_targets_mean": 3146.7, |
| "valid_targets_min": 458 |
| }, |
| { |
| "epoch": 5.010515247108307, |
| "grad_norm": 0.5332647148272626, |
| "learning_rate": 9.07074283707554e-06, |
| "loss": 0.0834, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0893528163433075, |
| "step": 4765, |
| "valid_targets_mean": 3025.6, |
| "valid_targets_min": 1024 |
| }, |
| { |
| "epoch": 5.0157728706624605, |
| "grad_norm": 0.4048154278319103, |
| "learning_rate": 9.026864054223337e-06, |
| "loss": 0.0743, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07158604264259338, |
| "step": 4770, |
| "valid_targets_mean": 3472.4, |
| "valid_targets_min": 2068 |
| }, |
| { |
| "epoch": 5.021030494216614, |
| "grad_norm": 0.41699658709527704, |
| "learning_rate": 8.98306070615073e-06, |
| "loss": 0.0961, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0876985713839531, |
| "step": 4775, |
| "valid_targets_mean": 3615.2, |
| "valid_targets_min": 2425 |
| }, |
| { |
| "epoch": 5.0262881177707674, |
| "grad_norm": 0.44506837741995803, |
| "learning_rate": 8.93933309398368e-06, |
| "loss": 0.0753, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08160410076379776, |
| "step": 4780, |
| "valid_targets_mean": 2989.8, |
| "valid_targets_min": 1134 |
| }, |
| { |
| "epoch": 5.031545741324921, |
| "grad_norm": 0.7118010340465436, |
| "learning_rate": 8.89568151832745e-06, |
| "loss": 0.0902, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13030403852462769, |
| "step": 4785, |
| "valid_targets_mean": 1482.1, |
| "valid_targets_min": 663 |
| }, |
| { |
| "epoch": 5.036803364879074, |
| "grad_norm": 0.43286415544488827, |
| "learning_rate": 8.852106279264643e-06, |
| "loss": 0.1251, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07963715493679047, |
| "step": 4790, |
| "valid_targets_mean": 3055.2, |
| "valid_targets_min": 535 |
| }, |
| { |
| "epoch": 5.042060988433228, |
| "grad_norm": 0.9861467550286874, |
| "learning_rate": 8.808607676353074e-06, |
| "loss": 0.0839, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1039944589138031, |
| "step": 4795, |
| "valid_targets_mean": 2707.1, |
| "valid_targets_min": 781 |
| }, |
| { |
| "epoch": 5.047318611987381, |
| "grad_norm": 0.40964999165357524, |
| "learning_rate": 8.765186008623706e-06, |
| "loss": 0.0923, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06370392441749573, |
| "step": 4800, |
| "valid_targets_mean": 3210.4, |
| "valid_targets_min": 799 |
| }, |
| { |
| "epoch": 5.052576235541535, |
| "grad_norm": 0.3516054895874076, |
| "learning_rate": 8.721841574578617e-06, |
| "loss": 0.1002, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06767348200082779, |
| "step": 4805, |
| "valid_targets_mean": 4841.1, |
| "valid_targets_min": 2802 |
| }, |
| { |
| "epoch": 5.057833859095688, |
| "grad_norm": 0.3481304659858112, |
| "learning_rate": 8.678574672188963e-06, |
| "loss": 0.0726, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0681026354432106, |
| "step": 4810, |
| "valid_targets_mean": 3151.8, |
| "valid_targets_min": 574 |
| }, |
| { |
| "epoch": 5.063091482649842, |
| "grad_norm": 0.40107835502295897, |
| "learning_rate": 8.635385598892881e-06, |
| "loss": 0.0808, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07781557738780975, |
| "step": 4815, |
| "valid_targets_mean": 3383.4, |
| "valid_targets_min": 813 |
| }, |
| { |
| "epoch": 5.068349106203995, |
| "grad_norm": 0.5052660946712588, |
| "learning_rate": 8.592274651593482e-06, |
| "loss": 0.0826, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10154666751623154, |
| "step": 4820, |
| "valid_targets_mean": 1778.0, |
| "valid_targets_min": 593 |
| }, |
| { |
| "epoch": 5.07360672975815, |
| "grad_norm": 0.3967680488405485, |
| "learning_rate": 8.549242126656814e-06, |
| "loss": 0.1055, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0746898278594017, |
| "step": 4825, |
| "valid_targets_mean": 3196.0, |
| "valid_targets_min": 1185 |
| }, |
| { |
| "epoch": 5.078864353312303, |
| "grad_norm": 0.48598413120719736, |
| "learning_rate": 8.506288319909793e-06, |
| "loss": 0.0761, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09186248481273651, |
| "step": 4830, |
| "valid_targets_mean": 2149.3, |
| "valid_targets_min": 376 |
| }, |
| { |
| "epoch": 5.084121976866457, |
| "grad_norm": 0.3694068547296513, |
| "learning_rate": 8.463413526638186e-06, |
| "loss": 0.0743, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.05531078949570656, |
| "step": 4835, |
| "valid_targets_mean": 2858.6, |
| "valid_targets_min": 910 |
| }, |
| { |
| "epoch": 5.08937960042061, |
| "grad_norm": 0.36398983255043665, |
| "learning_rate": 8.420618041584604e-06, |
| "loss": 0.0695, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06922632455825806, |
| "step": 4840, |
| "valid_targets_mean": 3631.7, |
| "valid_targets_min": 2798 |
| }, |
| { |
| "epoch": 5.094637223974764, |
| "grad_norm": 0.4399738570718081, |
| "learning_rate": 8.377902158946427e-06, |
| "loss": 0.088, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07904906570911407, |
| "step": 4845, |
| "valid_targets_mean": 2579.2, |
| "valid_targets_min": 471 |
| }, |
| { |
| "epoch": 5.099894847528917, |
| "grad_norm": 0.43699878117852287, |
| "learning_rate": 8.335266172373832e-06, |
| "loss": 0.0868, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09182636439800262, |
| "step": 4850, |
| "valid_targets_mean": 2538.1, |
| "valid_targets_min": 592 |
| }, |
| { |
| "epoch": 5.105152471083071, |
| "grad_norm": 0.4276822940660941, |
| "learning_rate": 8.292710374967737e-06, |
| "loss": 0.0883, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07803415507078171, |
| "step": 4855, |
| "valid_targets_mean": 3127.5, |
| "valid_targets_min": 474 |
| }, |
| { |
| "epoch": 5.110410094637224, |
| "grad_norm": 0.3933818399998093, |
| "learning_rate": 8.250235059277792e-06, |
| "loss": 0.087, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06888704001903534, |
| "step": 4860, |
| "valid_targets_mean": 3146.4, |
| "valid_targets_min": 511 |
| }, |
| { |
| "epoch": 5.115667718191378, |
| "grad_norm": 0.33976806239483487, |
| "learning_rate": 8.207840517300398e-06, |
| "loss": 0.1173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06624825298786163, |
| "step": 4865, |
| "valid_targets_mean": 3607.5, |
| "valid_targets_min": 902 |
| }, |
| { |
| "epoch": 5.120925341745531, |
| "grad_norm": 0.3779553364618703, |
| "learning_rate": 8.165527040476666e-06, |
| "loss": 0.0727, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07322365790605545, |
| "step": 4870, |
| "valid_targets_mean": 3110.1, |
| "valid_targets_min": 1643 |
| }, |
| { |
| "epoch": 5.126182965299685, |
| "grad_norm": 0.7347127055328346, |
| "learning_rate": 8.123294919690413e-06, |
| "loss": 0.0997, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1254892796278, |
| "step": 4875, |
| "valid_targets_mean": 1258.1, |
| "valid_targets_min": 534 |
| }, |
| { |
| "epoch": 5.131440588853838, |
| "grad_norm": 0.5231134248611237, |
| "learning_rate": 8.081144445266201e-06, |
| "loss": 0.1016, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11238907277584076, |
| "step": 4880, |
| "valid_targets_mean": 2217.8, |
| "valid_targets_min": 568 |
| }, |
| { |
| "epoch": 5.136698212407992, |
| "grad_norm": 0.40060853601446167, |
| "learning_rate": 8.039075906967293e-06, |
| "loss": 0.0796, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06358352303504944, |
| "step": 4885, |
| "valid_targets_mean": 3244.5, |
| "valid_targets_min": 895 |
| }, |
| { |
| "epoch": 5.141955835962145, |
| "grad_norm": 0.5898279787013545, |
| "learning_rate": 7.99708959399368e-06, |
| "loss": 0.1907, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33314186334609985, |
| "step": 4890, |
| "valid_targets_mean": 2774.1, |
| "valid_targets_min": 652 |
| }, |
| { |
| "epoch": 5.147213459516299, |
| "grad_norm": 0.5900615778222683, |
| "learning_rate": 7.955185794980117e-06, |
| "loss": 0.1752, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09325223416090012, |
| "step": 4895, |
| "valid_targets_mean": 2957.4, |
| "valid_targets_min": 756 |
| }, |
| { |
| "epoch": 5.152471083070452, |
| "grad_norm": 0.3493784700696294, |
| "learning_rate": 7.913364797994111e-06, |
| "loss": 0.0909, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06689581274986267, |
| "step": 4900, |
| "valid_targets_mean": 3300.6, |
| "valid_targets_min": 1332 |
| }, |
| { |
| "epoch": 5.157728706624606, |
| "grad_norm": 0.6890612781720892, |
| "learning_rate": 7.871626890533917e-06, |
| "loss": 0.1563, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38341882824897766, |
| "step": 4905, |
| "valid_targets_mean": 2650.0, |
| "valid_targets_min": 1153 |
| }, |
| { |
| "epoch": 5.162986330178759, |
| "grad_norm": 0.26960096488962104, |
| "learning_rate": 7.829972359526626e-06, |
| "loss": 0.099, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.05556825175881386, |
| "step": 4910, |
| "valid_targets_mean": 3956.4, |
| "valid_targets_min": 636 |
| }, |
| { |
| "epoch": 5.168243953732913, |
| "grad_norm": 0.4073505139709832, |
| "learning_rate": 7.788401491326155e-06, |
| "loss": 0.0814, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07316970080137253, |
| "step": 4915, |
| "valid_targets_mean": 4346.1, |
| "valid_targets_min": 789 |
| }, |
| { |
| "epoch": 5.173501577287066, |
| "grad_norm": 0.4741269825632689, |
| "learning_rate": 7.746914571711264e-06, |
| "loss": 0.0876, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09850576519966125, |
| "step": 4920, |
| "valid_targets_mean": 3998.4, |
| "valid_targets_min": 995 |
| }, |
| { |
| "epoch": 5.1787592008412195, |
| "grad_norm": 0.35573245348833904, |
| "learning_rate": 7.705511885883612e-06, |
| "loss": 0.0766, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06487403064966202, |
| "step": 4925, |
| "valid_targets_mean": 2673.9, |
| "valid_targets_min": 488 |
| }, |
| { |
| "epoch": 5.184016824395373, |
| "grad_norm": 0.42349130867265483, |
| "learning_rate": 7.664193718465814e-06, |
| "loss": 0.0775, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08160026371479034, |
| "step": 4930, |
| "valid_targets_mean": 3398.1, |
| "valid_targets_min": 829 |
| }, |
| { |
| "epoch": 5.1892744479495265, |
| "grad_norm": 0.47272980154521393, |
| "learning_rate": 7.622960353499438e-06, |
| "loss": 0.0719, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07984272390604019, |
| "step": 4935, |
| "valid_targets_mean": 1999.6, |
| "valid_targets_min": 712 |
| }, |
| { |
| "epoch": 5.19453207150368, |
| "grad_norm": 0.43914782298921917, |
| "learning_rate": 7.581812074443084e-06, |
| "loss": 0.0756, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06791958212852478, |
| "step": 4940, |
| "valid_targets_mean": 3241.9, |
| "valid_targets_min": 1770 |
| }, |
| { |
| "epoch": 5.1997896950578335, |
| "grad_norm": 0.3864436152446525, |
| "learning_rate": 7.5407491641704464e-06, |
| "loss": 0.0663, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07457704097032547, |
| "step": 4945, |
| "valid_targets_mean": 3626.0, |
| "valid_targets_min": 2141 |
| }, |
| { |
| "epoch": 5.205047318611987, |
| "grad_norm": 0.35044737647984947, |
| "learning_rate": 7.499771904968332e-06, |
| "loss": 0.1158, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.052602969110012054, |
| "step": 4950, |
| "valid_targets_mean": 3509.4, |
| "valid_targets_min": 772 |
| }, |
| { |
| "epoch": 5.2103049421661405, |
| "grad_norm": 0.3682233382984248, |
| "learning_rate": 7.45888057853474e-06, |
| "loss": 0.0591, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0617450550198555, |
| "step": 4955, |
| "valid_targets_mean": 3345.5, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 5.215562565720294, |
| "grad_norm": 0.32195724343265864, |
| "learning_rate": 7.418075465976944e-06, |
| "loss": 0.0659, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0546148344874382, |
| "step": 4960, |
| "valid_targets_mean": 3691.8, |
| "valid_targets_min": 2535 |
| }, |
| { |
| "epoch": 5.220820189274448, |
| "grad_norm": 0.41300333178467796, |
| "learning_rate": 7.3773568478095184e-06, |
| "loss": 0.0698, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07229484617710114, |
| "step": 4965, |
| "valid_targets_mean": 3218.2, |
| "valid_targets_min": 792 |
| }, |
| { |
| "epoch": 5.226077812828602, |
| "grad_norm": 0.5937927789787139, |
| "learning_rate": 7.336725003952456e-06, |
| "loss": 0.0855, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1006106436252594, |
| "step": 4970, |
| "valid_targets_mean": 1420.5, |
| "valid_targets_min": 490 |
| }, |
| { |
| "epoch": 5.231335436382755, |
| "grad_norm": 0.39459409655587835, |
| "learning_rate": 7.296180213729196e-06, |
| "loss": 0.0973, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07352457195520401, |
| "step": 4975, |
| "valid_targets_mean": 3622.2, |
| "valid_targets_min": 1196 |
| }, |
| { |
| "epoch": 5.236593059936909, |
| "grad_norm": 0.5448656901779764, |
| "learning_rate": 7.255722755864734e-06, |
| "loss": 0.1023, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09215372055768967, |
| "step": 4980, |
| "valid_targets_mean": 1924.2, |
| "valid_targets_min": 575 |
| }, |
| { |
| "epoch": 5.241850683491062, |
| "grad_norm": 0.4629237288534348, |
| "learning_rate": 7.21535290848372e-06, |
| "loss": 0.0792, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07311743497848511, |
| "step": 4985, |
| "valid_targets_mean": 2185.2, |
| "valid_targets_min": 524 |
| }, |
| { |
| "epoch": 5.247108307045216, |
| "grad_norm": 0.48104993266342294, |
| "learning_rate": 7.175070949108496e-06, |
| "loss": 0.0926, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08028687536716461, |
| "step": 4990, |
| "valid_targets_mean": 2365.2, |
| "valid_targets_min": 542 |
| }, |
| { |
| "epoch": 5.252365930599369, |
| "grad_norm": 0.4173499338874757, |
| "learning_rate": 7.1348771546572315e-06, |
| "loss": 0.1088, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07379268109798431, |
| "step": 4995, |
| "valid_targets_mean": 2925.8, |
| "valid_targets_min": 803 |
| }, |
| { |
| "epoch": 5.257623554153523, |
| "grad_norm": 0.41167750219474414, |
| "learning_rate": 7.09477180144202e-06, |
| "loss": 0.0805, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0672680214047432, |
| "step": 5000, |
| "valid_targets_mean": 2462.1, |
| "valid_targets_min": 629 |
| }, |
| { |
| "epoch": 5.262881177707676, |
| "grad_norm": 0.5108952717509712, |
| "learning_rate": 7.054755165166945e-06, |
| "loss": 0.0991, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07695017009973526, |
| "step": 5005, |
| "valid_targets_mean": 3909.5, |
| "valid_targets_min": 2393 |
| }, |
| { |
| "epoch": 5.26813880126183, |
| "grad_norm": 0.4127112236560906, |
| "learning_rate": 7.014827520926206e-06, |
| "loss": 0.0822, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07801535725593567, |
| "step": 5010, |
| "valid_targets_mean": 3106.2, |
| "valid_targets_min": 804 |
| }, |
| { |
| "epoch": 5.273396424815983, |
| "grad_norm": 0.40217260439051994, |
| "learning_rate": 6.9749891432022505e-06, |
| "loss": 0.0777, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.096265509724617, |
| "step": 5015, |
| "valid_targets_mean": 4407.3, |
| "valid_targets_min": 1549 |
| }, |
| { |
| "epoch": 5.278654048370137, |
| "grad_norm": 0.48236759326871753, |
| "learning_rate": 6.935240305863844e-06, |
| "loss": 0.0683, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07525777816772461, |
| "step": 5020, |
| "valid_targets_mean": 2631.7, |
| "valid_targets_min": 596 |
| }, |
| { |
| "epoch": 5.28391167192429, |
| "grad_norm": 0.3804505362132347, |
| "learning_rate": 6.895581282164201e-06, |
| "loss": 0.0686, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.062346745282411575, |
| "step": 5025, |
| "valid_targets_mean": 4891.2, |
| "valid_targets_min": 3804 |
| }, |
| { |
| "epoch": 5.289169295478444, |
| "grad_norm": 0.35942813155955783, |
| "learning_rate": 6.856012344739138e-06, |
| "loss": 0.0743, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06715020537376404, |
| "step": 5030, |
| "valid_targets_mean": 3792.2, |
| "valid_targets_min": 1864 |
| }, |
| { |
| "epoch": 5.294426919032597, |
| "grad_norm": 0.5721295114760007, |
| "learning_rate": 6.816533765605144e-06, |
| "loss": 0.0936, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1071794256567955, |
| "step": 5035, |
| "valid_targets_mean": 1649.4, |
| "valid_targets_min": 203 |
| }, |
| { |
| "epoch": 5.299684542586751, |
| "grad_norm": 0.36871543590956724, |
| "learning_rate": 6.7771458161575685e-06, |
| "loss": 0.0779, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0813429206609726, |
| "step": 5040, |
| "valid_targets_mean": 3947.8, |
| "valid_targets_min": 2443 |
| }, |
| { |
| "epoch": 5.304942166140904, |
| "grad_norm": 0.5173666859681757, |
| "learning_rate": 6.737848767168709e-06, |
| "loss": 0.0888, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08036038279533386, |
| "step": 5045, |
| "valid_targets_mean": 1698.5, |
| "valid_targets_min": 716 |
| }, |
| { |
| "epoch": 5.310199789695058, |
| "grad_norm": 0.44656650764418876, |
| "learning_rate": 6.698642888785965e-06, |
| "loss": 0.0619, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06723786890506744, |
| "step": 5050, |
| "valid_targets_mean": 3700.4, |
| "valid_targets_min": 905 |
| }, |
| { |
| "epoch": 5.315457413249211, |
| "grad_norm": 0.5734786496911749, |
| "learning_rate": 6.659528450530006e-06, |
| "loss": 0.0816, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08682894706726074, |
| "step": 5055, |
| "valid_targets_mean": 2566.2, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 5.320715036803365, |
| "grad_norm": 0.41141747921359295, |
| "learning_rate": 6.6205057212928755e-06, |
| "loss": 0.0762, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06644845008850098, |
| "step": 5060, |
| "valid_targets_mean": 3215.8, |
| "valid_targets_min": 1584 |
| }, |
| { |
| "epoch": 5.325972660357518, |
| "grad_norm": 0.525125144293566, |
| "learning_rate": 6.5815749693361645e-06, |
| "loss": 0.0672, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0902470201253891, |
| "step": 5065, |
| "valid_targets_mean": 2246.6, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 5.331230283911672, |
| "grad_norm": 0.5065649776077946, |
| "learning_rate": 6.542736462289188e-06, |
| "loss": 0.074, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08061222732067108, |
| "step": 5070, |
| "valid_targets_mean": 2176.4, |
| "valid_targets_min": 560 |
| }, |
| { |
| "epoch": 5.336487907465825, |
| "grad_norm": 0.5109118931177348, |
| "learning_rate": 6.503990467147101e-06, |
| "loss": 0.0767, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08474268764257431, |
| "step": 5075, |
| "valid_targets_mean": 2364.9, |
| "valid_targets_min": 613 |
| }, |
| { |
| "epoch": 5.341745531019979, |
| "grad_norm": 0.4081072934025734, |
| "learning_rate": 6.465337250269086e-06, |
| "loss": 0.0902, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07859212905168533, |
| "step": 5080, |
| "valid_targets_mean": 3067.3, |
| "valid_targets_min": 958 |
| }, |
| { |
| "epoch": 5.347003154574132, |
| "grad_norm": 0.45584852013478594, |
| "learning_rate": 6.426777077376538e-06, |
| "loss": 0.073, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07042613625526428, |
| "step": 5085, |
| "valid_targets_mean": 2553.5, |
| "valid_targets_min": 719 |
| }, |
| { |
| "epoch": 5.352260778128286, |
| "grad_norm": 0.51992474024479, |
| "learning_rate": 6.388310213551223e-06, |
| "loss": 0.0888, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07838479429483414, |
| "step": 5090, |
| "valid_targets_mean": 2510.1, |
| "valid_targets_min": 759 |
| }, |
| { |
| "epoch": 5.357518401682439, |
| "grad_norm": 0.7533992295551967, |
| "learning_rate": 6.349936923233422e-06, |
| "loss": 0.0938, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13972869515419006, |
| "step": 5095, |
| "valid_targets_mean": 1322.8, |
| "valid_targets_min": 521 |
| }, |
| { |
| "epoch": 5.3627760252365935, |
| "grad_norm": 0.5026457931348792, |
| "learning_rate": 6.311657470220178e-06, |
| "loss": 0.0765, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08562415838241577, |
| "step": 5100, |
| "valid_targets_mean": 3135.9, |
| "valid_targets_min": 729 |
| }, |
| { |
| "epoch": 5.368033648790747, |
| "grad_norm": 0.34054178945958086, |
| "learning_rate": 6.273472117663446e-06, |
| "loss": 0.0636, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.050133928656578064, |
| "step": 5105, |
| "valid_targets_mean": 3760.6, |
| "valid_targets_min": 2741 |
| }, |
| { |
| "epoch": 5.3732912723449004, |
| "grad_norm": 0.3885091004231832, |
| "learning_rate": 6.2353811280682715e-06, |
| "loss": 0.0734, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06262253224849701, |
| "step": 5110, |
| "valid_targets_mean": 2938.2, |
| "valid_targets_min": 927 |
| }, |
| { |
| "epoch": 5.378548895899054, |
| "grad_norm": 0.43692980379618307, |
| "learning_rate": 6.19738476329101e-06, |
| "loss": 0.1007, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07717005908489227, |
| "step": 5115, |
| "valid_targets_mean": 2925.2, |
| "valid_targets_min": 935 |
| }, |
| { |
| "epoch": 5.383806519453207, |
| "grad_norm": 0.35315279628559126, |
| "learning_rate": 6.159483284537533e-06, |
| "loss": 0.0608, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.050791092216968536, |
| "step": 5120, |
| "valid_targets_mean": 2759.2, |
| "valid_targets_min": 647 |
| }, |
| { |
| "epoch": 5.389064143007361, |
| "grad_norm": 0.3608958409269021, |
| "learning_rate": 6.121676952361395e-06, |
| "loss": 0.0771, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06702587008476257, |
| "step": 5125, |
| "valid_targets_mean": 5071.6, |
| "valid_targets_min": 976 |
| }, |
| { |
| "epoch": 5.394321766561514, |
| "grad_norm": 0.35183119939495017, |
| "learning_rate": 6.083966026662076e-06, |
| "loss": 0.0714, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06202121078968048, |
| "step": 5130, |
| "valid_targets_mean": 4252.0, |
| "valid_targets_min": 484 |
| }, |
| { |
| "epoch": 5.399579390115668, |
| "grad_norm": 0.3261126309681644, |
| "learning_rate": 6.046350766683194e-06, |
| "loss": 0.0605, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.05470889061689377, |
| "step": 5135, |
| "valid_targets_mean": 4528.9, |
| "valid_targets_min": 949 |
| }, |
| { |
| "epoch": 5.404837013669821, |
| "grad_norm": 0.4954119712097256, |
| "learning_rate": 6.0088314310107e-06, |
| "loss": 0.0822, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10348522663116455, |
| "step": 5140, |
| "valid_targets_mean": 4286.2, |
| "valid_targets_min": 2724 |
| }, |
| { |
| "epoch": 5.410094637223975, |
| "grad_norm": 0.36103261045653023, |
| "learning_rate": 5.9714082775711115e-06, |
| "loss": 0.0664, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0526675209403038, |
| "step": 5145, |
| "valid_targets_mean": 3200.5, |
| "valid_targets_min": 424 |
| }, |
| { |
| "epoch": 5.415352260778128, |
| "grad_norm": 0.4368982987072569, |
| "learning_rate": 5.934081563629764e-06, |
| "loss": 0.0968, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06551353633403778, |
| "step": 5150, |
| "valid_targets_mean": 2660.9, |
| "valid_targets_min": 531 |
| }, |
| { |
| "epoch": 5.420609884332282, |
| "grad_norm": 0.3548086350431451, |
| "learning_rate": 5.896851545788987e-06, |
| "loss": 0.0934, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06340889632701874, |
| "step": 5155, |
| "valid_targets_mean": 2755.6, |
| "valid_targets_min": 616 |
| }, |
| { |
| "epoch": 5.425867507886435, |
| "grad_norm": 0.4171249629888677, |
| "learning_rate": 5.859718479986407e-06, |
| "loss": 0.0622, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0826362669467926, |
| "step": 5160, |
| "valid_targets_mean": 2762.3, |
| "valid_targets_min": 602 |
| }, |
| { |
| "epoch": 5.431125131440589, |
| "grad_norm": 0.4571193577823833, |
| "learning_rate": 5.822682621493132e-06, |
| "loss": 0.0882, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06665949523448944, |
| "step": 5165, |
| "valid_targets_mean": 3793.9, |
| "valid_targets_min": 1251 |
| }, |
| { |
| "epoch": 5.436382754994742, |
| "grad_norm": 0.4117689522523735, |
| "learning_rate": 5.7857442249120155e-06, |
| "loss": 0.0711, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06694171577692032, |
| "step": 5170, |
| "valid_targets_mean": 2517.1, |
| "valid_targets_min": 596 |
| }, |
| { |
| "epoch": 5.441640378548896, |
| "grad_norm": 0.5627606235847757, |
| "learning_rate": 5.748903544175934e-06, |
| "loss": 0.0777, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08376845717430115, |
| "step": 5175, |
| "valid_targets_mean": 1704.4, |
| "valid_targets_min": 595 |
| }, |
| { |
| "epoch": 5.446898002103049, |
| "grad_norm": 0.6092775010665742, |
| "learning_rate": 5.712160832545992e-06, |
| "loss": 0.0927, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11150792986154556, |
| "step": 5180, |
| "valid_targets_mean": 1854.3, |
| "valid_targets_min": 520 |
| }, |
| { |
| "epoch": 5.452155625657203, |
| "grad_norm": 0.4168724812857841, |
| "learning_rate": 5.675516342609811e-06, |
| "loss": 0.1011, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07382281869649887, |
| "step": 5185, |
| "valid_targets_mean": 2596.6, |
| "valid_targets_min": 593 |
| }, |
| { |
| "epoch": 5.457413249211356, |
| "grad_norm": 0.4600180348961421, |
| "learning_rate": 5.638970326279802e-06, |
| "loss": 0.076, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.05095517262816429, |
| "step": 5190, |
| "valid_targets_mean": 3657.7, |
| "valid_targets_min": 647 |
| }, |
| { |
| "epoch": 5.46267087276551, |
| "grad_norm": 0.4572683288643564, |
| "learning_rate": 5.602523034791407e-06, |
| "loss": 0.0786, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07281236350536346, |
| "step": 5195, |
| "valid_targets_mean": 2984.0, |
| "valid_targets_min": 676 |
| }, |
| { |
| "epoch": 5.467928496319663, |
| "grad_norm": 0.5275783021604797, |
| "learning_rate": 5.566174718701378e-06, |
| "loss": 0.0702, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07366063445806503, |
| "step": 5200, |
| "valid_targets_mean": 2498.0, |
| "valid_targets_min": 616 |
| }, |
| { |
| "epoch": 5.473186119873817, |
| "grad_norm": 0.4582123770578222, |
| "learning_rate": 5.529925627886079e-06, |
| "loss": 0.0694, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06654085218906403, |
| "step": 5205, |
| "valid_targets_mean": 2706.7, |
| "valid_targets_min": 541 |
| }, |
| { |
| "epoch": 5.47844374342797, |
| "grad_norm": 0.8097632886957944, |
| "learning_rate": 5.493776011539749e-06, |
| "loss": 0.067, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09758926928043365, |
| "step": 5210, |
| "valid_targets_mean": 1267.9, |
| "valid_targets_min": 598 |
| }, |
| { |
| "epoch": 5.483701366982124, |
| "grad_norm": 0.44272409947549385, |
| "learning_rate": 5.457726118172761e-06, |
| "loss": 0.0812, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06550884991884232, |
| "step": 5215, |
| "valid_targets_mean": 3047.2, |
| "valid_targets_min": 756 |
| }, |
| { |
| "epoch": 5.488958990536277, |
| "grad_norm": 0.4764468537489189, |
| "learning_rate": 5.421776195609982e-06, |
| "loss": 0.066, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07326117157936096, |
| "step": 5220, |
| "valid_targets_mean": 2821.1, |
| "valid_targets_min": 680 |
| }, |
| { |
| "epoch": 5.494216614090431, |
| "grad_norm": 0.4021561108212554, |
| "learning_rate": 5.385926490989e-06, |
| "loss": 0.0664, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06522674858570099, |
| "step": 5225, |
| "valid_targets_mean": 3039.8, |
| "valid_targets_min": 774 |
| }, |
| { |
| "epoch": 5.499474237644584, |
| "grad_norm": 0.523663617725543, |
| "learning_rate": 5.350177250758479e-06, |
| "loss": 0.0816, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08613230288028717, |
| "step": 5230, |
| "valid_targets_mean": 4018.3, |
| "valid_targets_min": 1474 |
| }, |
| { |
| "epoch": 5.504731861198739, |
| "grad_norm": 0.28324475517994413, |
| "learning_rate": 5.314528720676424e-06, |
| "loss": 0.0631, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.04647863283753395, |
| "step": 5235, |
| "valid_targets_mean": 5695.4, |
| "valid_targets_min": 3677 |
| }, |
| { |
| "epoch": 5.509989484752892, |
| "grad_norm": 0.42248417809857786, |
| "learning_rate": 5.2789811458085085e-06, |
| "loss": 0.0684, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06635622680187225, |
| "step": 5240, |
| "valid_targets_mean": 2872.4, |
| "valid_targets_min": 675 |
| }, |
| { |
| "epoch": 5.515247108307046, |
| "grad_norm": 0.36562751871981114, |
| "learning_rate": 5.243534770526404e-06, |
| "loss": 0.0656, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06769625842571259, |
| "step": 5245, |
| "valid_targets_mean": 3971.9, |
| "valid_targets_min": 795 |
| }, |
| { |
| "epoch": 5.520504731861199, |
| "grad_norm": 0.5223514205188766, |
| "learning_rate": 5.208189838506074e-06, |
| "loss": 0.1677, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18373407423496246, |
| "step": 5250, |
| "valid_targets_mean": 2743.6, |
| "valid_targets_min": 605 |
| }, |
| { |
| "epoch": 5.5257623554153525, |
| "grad_norm": 0.3611828476769945, |
| "learning_rate": 5.172946592726109e-06, |
| "loss": 0.0647, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.060649264603853226, |
| "step": 5255, |
| "valid_targets_mean": 3250.8, |
| "valid_targets_min": 941 |
| }, |
| { |
| "epoch": 5.531019978969506, |
| "grad_norm": 0.43785332717968023, |
| "learning_rate": 5.137805275466072e-06, |
| "loss": 0.0758, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06450430303812027, |
| "step": 5260, |
| "valid_targets_mean": 2529.4, |
| "valid_targets_min": 773 |
| }, |
| { |
| "epoch": 5.5362776025236595, |
| "grad_norm": 0.6422137444773365, |
| "learning_rate": 5.1027661283048036e-06, |
| "loss": 0.0954, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2036164253950119, |
| "step": 5265, |
| "valid_targets_mean": 2282.3, |
| "valid_targets_min": 955 |
| }, |
| { |
| "epoch": 5.541535226077813, |
| "grad_norm": 0.8927515312722403, |
| "learning_rate": 5.067829392118775e-06, |
| "loss": 0.1397, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1356879472732544, |
| "step": 5270, |
| "valid_targets_mean": 1554.4, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 5.5467928496319665, |
| "grad_norm": 0.7823867701884833, |
| "learning_rate": 5.03299530708045e-06, |
| "loss": 0.1331, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12987178564071655, |
| "step": 5275, |
| "valid_targets_mean": 1621.1, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 5.55205047318612, |
| "grad_norm": 0.7969129758197263, |
| "learning_rate": 4.998264112656617e-06, |
| "loss": 0.1254, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13153094053268433, |
| "step": 5280, |
| "valid_targets_mean": 1469.3, |
| "valid_targets_min": 714 |
| }, |
| { |
| "epoch": 5.5573080967402735, |
| "grad_norm": 0.7412478937421575, |
| "learning_rate": 4.963636047606712e-06, |
| "loss": 0.1239, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1237417683005333, |
| "step": 5285, |
| "valid_targets_mean": 1483.8, |
| "valid_targets_min": 615 |
| }, |
| { |
| "epoch": 5.562565720294427, |
| "grad_norm": 0.8946395840082104, |
| "learning_rate": 4.929111349981244e-06, |
| "loss": 0.1289, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12845805287361145, |
| "step": 5290, |
| "valid_targets_mean": 1436.4, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 5.5678233438485805, |
| "grad_norm": 0.8144822556388317, |
| "learning_rate": 4.894690257120114e-06, |
| "loss": 0.127, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14884218573570251, |
| "step": 5295, |
| "valid_targets_mean": 1576.6, |
| "valid_targets_min": 625 |
| }, |
| { |
| "epoch": 5.573080967402734, |
| "grad_norm": 0.761151170140929, |
| "learning_rate": 4.860373005650985e-06, |
| "loss": 0.1198, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11141712963581085, |
| "step": 5300, |
| "valid_targets_mean": 1417.9, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 5.578338590956887, |
| "grad_norm": 0.7780506070761738, |
| "learning_rate": 4.826159831487656e-06, |
| "loss": 0.1305, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20513752102851868, |
| "step": 5305, |
| "valid_targets_mean": 1609.2, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 5.583596214511041, |
| "grad_norm": 0.8088661347693589, |
| "learning_rate": 4.792050969828474e-06, |
| "loss": 0.1163, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1333039104938507, |
| "step": 5310, |
| "valid_targets_mean": 1623.3, |
| "valid_targets_min": 733 |
| }, |
| { |
| "epoch": 5.588853838065194, |
| "grad_norm": 0.8136376560184408, |
| "learning_rate": 4.758046655154664e-06, |
| "loss": 0.1261, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12402161955833435, |
| "step": 5315, |
| "valid_targets_mean": 1673.9, |
| "valid_targets_min": 835 |
| }, |
| { |
| "epoch": 5.594111461619348, |
| "grad_norm": 0.7883143282521403, |
| "learning_rate": 4.72414712122875e-06, |
| "loss": 0.1169, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11638303101062775, |
| "step": 5320, |
| "valid_targets_mean": 1542.9, |
| "valid_targets_min": 815 |
| }, |
| { |
| "epoch": 5.599369085173501, |
| "grad_norm": 0.808589877779708, |
| "learning_rate": 4.690352601092954e-06, |
| "loss": 0.1205, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11564275622367859, |
| "step": 5325, |
| "valid_targets_mean": 1620.6, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 5.604626708727655, |
| "grad_norm": 0.8277035785586666, |
| "learning_rate": 4.656663327067563e-06, |
| "loss": 0.1147, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10620623826980591, |
| "step": 5330, |
| "valid_targets_mean": 1417.6, |
| "valid_targets_min": 570 |
| }, |
| { |
| "epoch": 5.609884332281808, |
| "grad_norm": 0.7371391718872009, |
| "learning_rate": 4.623079530749355e-06, |
| "loss": 0.1068, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.104159876704216, |
| "step": 5335, |
| "valid_targets_mean": 1507.0, |
| "valid_targets_min": 548 |
| }, |
| { |
| "epoch": 5.615141955835962, |
| "grad_norm": 0.8279690788966232, |
| "learning_rate": 4.589601443010012e-06, |
| "loss": 0.1081, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10407021641731262, |
| "step": 5340, |
| "valid_targets_mean": 1278.8, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 5.620399579390115, |
| "grad_norm": 0.8866533143229981, |
| "learning_rate": 4.55622929399451e-06, |
| "loss": 0.1208, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13973957300186157, |
| "step": 5345, |
| "valid_targets_mean": 1824.2, |
| "valid_targets_min": 896 |
| }, |
| { |
| "epoch": 5.625657202944269, |
| "grad_norm": 0.8723904794701348, |
| "learning_rate": 4.522963313119564e-06, |
| "loss": 0.118, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11792799830436707, |
| "step": 5350, |
| "valid_targets_mean": 1513.9, |
| "valid_targets_min": 597 |
| }, |
| { |
| "epoch": 5.630914826498422, |
| "grad_norm": 0.7668798259158432, |
| "learning_rate": 4.48980372907202e-06, |
| "loss": 0.1203, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1086680144071579, |
| "step": 5355, |
| "valid_targets_mean": 1559.0, |
| "valid_targets_min": 706 |
| }, |
| { |
| "epoch": 5.636172450052577, |
| "grad_norm": 0.730780751238011, |
| "learning_rate": 4.456750769807303e-06, |
| "loss": 0.1198, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10303068906068802, |
| "step": 5360, |
| "valid_targets_mean": 1439.2, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 5.641430073606729, |
| "grad_norm": 0.7538778090731447, |
| "learning_rate": 4.4238046625478635e-06, |
| "loss": 0.1156, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10241428017616272, |
| "step": 5365, |
| "valid_targets_mean": 1424.6, |
| "valid_targets_min": 785 |
| }, |
| { |
| "epoch": 5.646687697160884, |
| "grad_norm": 0.8139457939152851, |
| "learning_rate": 4.390965633781579e-06, |
| "loss": 0.1204, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1071196049451828, |
| "step": 5370, |
| "valid_targets_mean": 1526.2, |
| "valid_targets_min": 617 |
| }, |
| { |
| "epoch": 5.651945320715037, |
| "grad_norm": 0.8797432185625972, |
| "learning_rate": 4.358233909260215e-06, |
| "loss": 0.1185, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11576948314905167, |
| "step": 5375, |
| "valid_targets_mean": 1218.8, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 5.657202944269191, |
| "grad_norm": 0.782319638339579, |
| "learning_rate": 4.3256097139978934e-06, |
| "loss": 0.1114, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11541301757097244, |
| "step": 5380, |
| "valid_targets_mean": 1642.6, |
| "valid_targets_min": 1184 |
| }, |
| { |
| "epoch": 5.662460567823344, |
| "grad_norm": 0.7941877596689658, |
| "learning_rate": 4.293093272269513e-06, |
| "loss": 0.107, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10624723881483078, |
| "step": 5385, |
| "valid_targets_mean": 1437.6, |
| "valid_targets_min": 774 |
| }, |
| { |
| "epoch": 5.667718191377498, |
| "grad_norm": 0.8360194376781426, |
| "learning_rate": 4.260684807609217e-06, |
| "loss": 0.1141, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12845048308372498, |
| "step": 5390, |
| "valid_targets_mean": 1799.9, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 5.672975814931651, |
| "grad_norm": 0.8534566702779152, |
| "learning_rate": 4.22838454280887e-06, |
| "loss": 0.1163, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12031950801610947, |
| "step": 5395, |
| "valid_targets_mean": 1542.4, |
| "valid_targets_min": 1004 |
| }, |
| { |
| "epoch": 5.678233438485805, |
| "grad_norm": 0.8647913690545027, |
| "learning_rate": 4.196192699916528e-06, |
| "loss": 0.1173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1266537308692932, |
| "step": 5400, |
| "valid_targets_mean": 1532.9, |
| "valid_targets_min": 803 |
| }, |
| { |
| "epoch": 5.683491062039958, |
| "grad_norm": 0.7853288032101916, |
| "learning_rate": 4.164109500234865e-06, |
| "loss": 0.1177, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10197249054908752, |
| "step": 5405, |
| "valid_targets_mean": 1341.6, |
| "valid_targets_min": 782 |
| }, |
| { |
| "epoch": 5.688748685594112, |
| "grad_norm": 0.7776379678897548, |
| "learning_rate": 4.1321351643197235e-06, |
| "loss": 0.1135, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1157107800245285, |
| "step": 5410, |
| "valid_targets_mean": 1656.5, |
| "valid_targets_min": 646 |
| }, |
| { |
| "epoch": 5.694006309148265, |
| "grad_norm": 0.8521608963513301, |
| "learning_rate": 4.100269911978549e-06, |
| "loss": 0.1166, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12401511520147324, |
| "step": 5415, |
| "valid_targets_mean": 1465.2, |
| "valid_targets_min": 591 |
| }, |
| { |
| "epoch": 5.699263932702419, |
| "grad_norm": 0.8537600043399772, |
| "learning_rate": 4.068513962268892e-06, |
| "loss": 0.1148, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14338678121566772, |
| "step": 5420, |
| "valid_targets_mean": 1781.1, |
| "valid_targets_min": 796 |
| }, |
| { |
| "epoch": 5.704521556256572, |
| "grad_norm": 0.7601025515799135, |
| "learning_rate": 4.036867533496895e-06, |
| "loss": 0.1061, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09701358526945114, |
| "step": 5425, |
| "valid_targets_mean": 1453.8, |
| "valid_targets_min": 848 |
| }, |
| { |
| "epoch": 5.709779179810726, |
| "grad_norm": 0.797638177971665, |
| "learning_rate": 4.00533084321582e-06, |
| "loss": 0.1111, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10164414346218109, |
| "step": 5430, |
| "valid_targets_mean": 1281.6, |
| "valid_targets_min": 665 |
| }, |
| { |
| "epoch": 5.715036803364879, |
| "grad_norm": 0.7429062760056755, |
| "learning_rate": 3.9739041082245114e-06, |
| "loss": 0.1039, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0835316926240921, |
| "step": 5435, |
| "valid_targets_mean": 1267.4, |
| "valid_targets_min": 640 |
| }, |
| { |
| "epoch": 5.720294426919033, |
| "grad_norm": 0.9547603862930152, |
| "learning_rate": 3.942587544565932e-06, |
| "loss": 0.1123, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1358034312725067, |
| "step": 5440, |
| "valid_targets_mean": 1699.9, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 5.725552050473186, |
| "grad_norm": 0.8214131940863713, |
| "learning_rate": 3.9113813675256816e-06, |
| "loss": 0.1093, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10168406367301941, |
| "step": 5445, |
| "valid_targets_mean": 1296.8, |
| "valid_targets_min": 724 |
| }, |
| { |
| "epoch": 5.7308096740273395, |
| "grad_norm": 0.9057829722158285, |
| "learning_rate": 3.8802857916305006e-06, |
| "loss": 0.1081, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1101183146238327, |
| "step": 5450, |
| "valid_targets_mean": 1328.3, |
| "valid_targets_min": 924 |
| }, |
| { |
| "epoch": 5.736067297581493, |
| "grad_norm": 0.9821323782217289, |
| "learning_rate": 3.849301030646797e-06, |
| "loss": 0.1129, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11183630675077438, |
| "step": 5455, |
| "valid_targets_mean": 1520.8, |
| "valid_targets_min": 773 |
| }, |
| { |
| "epoch": 5.7413249211356465, |
| "grad_norm": 1.0181874517708396, |
| "learning_rate": 3.818427297579186e-06, |
| "loss": 0.1092, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11038393527269363, |
| "step": 5460, |
| "valid_targets_mean": 1378.1, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 5.7465825446898, |
| "grad_norm": 0.839505968391763, |
| "learning_rate": 3.787664804669027e-06, |
| "loss": 0.1116, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09288961440324783, |
| "step": 5465, |
| "valid_targets_mean": 1174.9, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 5.7518401682439535, |
| "grad_norm": 0.8011801234265912, |
| "learning_rate": 3.7570137633929647e-06, |
| "loss": 0.11, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1223113015294075, |
| "step": 5470, |
| "valid_targets_mean": 1885.7, |
| "valid_targets_min": 634 |
| }, |
| { |
| "epoch": 5.757097791798107, |
| "grad_norm": 0.8833011436691228, |
| "learning_rate": 3.7264743844614424e-06, |
| "loss": 0.118, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12675189971923828, |
| "step": 5475, |
| "valid_targets_mean": 1791.7, |
| "valid_targets_min": 573 |
| }, |
| { |
| "epoch": 5.7623554153522605, |
| "grad_norm": 0.799115627466568, |
| "learning_rate": 3.6960468778173097e-06, |
| "loss": 0.1153, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12185445427894592, |
| "step": 5480, |
| "valid_targets_mean": 1866.8, |
| "valid_targets_min": 718 |
| }, |
| { |
| "epoch": 5.767613038906414, |
| "grad_norm": 0.7399390292716921, |
| "learning_rate": 3.665731452634347e-06, |
| "loss": 0.1151, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09636998176574707, |
| "step": 5485, |
| "valid_targets_mean": 1395.6, |
| "valid_targets_min": 841 |
| }, |
| { |
| "epoch": 5.7728706624605675, |
| "grad_norm": 0.8358972490536069, |
| "learning_rate": 3.6355283173158153e-06, |
| "loss": 0.1084, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10667166113853455, |
| "step": 5490, |
| "valid_targets_mean": 1506.6, |
| "valid_targets_min": 956 |
| }, |
| { |
| "epoch": 5.778128286014722, |
| "grad_norm": 0.8896797913260035, |
| "learning_rate": 3.6054376794930467e-06, |
| "loss": 0.1141, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11211952567100525, |
| "step": 5495, |
| "valid_targets_mean": 1253.3, |
| "valid_targets_min": 650 |
| }, |
| { |
| "epoch": 5.783385909568874, |
| "grad_norm": 0.7609384554857924, |
| "learning_rate": 3.5754597460240216e-06, |
| "loss": 0.1093, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1054326742887497, |
| "step": 5500, |
| "valid_targets_mean": 1461.0, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 5.788643533123029, |
| "grad_norm": 0.8486515544659494, |
| "learning_rate": 3.5455947229919185e-06, |
| "loss": 0.1026, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10305467247962952, |
| "step": 5505, |
| "valid_targets_mean": 1344.5, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 5.793901156677181, |
| "grad_norm": 0.9233269628204959, |
| "learning_rate": 3.515842815703716e-06, |
| "loss": 0.1044, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10098401457071304, |
| "step": 5510, |
| "valid_targets_mean": 1378.5, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 5.799158780231336, |
| "grad_norm": 0.9182835647399459, |
| "learning_rate": 3.4862042286887943e-06, |
| "loss": 0.1127, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11836811900138855, |
| "step": 5515, |
| "valid_targets_mean": 1498.6, |
| "valid_targets_min": 726 |
| }, |
| { |
| "epoch": 5.804416403785489, |
| "grad_norm": 1.0514207204129027, |
| "learning_rate": 3.456679165697494e-06, |
| "loss": 0.1184, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11834096908569336, |
| "step": 5520, |
| "valid_targets_mean": 1692.6, |
| "valid_targets_min": 669 |
| }, |
| { |
| "epoch": 5.809674027339643, |
| "grad_norm": 0.7672095834640549, |
| "learning_rate": 3.427267829699741e-06, |
| "loss": 0.1109, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09786675870418549, |
| "step": 5525, |
| "valid_targets_mean": 1561.1, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 5.814931650893796, |
| "grad_norm": 0.8156687422713675, |
| "learning_rate": 3.3979704228836586e-06, |
| "loss": 0.1081, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11254370212554932, |
| "step": 5530, |
| "valid_targets_mean": 1549.7, |
| "valid_targets_min": 736 |
| }, |
| { |
| "epoch": 5.82018927444795, |
| "grad_norm": 1.5149884126544182, |
| "learning_rate": 3.3687871466541424e-06, |
| "loss": 0.1176, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12426459044218063, |
| "step": 5535, |
| "valid_targets_mean": 1574.6, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 5.825446898002103, |
| "grad_norm": 0.8278558166237175, |
| "learning_rate": 3.339718201631521e-06, |
| "loss": 0.1069, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11466335505247116, |
| "step": 5540, |
| "valid_targets_mean": 1547.6, |
| "valid_targets_min": 753 |
| }, |
| { |
| "epoch": 5.830704521556257, |
| "grad_norm": 0.7886210142606758, |
| "learning_rate": 3.3107637876501352e-06, |
| "loss": 0.1098, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11021450161933899, |
| "step": 5545, |
| "valid_targets_mean": 1558.7, |
| "valid_targets_min": 809 |
| }, |
| { |
| "epoch": 5.83596214511041, |
| "grad_norm": 0.7843221578168094, |
| "learning_rate": 3.2819241037569838e-06, |
| "loss": 0.1102, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09781582653522491, |
| "step": 5550, |
| "valid_targets_mean": 1292.3, |
| "valid_targets_min": 698 |
| }, |
| { |
| "epoch": 5.841219768664564, |
| "grad_norm": 1.264177097958958, |
| "learning_rate": 3.253199348210372e-06, |
| "loss": 0.104, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11650004237890244, |
| "step": 5555, |
| "valid_targets_mean": 1500.9, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 5.846477392218717, |
| "grad_norm": 0.960507640171679, |
| "learning_rate": 3.2245897184785103e-06, |
| "loss": 0.11, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1276053637266159, |
| "step": 5560, |
| "valid_targets_mean": 1598.8, |
| "valid_targets_min": 733 |
| }, |
| { |
| "epoch": 5.851735015772871, |
| "grad_norm": 1.0285014351563064, |
| "learning_rate": 3.1960954112381825e-06, |
| "loss": 0.1164, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11357375979423523, |
| "step": 5565, |
| "valid_targets_mean": 1636.2, |
| "valid_targets_min": 907 |
| }, |
| { |
| "epoch": 5.856992639327024, |
| "grad_norm": 0.9389765089611094, |
| "learning_rate": 3.1677166223733934e-06, |
| "loss": 0.1064, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12928201258182526, |
| "step": 5570, |
| "valid_targets_mean": 1564.9, |
| "valid_targets_min": 898 |
| }, |
| { |
| "epoch": 5.862250262881178, |
| "grad_norm": 0.8243127375717243, |
| "learning_rate": 3.1394535469740273e-06, |
| "loss": 0.1119, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12254712730646133, |
| "step": 5575, |
| "valid_targets_mean": 1685.4, |
| "valid_targets_min": 1119 |
| }, |
| { |
| "epoch": 5.867507886435331, |
| "grad_norm": 7.250778834635482, |
| "learning_rate": 3.111306379334462e-06, |
| "loss": 0.1116, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11494173109531403, |
| "step": 5580, |
| "valid_targets_mean": 1480.4, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 5.872765509989485, |
| "grad_norm": 0.8450981184211277, |
| "learning_rate": 3.083275312952301e-06, |
| "loss": 0.1081, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11233916878700256, |
| "step": 5585, |
| "valid_targets_mean": 1457.9, |
| "valid_targets_min": 798 |
| }, |
| { |
| "epoch": 5.878023133543638, |
| "grad_norm": 0.8587719740924644, |
| "learning_rate": 3.055360540527006e-06, |
| "loss": 0.111, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09841004759073257, |
| "step": 5590, |
| "valid_targets_mean": 1237.5, |
| "valid_targets_min": 589 |
| }, |
| { |
| "epoch": 5.883280757097792, |
| "grad_norm": 0.8964996986405162, |
| "learning_rate": 3.0275622539585556e-06, |
| "loss": 0.1097, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09610142558813095, |
| "step": 5595, |
| "valid_targets_mean": 1234.1, |
| "valid_targets_min": 244 |
| }, |
| { |
| "epoch": 5.888538380651945, |
| "grad_norm": 0.8889742165626472, |
| "learning_rate": 2.999880644346165e-06, |
| "loss": 0.1142, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11000069975852966, |
| "step": 5600, |
| "valid_targets_mean": 1229.9, |
| "valid_targets_min": 641 |
| }, |
| { |
| "epoch": 5.893796004206099, |
| "grad_norm": 0.8053125075648936, |
| "learning_rate": 2.9723159019869597e-06, |
| "loss": 0.1055, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10099741816520691, |
| "step": 5605, |
| "valid_targets_mean": 1430.4, |
| "valid_targets_min": 585 |
| }, |
| { |
| "epoch": 5.899053627760252, |
| "grad_norm": 0.848686466603683, |
| "learning_rate": 2.9448682163746413e-06, |
| "loss": 0.1224, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12405399233102798, |
| "step": 5610, |
| "valid_targets_mean": 1902.6, |
| "valid_targets_min": 1156 |
| }, |
| { |
| "epoch": 5.904311251314406, |
| "grad_norm": 0.7842265180102828, |
| "learning_rate": 2.917537776198216e-06, |
| "loss": 0.111, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10859636962413788, |
| "step": 5615, |
| "valid_targets_mean": 1476.2, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 5.909568874868559, |
| "grad_norm": 0.8343349399625959, |
| "learning_rate": 2.8903247693406932e-06, |
| "loss": 0.117, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10311952233314514, |
| "step": 5620, |
| "valid_targets_mean": 1440.7, |
| "valid_targets_min": 672 |
| }, |
| { |
| "epoch": 5.914826498422713, |
| "grad_norm": 0.8544991628930565, |
| "learning_rate": 2.863229382877777e-06, |
| "loss": 0.1089, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11789187788963318, |
| "step": 5625, |
| "valid_targets_mean": 1651.1, |
| "valid_targets_min": 973 |
| }, |
| { |
| "epoch": 5.920084121976867, |
| "grad_norm": 1.0223544518034609, |
| "learning_rate": 2.8362518030765904e-06, |
| "loss": 0.1038, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10354115068912506, |
| "step": 5630, |
| "valid_targets_mean": 1404.6, |
| "valid_targets_min": 732 |
| }, |
| { |
| "epoch": 5.9253417455310196, |
| "grad_norm": 0.8746485467055685, |
| "learning_rate": 2.8093922153944065e-06, |
| "loss": 0.113, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1060469001531601, |
| "step": 5635, |
| "valid_targets_mean": 1414.5, |
| "valid_targets_min": 634 |
| }, |
| { |
| "epoch": 5.930599369085174, |
| "grad_norm": 0.8894607541492047, |
| "learning_rate": 2.782650804477347e-06, |
| "loss": 0.1096, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11496523767709732, |
| "step": 5640, |
| "valid_targets_mean": 1663.4, |
| "valid_targets_min": 905 |
| }, |
| { |
| "epoch": 5.9358569926393265, |
| "grad_norm": 1.1569714936611488, |
| "learning_rate": 2.7560277541591427e-06, |
| "loss": 0.107, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10737825930118561, |
| "step": 5645, |
| "valid_targets_mean": 1482.2, |
| "valid_targets_min": 596 |
| }, |
| { |
| "epoch": 5.941114616193481, |
| "grad_norm": 0.9910365409328719, |
| "learning_rate": 2.7295232474598445e-06, |
| "loss": 0.1116, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12495561689138412, |
| "step": 5650, |
| "valid_targets_mean": 1422.8, |
| "valid_targets_min": 687 |
| }, |
| { |
| "epoch": 5.946372239747634, |
| "grad_norm": 0.8406537552450949, |
| "learning_rate": 2.703137466584571e-06, |
| "loss": 0.1229, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11254848539829254, |
| "step": 5655, |
| "valid_targets_mean": 1684.7, |
| "valid_targets_min": 567 |
| }, |
| { |
| "epoch": 5.951629863301788, |
| "grad_norm": 0.7773746827781078, |
| "learning_rate": 2.6768705929222827e-06, |
| "loss": 0.1092, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11341319233179092, |
| "step": 5660, |
| "valid_targets_mean": 1780.8, |
| "valid_targets_min": 810 |
| }, |
| { |
| "epoch": 5.956887486855941, |
| "grad_norm": 0.9810693086020438, |
| "learning_rate": 2.6507228070444922e-06, |
| "loss": 0.1123, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1387912929058075, |
| "step": 5665, |
| "valid_targets_mean": 1872.5, |
| "valid_targets_min": 1047 |
| }, |
| { |
| "epoch": 5.962145110410095, |
| "grad_norm": 0.8049687560693292, |
| "learning_rate": 2.6246942887040416e-06, |
| "loss": 0.1055, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1077866181731224, |
| "step": 5670, |
| "valid_targets_mean": 1659.1, |
| "valid_targets_min": 829 |
| }, |
| { |
| "epoch": 5.967402733964248, |
| "grad_norm": 0.8121712245315897, |
| "learning_rate": 2.5987852168338922e-06, |
| "loss": 0.1036, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11688219010829926, |
| "step": 5675, |
| "valid_targets_mean": 1739.2, |
| "valid_targets_min": 1141 |
| }, |
| { |
| "epoch": 5.972660357518402, |
| "grad_norm": 0.8318369671861803, |
| "learning_rate": 2.5729957695458454e-06, |
| "loss": 0.1107, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10558823496103287, |
| "step": 5680, |
| "valid_targets_mean": 1412.8, |
| "valid_targets_min": 935 |
| }, |
| { |
| "epoch": 5.977917981072555, |
| "grad_norm": 0.8248283067340154, |
| "learning_rate": 2.5473261241293547e-06, |
| "loss": 0.1099, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.119807668030262, |
| "step": 5685, |
| "valid_targets_mean": 1618.1, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 5.983175604626709, |
| "grad_norm": 0.8107606296650032, |
| "learning_rate": 2.521776457050302e-06, |
| "loss": 0.1136, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10684174299240112, |
| "step": 5690, |
| "valid_targets_mean": 1520.9, |
| "valid_targets_min": 847 |
| }, |
| { |
| "epoch": 5.988433228180862, |
| "grad_norm": 0.7684078944413081, |
| "learning_rate": 2.4963469439497703e-06, |
| "loss": 0.1134, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11041624844074249, |
| "step": 5695, |
| "valid_targets_mean": 1646.8, |
| "valid_targets_min": 738 |
| }, |
| { |
| "epoch": 5.993690851735016, |
| "grad_norm": 0.9079673210746894, |
| "learning_rate": 2.4710377596428404e-06, |
| "loss": 0.11, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11681301891803741, |
| "step": 5700, |
| "valid_targets_mean": 1528.8, |
| "valid_targets_min": 594 |
| }, |
| { |
| "epoch": 5.998948475289169, |
| "grad_norm": 0.7796924099446964, |
| "learning_rate": 2.4458490781174084e-06, |
| "loss": 0.1113, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11313343793153763, |
| "step": 5705, |
| "valid_targets_mean": 1938.9, |
| "valid_targets_min": 918 |
| }, |
| { |
| "epoch": 6.004206098843323, |
| "grad_norm": 0.6164304564007929, |
| "learning_rate": 2.4207810725329583e-06, |
| "loss": 0.0977, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07638208568096161, |
| "step": 5710, |
| "valid_targets_mean": 2562.4, |
| "valid_targets_min": 543 |
| }, |
| { |
| "epoch": 6.009463722397476, |
| "grad_norm": 0.46766374672773636, |
| "learning_rate": 2.395833915219401e-06, |
| "loss": 0.0806, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06537511944770813, |
| "step": 5715, |
| "valid_targets_mean": 3733.2, |
| "valid_targets_min": 2731 |
| }, |
| { |
| "epoch": 6.01472134595163, |
| "grad_norm": 0.417678420585131, |
| "learning_rate": 2.3710077776758713e-06, |
| "loss": 0.0731, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0560794472694397, |
| "step": 5720, |
| "valid_targets_mean": 3446.4, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 6.019978969505783, |
| "grad_norm": 0.500173322201823, |
| "learning_rate": 2.3463028305695447e-06, |
| "loss": 0.0876, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08729185163974762, |
| "step": 5725, |
| "valid_targets_mean": 3481.1, |
| "valid_targets_min": 1095 |
| }, |
| { |
| "epoch": 6.025236593059937, |
| "grad_norm": 0.4973920654135491, |
| "learning_rate": 2.3217192437344925e-06, |
| "loss": 0.0713, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08152356743812561, |
| "step": 5730, |
| "valid_targets_mean": 2304.1, |
| "valid_targets_min": 560 |
| }, |
| { |
| "epoch": 6.03049421661409, |
| "grad_norm": 0.48505242955633593, |
| "learning_rate": 2.2972571861704784e-06, |
| "loss": 0.0748, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08020097762346268, |
| "step": 5735, |
| "valid_targets_mean": 2921.5, |
| "valid_targets_min": 806 |
| }, |
| { |
| "epoch": 6.035751840168244, |
| "grad_norm": 0.7443459360769227, |
| "learning_rate": 2.2729168260418224e-06, |
| "loss": 0.1273, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13294632732868195, |
| "step": 5740, |
| "valid_targets_mean": 1657.2, |
| "valid_targets_min": 650 |
| }, |
| { |
| "epoch": 6.041009463722397, |
| "grad_norm": 0.41999144975528696, |
| "learning_rate": 2.2486983306762332e-06, |
| "loss": 0.0737, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07060514390468597, |
| "step": 5745, |
| "valid_targets_mean": 3432.3, |
| "valid_targets_min": 1037 |
| }, |
| { |
| "epoch": 6.046267087276551, |
| "grad_norm": 0.5465591943922049, |
| "learning_rate": 2.224601866563665e-06, |
| "loss": 0.0943, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12094777822494507, |
| "step": 5750, |
| "valid_targets_mean": 2068.1, |
| "valid_targets_min": 859 |
| }, |
| { |
| "epoch": 6.051524710830704, |
| "grad_norm": 0.5008681047165554, |
| "learning_rate": 2.2006275993551563e-06, |
| "loss": 0.0942, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.04573003202676773, |
| "step": 5755, |
| "valid_targets_mean": 5273.1, |
| "valid_targets_min": 3285 |
| }, |
| { |
| "epoch": 6.056782334384858, |
| "grad_norm": 0.41245881830042963, |
| "learning_rate": 2.176775693861719e-06, |
| "loss": 0.0678, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06577026844024658, |
| "step": 5760, |
| "valid_targets_mean": 3644.8, |
| "valid_targets_min": 502 |
| }, |
| { |
| "epoch": 6.062039957939011, |
| "grad_norm": 0.41283288274139973, |
| "learning_rate": 2.1530463140531886e-06, |
| "loss": 0.0742, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07683008909225464, |
| "step": 5765, |
| "valid_targets_mean": 3477.0, |
| "valid_targets_min": 600 |
| }, |
| { |
| "epoch": 6.067297581493165, |
| "grad_norm": 0.4876567921617298, |
| "learning_rate": 2.129439623057077e-06, |
| "loss": 0.0729, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07183055579662323, |
| "step": 5770, |
| "valid_targets_mean": 2120.4, |
| "valid_targets_min": 492 |
| }, |
| { |
| "epoch": 6.072555205047319, |
| "grad_norm": 0.3507456966673695, |
| "learning_rate": 2.105955783157498e-06, |
| "loss": 0.105, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.05326332896947861, |
| "step": 5775, |
| "valid_targets_mean": 4264.1, |
| "valid_targets_min": 1961 |
| }, |
| { |
| "epoch": 6.0778128286014725, |
| "grad_norm": 0.3481507279931147, |
| "learning_rate": 2.0825949557940174e-06, |
| "loss": 0.0677, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06237358599901199, |
| "step": 5780, |
| "valid_targets_mean": 3787.4, |
| "valid_targets_min": 1822 |
| }, |
| { |
| "epoch": 6.083070452155626, |
| "grad_norm": 0.49442891947849943, |
| "learning_rate": 2.059357301560547e-06, |
| "loss": 0.0757, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06717673689126968, |
| "step": 5785, |
| "valid_targets_mean": 2376.2, |
| "valid_targets_min": 644 |
| }, |
| { |
| "epoch": 6.0883280757097795, |
| "grad_norm": 0.4078173248116549, |
| "learning_rate": 2.036242980204244e-06, |
| "loss": 0.062, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06533263623714447, |
| "step": 5790, |
| "valid_targets_mean": 2907.6, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 6.093585699263933, |
| "grad_norm": 0.6665405987602719, |
| "learning_rate": 2.0132521506244294e-06, |
| "loss": 0.0809, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08121780306100845, |
| "step": 5795, |
| "valid_targets_mean": 1197.8, |
| "valid_targets_min": 515 |
| }, |
| { |
| "epoch": 6.0988433228180865, |
| "grad_norm": 0.37854485203567, |
| "learning_rate": 1.9903849708714664e-06, |
| "loss": 0.0783, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06120346114039421, |
| "step": 5800, |
| "valid_targets_mean": 2553.1, |
| "valid_targets_min": 589 |
| }, |
| { |
| "epoch": 6.10410094637224, |
| "grad_norm": 0.5119318289182734, |
| "learning_rate": 1.967641598145684e-06, |
| "loss": 0.0854, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09212484955787659, |
| "step": 5805, |
| "valid_targets_mean": 3193.4, |
| "valid_targets_min": 1086 |
| }, |
| { |
| "epoch": 6.1093585699263935, |
| "grad_norm": 0.43967340509014186, |
| "learning_rate": 1.9450221887963194e-06, |
| "loss": 0.0833, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1033715009689331, |
| "step": 5810, |
| "valid_targets_mean": 3228.1, |
| "valid_targets_min": 1341 |
| }, |
| { |
| "epoch": 6.114616193480547, |
| "grad_norm": 0.4623742678519191, |
| "learning_rate": 1.922526898320407e-06, |
| "loss": 0.1118, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07212347537279129, |
| "step": 5815, |
| "valid_targets_mean": 3338.1, |
| "valid_targets_min": 714 |
| }, |
| { |
| "epoch": 6.1198738170347005, |
| "grad_norm": 0.4299499990472975, |
| "learning_rate": 1.900155881361727e-06, |
| "loss": 0.0671, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06847988814115524, |
| "step": 5820, |
| "valid_targets_mean": 3436.3, |
| "valid_targets_min": 669 |
| }, |
| { |
| "epoch": 6.125131440588854, |
| "grad_norm": 1.8445362617170389, |
| "learning_rate": 1.8779092917097564e-06, |
| "loss": 0.084, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10603557527065277, |
| "step": 5825, |
| "valid_targets_mean": 1240.5, |
| "valid_targets_min": 598 |
| }, |
| { |
| "epoch": 6.130389064143007, |
| "grad_norm": 0.7026706550906237, |
| "learning_rate": 1.85578728229858e-06, |
| "loss": 0.0981, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10679394751787186, |
| "step": 5830, |
| "valid_targets_mean": 1436.1, |
| "valid_targets_min": 323 |
| }, |
| { |
| "epoch": 6.135646687697161, |
| "grad_norm": 0.4408363531107394, |
| "learning_rate": 1.8337900052058732e-06, |
| "loss": 0.0838, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07777391374111176, |
| "step": 5835, |
| "valid_targets_mean": 3868.8, |
| "valid_targets_min": 2827 |
| }, |
| { |
| "epoch": 6.140904311251314, |
| "grad_norm": 0.50844572178296, |
| "learning_rate": 1.811917611651821e-06, |
| "loss": 0.1296, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19302478432655334, |
| "step": 5840, |
| "valid_targets_mean": 3063.6, |
| "valid_targets_min": 900 |
| }, |
| { |
| "epoch": 6.146161934805468, |
| "grad_norm": 0.44923524554562805, |
| "learning_rate": 1.7901702519981068e-06, |
| "loss": 0.2161, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07664000988006592, |
| "step": 5845, |
| "valid_targets_mean": 3590.4, |
| "valid_targets_min": 1932 |
| }, |
| { |
| "epoch": 6.151419558359621, |
| "grad_norm": 0.5578137665626356, |
| "learning_rate": 1.7685480757468765e-06, |
| "loss": 0.09, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10205794870853424, |
| "step": 5850, |
| "valid_targets_mean": 2208.4, |
| "valid_targets_min": 820 |
| }, |
| { |
| "epoch": 6.156677181913775, |
| "grad_norm": 0.529644129513382, |
| "learning_rate": 1.7470512315396894e-06, |
| "loss": 0.0871, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12911146879196167, |
| "step": 5855, |
| "valid_targets_mean": 2673.4, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 6.161934805467928, |
| "grad_norm": 0.4326293192219862, |
| "learning_rate": 1.7256798671565111e-06, |
| "loss": 0.1593, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06629829853773117, |
| "step": 5860, |
| "valid_targets_mean": 4382.8, |
| "valid_targets_min": 2258 |
| }, |
| { |
| "epoch": 6.167192429022082, |
| "grad_norm": 0.5496191397710165, |
| "learning_rate": 1.7044341295147116e-06, |
| "loss": 0.0735, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1292692869901657, |
| "step": 5865, |
| "valid_targets_mean": 3836.1, |
| "valid_targets_min": 1142 |
| }, |
| { |
| "epoch": 6.172450052576235, |
| "grad_norm": 0.4353897412844269, |
| "learning_rate": 1.683314164668024e-06, |
| "loss": 0.0779, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08961884677410126, |
| "step": 5870, |
| "valid_targets_mean": 3908.0, |
| "valid_targets_min": 513 |
| }, |
| { |
| "epoch": 6.177707676130389, |
| "grad_norm": 0.3225554954630526, |
| "learning_rate": 1.6623201178055603e-06, |
| "loss": 0.0776, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.05820852890610695, |
| "step": 5875, |
| "valid_targets_mean": 3853.7, |
| "valid_targets_min": 1189 |
| }, |
| { |
| "epoch": 6.182965299684542, |
| "grad_norm": 0.3468714512725517, |
| "learning_rate": 1.6414521332508183e-06, |
| "loss": 0.0692, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0660017728805542, |
| "step": 5880, |
| "valid_targets_mean": 3941.4, |
| "valid_targets_min": 748 |
| }, |
| { |
| "epoch": 6.188222923238696, |
| "grad_norm": 0.43266553635121274, |
| "learning_rate": 1.6207103544606795e-06, |
| "loss": 0.0667, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07093233615159988, |
| "step": 5885, |
| "valid_targets_mean": 3278.1, |
| "valid_targets_min": 886 |
| }, |
| { |
| "epoch": 6.193480546792849, |
| "grad_norm": 0.5249482409449687, |
| "learning_rate": 1.6000949240244047e-06, |
| "loss": 0.0727, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08785708248615265, |
| "step": 5890, |
| "valid_targets_mean": 2903.9, |
| "valid_targets_min": 1939 |
| }, |
| { |
| "epoch": 6.198738170347003, |
| "grad_norm": 0.40365908187845856, |
| "learning_rate": 1.5796059836626998e-06, |
| "loss": 0.0603, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.061510659754276276, |
| "step": 5895, |
| "valid_targets_mean": 2530.4, |
| "valid_targets_min": 519 |
| }, |
| { |
| "epoch": 6.203995793901156, |
| "grad_norm": 0.5942504193604885, |
| "learning_rate": 1.5592436742267048e-06, |
| "loss": 0.1136, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.099820077419281, |
| "step": 5900, |
| "valid_targets_mean": 2007.8, |
| "valid_targets_min": 645 |
| }, |
| { |
| "epoch": 6.20925341745531, |
| "grad_norm": 0.43391116999315654, |
| "learning_rate": 1.5390081356970331e-06, |
| "loss": 0.0535, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.059852153062820435, |
| "step": 5905, |
| "valid_targets_mean": 2953.2, |
| "valid_targets_min": 472 |
| }, |
| { |
| "epoch": 6.214511041009464, |
| "grad_norm": 0.3870159740992711, |
| "learning_rate": 1.5188995071828117e-06, |
| "loss": 0.0632, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.058814555406570435, |
| "step": 5910, |
| "valid_targets_mean": 2605.6, |
| "valid_targets_min": 616 |
| }, |
| { |
| "epoch": 6.219768664563618, |
| "grad_norm": 0.39081230166828385, |
| "learning_rate": 1.498917926920731e-06, |
| "loss": 0.0618, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06334024667739868, |
| "step": 5915, |
| "valid_targets_mean": 4023.8, |
| "valid_targets_min": 2852 |
| }, |
| { |
| "epoch": 6.225026288117771, |
| "grad_norm": 0.45290694163216644, |
| "learning_rate": 1.4790635322740855e-06, |
| "loss": 0.0752, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12766267359256744, |
| "step": 5920, |
| "valid_targets_mean": 2697.2, |
| "valid_targets_min": 792 |
| }, |
| { |
| "epoch": 6.230283911671925, |
| "grad_norm": 0.39657851683572753, |
| "learning_rate": 1.4593364597318305e-06, |
| "loss": 0.0966, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06264358013868332, |
| "step": 5925, |
| "valid_targets_mean": 3389.0, |
| "valid_targets_min": 729 |
| }, |
| { |
| "epoch": 6.235541535226078, |
| "grad_norm": 0.5588729799355684, |
| "learning_rate": 1.4397368449076443e-06, |
| "loss": 0.093, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07792548835277557, |
| "step": 5930, |
| "valid_targets_mean": 1641.5, |
| "valid_targets_min": 612 |
| }, |
| { |
| "epoch": 6.240799158780232, |
| "grad_norm": 0.7245417171689901, |
| "learning_rate": 1.4202648225390103e-06, |
| "loss": 0.0771, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10067835450172424, |
| "step": 5935, |
| "valid_targets_mean": 1712.1, |
| "valid_targets_min": 664 |
| }, |
| { |
| "epoch": 6.246056782334385, |
| "grad_norm": 0.47810203140768753, |
| "learning_rate": 1.4009205264862646e-06, |
| "loss": 0.0853, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09814393520355225, |
| "step": 5940, |
| "valid_targets_mean": 2137.5, |
| "valid_targets_min": 747 |
| }, |
| { |
| "epoch": 6.251314405888539, |
| "grad_norm": 0.3851129988378668, |
| "learning_rate": 1.3817040897316903e-06, |
| "loss": 0.104, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06479619443416595, |
| "step": 5945, |
| "valid_targets_mean": 3752.8, |
| "valid_targets_min": 945 |
| }, |
| { |
| "epoch": 6.256572029442692, |
| "grad_norm": 0.44195473787918366, |
| "learning_rate": 1.362615644378611e-06, |
| "loss": 0.0769, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07227888703346252, |
| "step": 5950, |
| "valid_targets_mean": 3276.1, |
| "valid_targets_min": 840 |
| }, |
| { |
| "epoch": 6.261829652996846, |
| "grad_norm": 0.44124334261681175, |
| "learning_rate": 1.3436553216504721e-06, |
| "loss": 0.0911, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07587052881717682, |
| "step": 5955, |
| "valid_targets_mean": 3255.8, |
| "valid_targets_min": 755 |
| }, |
| { |
| "epoch": 6.267087276550999, |
| "grad_norm": 0.473734924760576, |
| "learning_rate": 1.324823251889924e-06, |
| "loss": 0.0765, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08050830662250519, |
| "step": 5960, |
| "valid_targets_mean": 1867.9, |
| "valid_targets_min": 485 |
| }, |
| { |
| "epoch": 6.2723449001051526, |
| "grad_norm": 0.46915276897607694, |
| "learning_rate": 1.3061195645579661e-06, |
| "loss": 0.07, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08968427777290344, |
| "step": 5965, |
| "valid_targets_mean": 2776.2, |
| "valid_targets_min": 605 |
| }, |
| { |
| "epoch": 6.277602523659306, |
| "grad_norm": 0.34860304064979913, |
| "learning_rate": 1.2875443882330218e-06, |
| "loss": 0.0688, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.055561311542987823, |
| "step": 5970, |
| "valid_targets_mean": 4657.1, |
| "valid_targets_min": 848 |
| }, |
| { |
| "epoch": 6.2828601472134595, |
| "grad_norm": 0.4563431302881125, |
| "learning_rate": 1.269097850610066e-06, |
| "loss": 0.0667, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06106171756982803, |
| "step": 5975, |
| "valid_targets_mean": 2842.2, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 6.288117770767613, |
| "grad_norm": 0.410608868406299, |
| "learning_rate": 1.250780078499747e-06, |
| "loss": 0.0691, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07612607628107071, |
| "step": 5980, |
| "valid_targets_mean": 3812.6, |
| "valid_targets_min": 905 |
| }, |
| { |
| "epoch": 6.2933753943217665, |
| "grad_norm": 0.48629069977992023, |
| "learning_rate": 1.2325911978275196e-06, |
| "loss": 0.0807, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10084628313779831, |
| "step": 5985, |
| "valid_targets_mean": 2703.1, |
| "valid_targets_min": 808 |
| }, |
| { |
| "epoch": 6.29863301787592, |
| "grad_norm": 0.43877735850713584, |
| "learning_rate": 1.214531333632769e-06, |
| "loss": 0.078, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08358561992645264, |
| "step": 5990, |
| "valid_targets_mean": 3409.4, |
| "valid_targets_min": 1814 |
| }, |
| { |
| "epoch": 6.3038906414300735, |
| "grad_norm": 0.5070722475094578, |
| "learning_rate": 1.1966006100679596e-06, |
| "loss": 0.0848, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09752842783927917, |
| "step": 5995, |
| "valid_targets_mean": 3388.2, |
| "valid_targets_min": 931 |
| }, |
| { |
| "epoch": 6.309148264984227, |
| "grad_norm": 0.3615555878918015, |
| "learning_rate": 1.1787991503977846e-06, |
| "loss": 0.0603, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06607545912265778, |
| "step": 6000, |
| "valid_targets_mean": 3544.8, |
| "valid_targets_min": 868 |
| }, |
| { |
| "epoch": 6.3144058885383805, |
| "grad_norm": 0.6105031898931423, |
| "learning_rate": 1.1611270769983051e-06, |
| "loss": 0.073, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08485215902328491, |
| "step": 6005, |
| "valid_targets_mean": 1959.2, |
| "valid_targets_min": 664 |
| }, |
| { |
| "epoch": 6.319663512092534, |
| "grad_norm": 0.4039326314081248, |
| "learning_rate": 1.143584511356115e-06, |
| "loss": 0.0755, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06285867094993591, |
| "step": 6010, |
| "valid_targets_mean": 3505.8, |
| "valid_targets_min": 1141 |
| }, |
| { |
| "epoch": 6.3249211356466875, |
| "grad_norm": 0.39878608005935273, |
| "learning_rate": 1.1261715740675205e-06, |
| "loss": 0.0581, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07127206772565842, |
| "step": 6015, |
| "valid_targets_mean": 3273.2, |
| "valid_targets_min": 1003 |
| }, |
| { |
| "epoch": 6.330178759200841, |
| "grad_norm": 0.34049728245840616, |
| "learning_rate": 1.108888384837683e-06, |
| "loss": 0.0709, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0528426356613636, |
| "step": 6020, |
| "valid_targets_mean": 3075.9, |
| "valid_targets_min": 531 |
| }, |
| { |
| "epoch": 6.335436382754994, |
| "grad_norm": 0.38543778229175274, |
| "learning_rate": 1.0917350624798262e-06, |
| "loss": 0.0711, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.059685684740543365, |
| "step": 6025, |
| "valid_targets_mean": 3199.6, |
| "valid_targets_min": 1003 |
| }, |
| { |
| "epoch": 6.340694006309148, |
| "grad_norm": 0.5866997736744608, |
| "learning_rate": 1.07471172491439e-06, |
| "loss": 0.0859, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06620640307664871, |
| "step": 6030, |
| "valid_targets_mean": 2010.4, |
| "valid_targets_min": 597 |
| }, |
| { |
| "epoch": 6.345951629863301, |
| "grad_norm": 0.4218366338287908, |
| "learning_rate": 1.0578184891682408e-06, |
| "loss": 0.07, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.05886366590857506, |
| "step": 6035, |
| "valid_targets_mean": 2575.9, |
| "valid_targets_min": 665 |
| }, |
| { |
| "epoch": 6.351209253417455, |
| "grad_norm": 0.514711264411394, |
| "learning_rate": 1.041055471373864e-06, |
| "loss": 0.0824, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06725460290908813, |
| "step": 6040, |
| "valid_targets_mean": 1814.0, |
| "valid_targets_min": 853 |
| }, |
| { |
| "epoch": 6.356466876971609, |
| "grad_norm": 0.4646177375237913, |
| "learning_rate": 1.0244227867685597e-06, |
| "loss": 0.0768, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09085972607135773, |
| "step": 6045, |
| "valid_targets_mean": 2043.7, |
| "valid_targets_min": 708 |
| }, |
| { |
| "epoch": 6.361724500525763, |
| "grad_norm": 0.5211840081964356, |
| "learning_rate": 1.0079205496936484e-06, |
| "loss": 0.0818, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07873266935348511, |
| "step": 6050, |
| "valid_targets_mean": 1978.1, |
| "valid_targets_min": 617 |
| }, |
| { |
| "epoch": 6.366982124079916, |
| "grad_norm": 0.4816633059927123, |
| "learning_rate": 9.915488735936995e-07, |
| "loss": 0.0665, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.04688303545117378, |
| "step": 6055, |
| "valid_targets_mean": 3022.0, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 6.37223974763407, |
| "grad_norm": 0.3997640765524085, |
| "learning_rate": 9.753078710157316e-07, |
| "loss": 0.0664, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.04926668107509613, |
| "step": 6060, |
| "valid_targets_mean": 3080.2, |
| "valid_targets_min": 785 |
| }, |
| { |
| "epoch": 6.377497371188223, |
| "grad_norm": 0.4935264978908819, |
| "learning_rate": 9.59197653608448e-07, |
| "loss": 0.0923, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07814300805330276, |
| "step": 6065, |
| "valid_targets_mean": 1886.2, |
| "valid_targets_min": 446 |
| }, |
| { |
| "epoch": 6.382754994742377, |
| "grad_norm": 0.43068276799584315, |
| "learning_rate": 9.432183321214805e-07, |
| "loss": 0.0619, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.05629979446530342, |
| "step": 6070, |
| "valid_targets_mean": 3074.6, |
| "valid_targets_min": 681 |
| }, |
| { |
| "epoch": 6.38801261829653, |
| "grad_norm": 0.5259671776588661, |
| "learning_rate": 9.273700164046162e-07, |
| "loss": 0.0692, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08238188922405243, |
| "step": 6075, |
| "valid_targets_mean": 3278.7, |
| "valid_targets_min": 555 |
| }, |
| { |
| "epoch": 6.393270241850684, |
| "grad_norm": 0.427123503344758, |
| "learning_rate": 9.11652815407027e-07, |
| "loss": 0.068, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06752338260412216, |
| "step": 6080, |
| "valid_targets_mean": 3133.0, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 6.398527865404837, |
| "grad_norm": 0.40238439200388754, |
| "learning_rate": 8.960668371765569e-07, |
| "loss": 0.0585, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.05478310585021973, |
| "step": 6085, |
| "valid_targets_mean": 4206.8, |
| "valid_targets_min": 861 |
| }, |
| { |
| "epoch": 6.403785488958991, |
| "grad_norm": 0.5012583322548877, |
| "learning_rate": 8.806121888589492e-07, |
| "loss": 0.0685, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09788995236158371, |
| "step": 6090, |
| "valid_targets_mean": 4073.1, |
| "valid_targets_min": 2020 |
| }, |
| { |
| "epoch": 6.409043112513144, |
| "grad_norm": 0.39678947745875487, |
| "learning_rate": 8.652889766971229e-07, |
| "loss": 0.0724, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06645464897155762, |
| "step": 6095, |
| "valid_targets_mean": 3804.0, |
| "valid_targets_min": 1286 |
| }, |
| { |
| "epoch": 6.414300736067298, |
| "grad_norm": 0.43888122503682775, |
| "learning_rate": 8.500973060304374e-07, |
| "loss": 0.0898, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06902484595775604, |
| "step": 6100, |
| "valid_targets_mean": 3684.8, |
| "valid_targets_min": 2652 |
| }, |
| { |
| "epoch": 6.419558359621451, |
| "grad_norm": 0.49679489392286674, |
| "learning_rate": 8.350372812939778e-07, |
| "loss": 0.0892, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17613235116004944, |
| "step": 6105, |
| "valid_targets_mean": 3169.3, |
| "valid_targets_min": 764 |
| }, |
| { |
| "epoch": 6.424815983175605, |
| "grad_norm": 0.4694097500119007, |
| "learning_rate": 8.201090060178174e-07, |
| "loss": 0.0545, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07272839546203613, |
| "step": 6110, |
| "valid_targets_mean": 2353.6, |
| "valid_targets_min": 815 |
| }, |
| { |
| "epoch": 6.430073606729758, |
| "grad_norm": 0.4012052378346957, |
| "learning_rate": 8.053125828263297e-07, |
| "loss": 0.0863, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06625877320766449, |
| "step": 6115, |
| "valid_targets_mean": 2968.9, |
| "valid_targets_min": 485 |
| }, |
| { |
| "epoch": 6.435331230283912, |
| "grad_norm": 0.41460384833810077, |
| "learning_rate": 7.906481134374688e-07, |
| "loss": 0.067, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07116558402776718, |
| "step": 6120, |
| "valid_targets_mean": 3372.6, |
| "valid_targets_min": 854 |
| }, |
| { |
| "epoch": 6.440588853838065, |
| "grad_norm": 0.3682859692923111, |
| "learning_rate": 7.761156986620677e-07, |
| "loss": 0.0692, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.05625065416097641, |
| "step": 6125, |
| "valid_targets_mean": 3453.6, |
| "valid_targets_min": 743 |
| }, |
| { |
| "epoch": 6.445846477392219, |
| "grad_norm": 0.5423126191787105, |
| "learning_rate": 7.617154384031545e-07, |
| "loss": 0.0817, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1128939837217331, |
| "step": 6130, |
| "valid_targets_mean": 2007.8, |
| "valid_targets_min": 706 |
| }, |
| { |
| "epoch": 6.451104100946372, |
| "grad_norm": 0.46939199450309627, |
| "learning_rate": 7.474474316552638e-07, |
| "loss": 0.1023, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11290473490953445, |
| "step": 6135, |
| "valid_targets_mean": 2666.4, |
| "valid_targets_min": 675 |
| }, |
| { |
| "epoch": 6.456361724500526, |
| "grad_norm": 0.4257556315893541, |
| "learning_rate": 7.33311776503749e-07, |
| "loss": 0.076, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06424092501401901, |
| "step": 6140, |
| "valid_targets_mean": 2688.8, |
| "valid_targets_min": 663 |
| }, |
| { |
| "epoch": 6.461619348054679, |
| "grad_norm": 0.5016569812225409, |
| "learning_rate": 7.193085701241175e-07, |
| "loss": 0.0697, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07148440927267075, |
| "step": 6145, |
| "valid_targets_mean": 1787.4, |
| "valid_targets_min": 716 |
| }, |
| { |
| "epoch": 6.466876971608833, |
| "grad_norm": 0.42124970042233406, |
| "learning_rate": 7.054379087813568e-07, |
| "loss": 0.0656, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06680235266685486, |
| "step": 6150, |
| "valid_targets_mean": 2952.1, |
| "valid_targets_min": 542 |
| }, |
| { |
| "epoch": 6.472134595162986, |
| "grad_norm": 0.5217817694518172, |
| "learning_rate": 6.916998878292691e-07, |
| "loss": 0.0662, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07147432863712311, |
| "step": 6155, |
| "valid_targets_mean": 2716.6, |
| "valid_targets_min": 798 |
| }, |
| { |
| "epoch": 6.4773922187171395, |
| "grad_norm": 0.42995310088464617, |
| "learning_rate": 6.780946017098289e-07, |
| "loss": 0.0564, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.05714268982410431, |
| "step": 6160, |
| "valid_targets_mean": 2416.6, |
| "valid_targets_min": 635 |
| }, |
| { |
| "epoch": 6.482649842271293, |
| "grad_norm": 0.38547395604382156, |
| "learning_rate": 6.646221439525225e-07, |
| "loss": 0.0816, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.052166279405355453, |
| "step": 6165, |
| "valid_targets_mean": 2784.3, |
| "valid_targets_min": 794 |
| }, |
| { |
| "epoch": 6.4879074658254465, |
| "grad_norm": 0.42723697077583656, |
| "learning_rate": 6.512826071737021e-07, |
| "loss": 0.0601, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0602586567401886, |
| "step": 6170, |
| "valid_targets_mean": 2285.6, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 6.4931650893796, |
| "grad_norm": 0.3949668820268369, |
| "learning_rate": 6.380760830759669e-07, |
| "loss": 0.0631, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0546693280339241, |
| "step": 6175, |
| "valid_targets_mean": 2570.1, |
| "valid_targets_min": 529 |
| }, |
| { |
| "epoch": 6.498422712933754, |
| "grad_norm": 0.528621393679054, |
| "learning_rate": 6.250026624475092e-07, |
| "loss": 0.0723, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08405116200447083, |
| "step": 6180, |
| "valid_targets_mean": 3507.9, |
| "valid_targets_min": 2017 |
| }, |
| { |
| "epoch": 6.503680336487907, |
| "grad_norm": 0.4242013145790033, |
| "learning_rate": 6.12062435161509e-07, |
| "loss": 0.0669, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06694699823856354, |
| "step": 6185, |
| "valid_targets_mean": 4252.3, |
| "valid_targets_min": 516 |
| }, |
| { |
| "epoch": 6.508937960042061, |
| "grad_norm": 0.422146737463763, |
| "learning_rate": 5.992554901755121e-07, |
| "loss": 0.0607, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06846270710229874, |
| "step": 6190, |
| "valid_targets_mean": 3945.1, |
| "valid_targets_min": 775 |
| }, |
| { |
| "epoch": 6.514195583596215, |
| "grad_norm": 0.3497829569971182, |
| "learning_rate": 5.865819155308039e-07, |
| "loss": 0.061, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.05343469977378845, |
| "step": 6195, |
| "valid_targets_mean": 3760.6, |
| "valid_targets_min": 605 |
| }, |
| { |
| "epoch": 6.519453207150368, |
| "grad_norm": 0.5797235114349107, |
| "learning_rate": 5.740417983518253e-07, |
| "loss": 0.1393, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22037141025066376, |
| "step": 6200, |
| "valid_targets_mean": 2532.4, |
| "valid_targets_min": 1132 |
| }, |
| { |
| "epoch": 6.524710830704522, |
| "grad_norm": 0.41241662391768236, |
| "learning_rate": 5.61635224845567e-07, |
| "loss": 0.0846, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06662846356630325, |
| "step": 6205, |
| "valid_targets_mean": 3141.9, |
| "valid_targets_min": 527 |
| }, |
| { |
| "epoch": 6.529968454258675, |
| "grad_norm": 0.4435464943863065, |
| "learning_rate": 5.493622803009602e-07, |
| "loss": 0.0701, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07728211581707001, |
| "step": 6210, |
| "valid_targets_mean": 3037.3, |
| "valid_targets_min": 717 |
| }, |
| { |
| "epoch": 6.535226077812829, |
| "grad_norm": 0.4556018124004852, |
| "learning_rate": 5.372230490883246e-07, |
| "loss": 0.0631, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08248764276504517, |
| "step": 6215, |
| "valid_targets_mean": 2589.2, |
| "valid_targets_min": 927 |
| }, |
| { |
| "epoch": 6.540483701366982, |
| "grad_norm": 1.0391530120290922, |
| "learning_rate": 5.252176146587484e-07, |
| "loss": 0.1451, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13617536425590515, |
| "step": 6220, |
| "valid_targets_mean": 1337.4, |
| "valid_targets_min": 788 |
| }, |
| { |
| "epoch": 6.545741324921136, |
| "grad_norm": 0.9024777771008466, |
| "learning_rate": 5.133460595435447e-07, |
| "loss": 0.1257, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1271430402994156, |
| "step": 6225, |
| "valid_targets_mean": 1537.9, |
| "valid_targets_min": 957 |
| }, |
| { |
| "epoch": 6.550998948475289, |
| "grad_norm": 0.8255851192829053, |
| "learning_rate": 5.016084653536756e-07, |
| "loss": 0.1173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11300574243068695, |
| "step": 6230, |
| "valid_targets_mean": 1543.2, |
| "valid_targets_min": 796 |
| }, |
| { |
| "epoch": 6.556256572029443, |
| "grad_norm": 0.9127780019947226, |
| "learning_rate": 4.900049127791851e-07, |
| "loss": 0.119, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11401323229074478, |
| "step": 6235, |
| "valid_targets_mean": 1313.4, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 6.561514195583596, |
| "grad_norm": 0.8621231993409767, |
| "learning_rate": 4.785354815886445e-07, |
| "loss": 0.1222, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12652909755706787, |
| "step": 6240, |
| "valid_targets_mean": 1616.7, |
| "valid_targets_min": 638 |
| }, |
| { |
| "epoch": 6.56677181913775, |
| "grad_norm": 0.8216649241251376, |
| "learning_rate": 4.6720025062862106e-07, |
| "loss": 0.117, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11938387155532837, |
| "step": 6245, |
| "valid_targets_mean": 1660.6, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 6.572029442691903, |
| "grad_norm": 0.7950842564244311, |
| "learning_rate": 4.559992978231087e-07, |
| "loss": 0.1207, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10059969872236252, |
| "step": 6250, |
| "valid_targets_mean": 1361.5, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 6.577287066246057, |
| "grad_norm": 0.953490690007579, |
| "learning_rate": 4.4493270017301305e-07, |
| "loss": 0.106, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10924120247364044, |
| "step": 6255, |
| "valid_targets_mean": 1297.8, |
| "valid_targets_min": 714 |
| }, |
| { |
| "epoch": 6.58254468980021, |
| "grad_norm": 0.8383747484138214, |
| "learning_rate": 4.340005337556186e-07, |
| "loss": 0.125, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10761392116546631, |
| "step": 6260, |
| "valid_targets_mean": 1455.5, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 6.587802313354364, |
| "grad_norm": 0.8864969920018051, |
| "learning_rate": 4.232028737240623e-07, |
| "loss": 0.1218, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1390361189842224, |
| "step": 6265, |
| "valid_targets_mean": 2029.8, |
| "valid_targets_min": 663 |
| }, |
| { |
| "epoch": 6.593059936908517, |
| "grad_norm": 0.8403407406375845, |
| "learning_rate": 4.125397943068099e-07, |
| "loss": 0.1125, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11463350802659988, |
| "step": 6270, |
| "valid_targets_mean": 1525.1, |
| "valid_targets_min": 632 |
| }, |
| { |
| "epoch": 6.598317560462671, |
| "grad_norm": 0.8038451990410529, |
| "learning_rate": 4.0201136880716027e-07, |
| "loss": 0.1148, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11841858923435211, |
| "step": 6275, |
| "valid_targets_mean": 1709.6, |
| "valid_targets_min": 933 |
| }, |
| { |
| "epoch": 6.603575184016824, |
| "grad_norm": 0.7406552759110029, |
| "learning_rate": 3.9161766960273517e-07, |
| "loss": 0.1107, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10862021893262863, |
| "step": 6280, |
| "valid_targets_mean": 1535.0, |
| "valid_targets_min": 717 |
| }, |
| { |
| "epoch": 6.608832807570978, |
| "grad_norm": 0.8355604084930968, |
| "learning_rate": 3.8135876814497927e-07, |
| "loss": 0.1019, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10400351881980896, |
| "step": 6285, |
| "valid_targets_mean": 1315.5, |
| "valid_targets_min": 659 |
| }, |
| { |
| "epoch": 6.614090431125131, |
| "grad_norm": 0.7473839058279116, |
| "learning_rate": 3.7123473495866314e-07, |
| "loss": 0.1031, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0965389534831047, |
| "step": 6290, |
| "valid_targets_mean": 1413.6, |
| "valid_targets_min": 642 |
| }, |
| { |
| "epoch": 6.619348054679285, |
| "grad_norm": 0.8089353150472339, |
| "learning_rate": 3.61245639641421e-07, |
| "loss": 0.1085, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09670595824718475, |
| "step": 6295, |
| "valid_targets_mean": 1340.9, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 6.624605678233438, |
| "grad_norm": 0.8494721770951325, |
| "learning_rate": 3.513915508632448e-07, |
| "loss": 0.1172, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11024098843336105, |
| "step": 6300, |
| "valid_targets_mean": 1332.8, |
| "valid_targets_min": 631 |
| }, |
| { |
| "epoch": 6.629863301787592, |
| "grad_norm": 0.9145610746631865, |
| "learning_rate": 3.4167253636602893e-07, |
| "loss": 0.1172, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12976564466953278, |
| "step": 6305, |
| "valid_targets_mean": 1548.9, |
| "valid_targets_min": 623 |
| }, |
| { |
| "epoch": 6.635120925341745, |
| "grad_norm": 0.9277244344400631, |
| "learning_rate": 3.3208866296310147e-07, |
| "loss": 0.1164, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14723122119903564, |
| "step": 6310, |
| "valid_targets_mean": 1934.2, |
| "valid_targets_min": 818 |
| }, |
| { |
| "epoch": 6.6403785488958995, |
| "grad_norm": 0.7804476643502358, |
| "learning_rate": 3.2263999653876057e-07, |
| "loss": 0.1112, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10922641307115555, |
| "step": 6315, |
| "valid_targets_mean": 1563.4, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 6.645636172450052, |
| "grad_norm": 0.9309290018859334, |
| "learning_rate": 3.133266020478254e-07, |
| "loss": 0.1145, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11758076399564743, |
| "step": 6320, |
| "valid_targets_mean": 1428.6, |
| "valid_targets_min": 623 |
| }, |
| { |
| "epoch": 6.6508937960042065, |
| "grad_norm": 0.8316290540735192, |
| "learning_rate": 3.0414854351519476e-07, |
| "loss": 0.1119, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10959136486053467, |
| "step": 6325, |
| "valid_targets_mean": 1461.2, |
| "valid_targets_min": 693 |
| }, |
| { |
| "epoch": 6.65615141955836, |
| "grad_norm": 0.7992447961300793, |
| "learning_rate": 2.951058840353893e-07, |
| "loss": 0.1066, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08690951019525528, |
| "step": 6330, |
| "valid_targets_mean": 1157.9, |
| "valid_targets_min": 611 |
| }, |
| { |
| "epoch": 6.6614090431125135, |
| "grad_norm": 0.8469780514634077, |
| "learning_rate": 2.861986857721388e-07, |
| "loss": 0.1041, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11049091815948486, |
| "step": 6335, |
| "valid_targets_mean": 1616.5, |
| "valid_targets_min": 793 |
| }, |
| { |
| "epoch": 6.666666666666667, |
| "grad_norm": 0.7656172435806277, |
| "learning_rate": 2.7742700995794457e-07, |
| "loss": 0.105, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1010306179523468, |
| "step": 6340, |
| "valid_targets_mean": 1568.1, |
| "valid_targets_min": 563 |
| }, |
| { |
| "epoch": 6.6719242902208205, |
| "grad_norm": 0.7499652961611943, |
| "learning_rate": 2.687909168936509e-07, |
| "loss": 0.1122, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09741789102554321, |
| "step": 6345, |
| "valid_targets_mean": 1546.9, |
| "valid_targets_min": 837 |
| }, |
| { |
| "epoch": 6.677181913774974, |
| "grad_norm": 0.9094834260723604, |
| "learning_rate": 2.6029046594805206e-07, |
| "loss": 0.1108, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11675611883401871, |
| "step": 6350, |
| "valid_targets_mean": 1719.1, |
| "valid_targets_min": 1107 |
| }, |
| { |
| "epoch": 6.682439537329127, |
| "grad_norm": 0.7992755914863992, |
| "learning_rate": 2.519257155574617e-07, |
| "loss": 0.1168, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11167339235544205, |
| "step": 6355, |
| "valid_targets_mean": 1550.2, |
| "valid_targets_min": 680 |
| }, |
| { |
| "epoch": 6.687697160883281, |
| "grad_norm": 0.833039863652094, |
| "learning_rate": 2.436967232253218e-07, |
| "loss": 0.1055, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11066915839910507, |
| "step": 6360, |
| "valid_targets_mean": 1599.1, |
| "valid_targets_min": 803 |
| }, |
| { |
| "epoch": 6.692954784437434, |
| "grad_norm": 0.8152613912404252, |
| "learning_rate": 2.3560354552180976e-07, |
| "loss": 0.1104, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1145564392209053, |
| "step": 6365, |
| "valid_targets_mean": 1565.1, |
| "valid_targets_min": 631 |
| }, |
| { |
| "epoch": 6.698212407991588, |
| "grad_norm": 0.8826844936828919, |
| "learning_rate": 2.27646238083441e-07, |
| "loss": 0.1056, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10912003368139267, |
| "step": 6370, |
| "valid_targets_mean": 1662.8, |
| "valid_targets_min": 804 |
| }, |
| { |
| "epoch": 6.703470031545741, |
| "grad_norm": 0.7901670710260023, |
| "learning_rate": 2.1982485561269805e-07, |
| "loss": 0.1101, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10317906737327576, |
| "step": 6375, |
| "valid_targets_mean": 1515.2, |
| "valid_targets_min": 675 |
| }, |
| { |
| "epoch": 6.708727655099895, |
| "grad_norm": 0.806571889012237, |
| "learning_rate": 2.1213945187763764e-07, |
| "loss": 0.1048, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11043962836265564, |
| "step": 6380, |
| "valid_targets_mean": 1305.0, |
| "valid_targets_min": 856 |
| }, |
| { |
| "epoch": 6.713985278654048, |
| "grad_norm": 0.7921722408367218, |
| "learning_rate": 2.0459007971154632e-07, |
| "loss": 0.1027, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1003451719880104, |
| "step": 6385, |
| "valid_targets_mean": 1516.9, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 6.719242902208202, |
| "grad_norm": 0.7841472689520302, |
| "learning_rate": 1.9717679101254549e-07, |
| "loss": 0.0966, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10266360640525818, |
| "step": 6390, |
| "valid_targets_mean": 1515.6, |
| "valid_targets_min": 678 |
| }, |
| { |
| "epoch": 6.724500525762355, |
| "grad_norm": 0.8819712887766852, |
| "learning_rate": 1.898996367432604e-07, |
| "loss": 0.1106, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11566631495952606, |
| "step": 6395, |
| "valid_targets_mean": 1387.8, |
| "valid_targets_min": 676 |
| }, |
| { |
| "epoch": 6.729758149316509, |
| "grad_norm": 0.714330087110787, |
| "learning_rate": 1.8275866693046263e-07, |
| "loss": 0.1019, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09523104131221771, |
| "step": 6400, |
| "valid_targets_mean": 1388.9, |
| "valid_targets_min": 794 |
| }, |
| { |
| "epoch": 6.735015772870662, |
| "grad_norm": 0.8191145281436136, |
| "learning_rate": 1.7575393066471714e-07, |
| "loss": 0.1077, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11150185763835907, |
| "step": 6405, |
| "valid_targets_mean": 1379.6, |
| "valid_targets_min": 607 |
| }, |
| { |
| "epoch": 6.740273396424816, |
| "grad_norm": 0.8136782878997603, |
| "learning_rate": 1.6888547610005802e-07, |
| "loss": 0.1047, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11300012469291687, |
| "step": 6410, |
| "valid_targets_mean": 1653.4, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 6.745531019978969, |
| "grad_norm": 0.8474510518856821, |
| "learning_rate": 1.6215335045364656e-07, |
| "loss": 0.1105, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11601246148347855, |
| "step": 6415, |
| "valid_targets_mean": 1650.9, |
| "valid_targets_min": 858 |
| }, |
| { |
| "epoch": 6.750788643533123, |
| "grad_norm": 0.8818199690616307, |
| "learning_rate": 1.5555760000545595e-07, |
| "loss": 0.1003, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11719954013824463, |
| "step": 6420, |
| "valid_targets_mean": 1565.1, |
| "valid_targets_min": 689 |
| }, |
| { |
| "epoch": 6.756046267087276, |
| "grad_norm": 0.8365195445720387, |
| "learning_rate": 1.4909827009794486e-07, |
| "loss": 0.1121, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10661862045526505, |
| "step": 6425, |
| "valid_targets_mean": 1414.7, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 6.76130389064143, |
| "grad_norm": 0.9421362155615107, |
| "learning_rate": 1.4277540513575328e-07, |
| "loss": 0.1122, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10590024292469025, |
| "step": 6430, |
| "valid_targets_mean": 1472.6, |
| "valid_targets_min": 828 |
| }, |
| { |
| "epoch": 6.766561514195583, |
| "grad_norm": 0.8292069355372615, |
| "learning_rate": 1.3658904858538936e-07, |
| "loss": 0.115, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10221198201179504, |
| "step": 6435, |
| "valid_targets_mean": 1424.0, |
| "valid_targets_min": 618 |
| }, |
| { |
| "epoch": 6.771819137749737, |
| "grad_norm": 0.784724325546131, |
| "learning_rate": 1.3053924297493858e-07, |
| "loss": 0.1027, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09747828543186188, |
| "step": 6440, |
| "valid_targets_mean": 1494.2, |
| "valid_targets_min": 629 |
| }, |
| { |
| "epoch": 6.77707676130389, |
| "grad_norm": 0.9526958247122579, |
| "learning_rate": 1.2462602989376404e-07, |
| "loss": 0.1086, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1333579123020172, |
| "step": 6445, |
| "valid_targets_mean": 1844.9, |
| "valid_targets_min": 1071 |
| }, |
| { |
| "epoch": 6.782334384858045, |
| "grad_norm": 0.8704294174376247, |
| "learning_rate": 1.1884944999222658e-07, |
| "loss": 0.1055, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10618209838867188, |
| "step": 6450, |
| "valid_targets_mean": 1349.2, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 6.787592008412197, |
| "grad_norm": 0.8123941812093172, |
| "learning_rate": 1.1320954298140063e-07, |
| "loss": 0.0982, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09121832996606827, |
| "step": 6455, |
| "valid_targets_mean": 1227.6, |
| "valid_targets_min": 679 |
| }, |
| { |
| "epoch": 6.792849631966352, |
| "grad_norm": 0.8082068436686528, |
| "learning_rate": 1.0770634763280552e-07, |
| "loss": 0.1, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10017645359039307, |
| "step": 6460, |
| "valid_targets_mean": 1427.4, |
| "valid_targets_min": 504 |
| }, |
| { |
| "epoch": 6.798107255520505, |
| "grad_norm": 0.8108736533059384, |
| "learning_rate": 1.023399017781368e-07, |
| "loss": 0.1051, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10756579786539078, |
| "step": 6465, |
| "valid_targets_mean": 1693.7, |
| "valid_targets_min": 1023 |
| }, |
| { |
| "epoch": 6.803364879074659, |
| "grad_norm": 0.8056099663044899, |
| "learning_rate": 9.711024230900423e-08, |
| "loss": 0.1131, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10558433830738068, |
| "step": 6470, |
| "valid_targets_mean": 1453.0, |
| "valid_targets_min": 661 |
| }, |
| { |
| "epoch": 6.808622502628812, |
| "grad_norm": 0.8129767171895947, |
| "learning_rate": 9.201740517668089e-08, |
| "loss": 0.11, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10171358287334442, |
| "step": 6475, |
| "valid_targets_mean": 1503.2, |
| "valid_targets_min": 889 |
| }, |
| { |
| "epoch": 6.813880126182966, |
| "grad_norm": 0.7868281440128144, |
| "learning_rate": 8.706142539185447e-08, |
| "loss": 0.1004, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10630994290113449, |
| "step": 6480, |
| "valid_targets_mean": 1688.3, |
| "valid_targets_min": 723 |
| }, |
| { |
| "epoch": 6.819137749737119, |
| "grad_norm": 0.8176695994395253, |
| "learning_rate": 8.224233702438966e-08, |
| "loss": 0.1107, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09925578534603119, |
| "step": 6485, |
| "valid_targets_mean": 1409.5, |
| "valid_targets_min": 793 |
| }, |
| { |
| "epoch": 6.8243953732912725, |
| "grad_norm": 0.8104128575525036, |
| "learning_rate": 7.756017320309283e-08, |
| "loss": 0.1042, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11036364734172821, |
| "step": 6490, |
| "valid_targets_mean": 1478.6, |
| "valid_targets_min": 861 |
| }, |
| { |
| "epoch": 6.829652996845426, |
| "grad_norm": 0.806142478049214, |
| "learning_rate": 7.301496611547665e-08, |
| "loss": 0.1061, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09980900585651398, |
| "step": 6495, |
| "valid_targets_mean": 1374.3, |
| "valid_targets_min": 752 |
| }, |
| { |
| "epoch": 6.8349106203995795, |
| "grad_norm": 0.8826704948410696, |
| "learning_rate": 6.86067470075491e-08, |
| "loss": 0.108, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11913549154996872, |
| "step": 6500, |
| "valid_targets_mean": 1828.4, |
| "valid_targets_min": 789 |
| }, |
| { |
| "epoch": 6.840168243953733, |
| "grad_norm": 0.7419252758538742, |
| "learning_rate": 6.433554618359816e-08, |
| "loss": 0.0954, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08761540055274963, |
| "step": 6505, |
| "valid_targets_mean": 1423.6, |
| "valid_targets_min": 638 |
| }, |
| { |
| "epoch": 6.8454258675078865, |
| "grad_norm": 0.9502874390427088, |
| "learning_rate": 6.020139300597638e-08, |
| "loss": 0.1032, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11730216443538666, |
| "step": 6510, |
| "valid_targets_mean": 1504.5, |
| "valid_targets_min": 605 |
| }, |
| { |
| "epoch": 6.85068349106204, |
| "grad_norm": 0.8453159488614819, |
| "learning_rate": 5.620431589490105e-08, |
| "loss": 0.1145, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11261233687400818, |
| "step": 6515, |
| "valid_targets_mean": 1852.8, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 6.8559411146161935, |
| "grad_norm": 0.8184180728396008, |
| "learning_rate": 5.234434232826324e-08, |
| "loss": 0.0984, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09230824559926987, |
| "step": 6520, |
| "valid_targets_mean": 1197.2, |
| "valid_targets_min": 723 |
| }, |
| { |
| "epoch": 6.861198738170347, |
| "grad_norm": 0.7795495085632375, |
| "learning_rate": 4.862149884143907e-08, |
| "loss": 0.1082, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10440020263195038, |
| "step": 6525, |
| "valid_targets_mean": 1528.6, |
| "valid_targets_min": 855 |
| }, |
| { |
| "epoch": 6.8664563617245005, |
| "grad_norm": 0.7558441306982393, |
| "learning_rate": 4.503581102709875e-08, |
| "loss": 0.1081, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10062847286462784, |
| "step": 6530, |
| "valid_targets_mean": 1590.4, |
| "valid_targets_min": 902 |
| }, |
| { |
| "epoch": 6.871713985278654, |
| "grad_norm": 0.7764594977941333, |
| "learning_rate": 4.1587303535040035e-08, |
| "loss": 0.1047, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0995735302567482, |
| "step": 6535, |
| "valid_targets_mean": 1551.3, |
| "valid_targets_min": 803 |
| }, |
| { |
| "epoch": 6.8769716088328074, |
| "grad_norm": 0.8417640147042569, |
| "learning_rate": 3.827600007201282e-08, |
| "loss": 0.1091, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11624845862388611, |
| "step": 6540, |
| "valid_targets_mean": 1491.0, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 6.882229232386961, |
| "grad_norm": 0.7645744692343718, |
| "learning_rate": 3.510192340156149e-08, |
| "loss": 0.1053, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09398191422224045, |
| "step": 6545, |
| "valid_targets_mean": 1486.4, |
| "valid_targets_min": 1124 |
| }, |
| { |
| "epoch": 6.887486855941114, |
| "grad_norm": 0.8565616947940794, |
| "learning_rate": 3.20650953438606e-08, |
| "loss": 0.1064, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11091434955596924, |
| "step": 6550, |
| "valid_targets_mean": 1528.4, |
| "valid_targets_min": 655 |
| }, |
| { |
| "epoch": 6.892744479495268, |
| "grad_norm": 0.8665795299632393, |
| "learning_rate": 2.9165536775574987e-08, |
| "loss": 0.102, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11346090584993362, |
| "step": 6555, |
| "valid_targets_mean": 1507.2, |
| "valid_targets_min": 667 |
| }, |
| { |
| "epoch": 6.898002103049421, |
| "grad_norm": 0.8729186998860712, |
| "learning_rate": 2.6403267629706575e-08, |
| "loss": 0.1126, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11617542058229446, |
| "step": 6560, |
| "valid_targets_mean": 1626.7, |
| "valid_targets_min": 1012 |
| }, |
| { |
| "epoch": 6.903259726603575, |
| "grad_norm": 0.8284996847529668, |
| "learning_rate": 2.3778306895467785e-08, |
| "loss": 0.1092, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10244105756282806, |
| "step": 6565, |
| "valid_targets_mean": 1362.2, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 6.908517350157728, |
| "grad_norm": 0.8091313800748592, |
| "learning_rate": 2.1290672618135e-08, |
| "loss": 0.1128, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10324139147996902, |
| "step": 6570, |
| "valid_targets_mean": 1613.3, |
| "valid_targets_min": 821 |
| }, |
| { |
| "epoch": 6.913774973711882, |
| "grad_norm": 0.7784695906063172, |
| "learning_rate": 1.8940381898946424e-08, |
| "loss": 0.1009, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09095930308103561, |
| "step": 6575, |
| "valid_targets_mean": 1164.2, |
| "valid_targets_min": 620 |
| }, |
| { |
| "epoch": 6.919032597266035, |
| "grad_norm": 0.7875994239344112, |
| "learning_rate": 1.6727450894959973e-08, |
| "loss": 0.1014, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09893280267715454, |
| "step": 6580, |
| "valid_targets_mean": 1539.8, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 6.92429022082019, |
| "grad_norm": 0.8263690135861804, |
| "learning_rate": 1.4651894818966671e-08, |
| "loss": 0.1078, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13145191967487335, |
| "step": 6585, |
| "valid_targets_mean": 1951.9, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 6.929547844374342, |
| "grad_norm": 0.8020330751476579, |
| "learning_rate": 1.2713727939364096e-08, |
| "loss": 0.1033, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10347574949264526, |
| "step": 6590, |
| "valid_targets_mean": 1668.9, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 6.934805467928497, |
| "grad_norm": 0.7340918206011074, |
| "learning_rate": 1.091296358007643e-08, |
| "loss": 0.1033, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09722069650888443, |
| "step": 6595, |
| "valid_targets_mean": 1469.9, |
| "valid_targets_min": 850 |
| }, |
| { |
| "epoch": 6.94006309148265, |
| "grad_norm": 0.8148284715509453, |
| "learning_rate": 9.249614120450113e-09, |
| "loss": 0.1032, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08994179219007492, |
| "step": 6600, |
| "valid_targets_mean": 1366.6, |
| "valid_targets_min": 747 |
| }, |
| { |
| "epoch": 6.945320715036804, |
| "grad_norm": 0.7788698962799686, |
| "learning_rate": 7.723690995171673e-09, |
| "loss": 0.1197, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10366678237915039, |
| "step": 6605, |
| "valid_targets_mean": 1576.2, |
| "valid_targets_min": 933 |
| }, |
| { |
| "epoch": 6.950578338590957, |
| "grad_norm": 0.7730143749391549, |
| "learning_rate": 6.335204694196684e-09, |
| "loss": 0.1035, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1019914299249649, |
| "step": 6610, |
| "valid_targets_mean": 1368.4, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 6.955835962145111, |
| "grad_norm": 0.7974230619550986, |
| "learning_rate": 5.084164762667598e-09, |
| "loss": 0.1023, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09194013476371765, |
| "step": 6615, |
| "valid_targets_mean": 1435.2, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 6.961093585699264, |
| "grad_norm": 0.7252215246052376, |
| "learning_rate": 3.970579800853802e-09, |
| "loss": 0.107, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09134560823440552, |
| "step": 6620, |
| "valid_targets_mean": 1414.9, |
| "valid_targets_min": 639 |
| }, |
| { |
| "epoch": 6.966351209253418, |
| "grad_norm": 0.8333562638031162, |
| "learning_rate": 2.9944574640894398e-09, |
| "loss": 0.0962, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10189159214496613, |
| "step": 6625, |
| "valid_targets_mean": 1274.8, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 6.971608832807571, |
| "grad_norm": 0.8276294435850765, |
| "learning_rate": 2.1558044627267847e-09, |
| "loss": 0.1073, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09945736825466156, |
| "step": 6630, |
| "valid_targets_mean": 1450.4, |
| "valid_targets_min": 610 |
| }, |
| { |
| "epoch": 6.976866456361725, |
| "grad_norm": 0.7707616571362058, |
| "learning_rate": 1.4546265620785094e-09, |
| "loss": 0.1016, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0964282751083374, |
| "step": 6635, |
| "valid_targets_mean": 1527.5, |
| "valid_targets_min": 695 |
| }, |
| { |
| "epoch": 6.982124079915878, |
| "grad_norm": 0.8163614239658551, |
| "learning_rate": 8.909285823910374e-10, |
| "loss": 0.1103, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10646478831768036, |
| "step": 6640, |
| "valid_targets_mean": 1575.1, |
| "valid_targets_min": 807 |
| }, |
| { |
| "epoch": 6.987381703470032, |
| "grad_norm": 0.7974354783585509, |
| "learning_rate": 4.647143988067981e-10, |
| "loss": 0.1066, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09756039083003998, |
| "step": 6645, |
| "valid_targets_mean": 1433.2, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 6.992639327024185, |
| "grad_norm": 0.8841092953018291, |
| "learning_rate": 1.7598694132869853e-10, |
| "loss": 0.1026, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10267548263072968, |
| "step": 6650, |
| "valid_targets_mean": 1380.9, |
| "valid_targets_min": 589 |
| }, |
| { |
| "epoch": 6.997896950578339, |
| "grad_norm": 0.7888297932191874, |
| "learning_rate": 2.474819481568247e-11, |
| "loss": 0.1053, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10763907432556152, |
| "step": 6655, |
| "valid_targets_mean": 1628.9, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 7.0, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08077868074178696, |
| "step": 6657, |
| "total_flos": 1429777853448192.0, |
| "train_loss": 0.1377790669734474, |
| "train_runtime": 24334.9572, |
| "train_samples_per_second": 4.375, |
| "train_steps_per_second": 0.274, |
| "valid_targets_mean": 1517.8, |
| "valid_targets_min": 393 |
| } |
| ], |
| "logging_steps": 5, |
| "max_steps": 6657, |
| "num_input_tokens_seen": 0, |
| "num_train_epochs": 7, |
| "save_steps": 200, |
| "stateful_callbacks": { |
| "TrainerControl": { |
| "args": { |
| "should_epoch_stop": false, |
| "should_evaluate": false, |
| "should_log": false, |
| "should_save": true, |
| "should_training_stop": true |
| }, |
| "attributes": {} |
| } |
| }, |
| "total_flos": 1429777853448192.0, |
| "train_batch_size": 1, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|