nl2bash-stack-undr7030 / trainer_state.json
hf-reset
Reset repository without checkpoints directories
15d059b
{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 4361,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.008025682182985553,
"grad_norm": 14.646306271075366,
"learning_rate": 3.661327231121282e-07,
"loss": 0.7867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.8202405571937561,
"step": 5,
"valid_targets_mean": 1387.8,
"valid_targets_min": 651
},
{
"epoch": 0.016051364365971106,
"grad_norm": 11.968096269141974,
"learning_rate": 8.237986270022884e-07,
"loss": 0.7576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7305525541305542,
"step": 10,
"valid_targets_mean": 1799.4,
"valid_targets_min": 655
},
{
"epoch": 0.024077046548956663,
"grad_norm": 11.236420564589006,
"learning_rate": 1.2814645308924487e-06,
"loss": 0.7727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7805347442626953,
"step": 15,
"valid_targets_mean": 1906.4,
"valid_targets_min": 912
},
{
"epoch": 0.03210272873194221,
"grad_norm": 8.949334311195145,
"learning_rate": 1.7391304347826088e-06,
"loss": 0.752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7785749435424805,
"step": 20,
"valid_targets_mean": 2390.4,
"valid_targets_min": 801
},
{
"epoch": 0.04012841091492777,
"grad_norm": 5.3497727404284365,
"learning_rate": 2.196796338672769e-06,
"loss": 0.673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6312217712402344,
"step": 25,
"valid_targets_mean": 2391.2,
"valid_targets_min": 658
},
{
"epoch": 0.048154093097913325,
"grad_norm": 4.580136509374292,
"learning_rate": 2.654462242562929e-06,
"loss": 0.6483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6121365427970886,
"step": 30,
"valid_targets_mean": 2334.8,
"valid_targets_min": 677
},
{
"epoch": 0.056179775280898875,
"grad_norm": 4.161436647961576,
"learning_rate": 3.1121281464530894e-06,
"loss": 0.5971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.592909574508667,
"step": 35,
"valid_targets_mean": 1784.5,
"valid_targets_min": 1077
},
{
"epoch": 0.06420545746388442,
"grad_norm": 3.212931241614404,
"learning_rate": 3.56979405034325e-06,
"loss": 0.5523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5291016697883606,
"step": 40,
"valid_targets_mean": 1793.4,
"valid_targets_min": 650
},
{
"epoch": 0.07223113964686999,
"grad_norm": 1.89939583890284,
"learning_rate": 4.0274599542334094e-06,
"loss": 0.5286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5067185759544373,
"step": 45,
"valid_targets_mean": 1862.8,
"valid_targets_min": 656
},
{
"epoch": 0.08025682182985554,
"grad_norm": 1.4106073213091272,
"learning_rate": 4.48512585812357e-06,
"loss": 0.4867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45846793055534363,
"step": 50,
"valid_targets_mean": 1882.2,
"valid_targets_min": 548
},
{
"epoch": 0.08828250401284109,
"grad_norm": 1.314092536682443,
"learning_rate": 4.94279176201373e-06,
"loss": 0.5091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5191839933395386,
"step": 55,
"valid_targets_mean": 1953.6,
"valid_targets_min": 573
},
{
"epoch": 0.09630818619582665,
"grad_norm": 1.22631301037501,
"learning_rate": 5.400457665903891e-06,
"loss": 0.4681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4688069522380829,
"step": 60,
"valid_targets_mean": 1773.1,
"valid_targets_min": 596
},
{
"epoch": 0.1043338683788122,
"grad_norm": 0.9527209313385111,
"learning_rate": 5.858123569794051e-06,
"loss": 0.4591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43702492117881775,
"step": 65,
"valid_targets_mean": 2561.0,
"valid_targets_min": 612
},
{
"epoch": 0.11235955056179775,
"grad_norm": 1.000235844903914,
"learning_rate": 6.31578947368421e-06,
"loss": 0.4309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4246852397918701,
"step": 70,
"valid_targets_mean": 1998.6,
"valid_targets_min": 570
},
{
"epoch": 0.12038523274478331,
"grad_norm": 1.0089319236844694,
"learning_rate": 6.773455377574372e-06,
"loss": 0.4347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43148094415664673,
"step": 75,
"valid_targets_mean": 1942.4,
"valid_targets_min": 806
},
{
"epoch": 0.12841091492776885,
"grad_norm": 0.8232756236327731,
"learning_rate": 7.231121281464531e-06,
"loss": 0.4306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43262892961502075,
"step": 80,
"valid_targets_mean": 2726.3,
"valid_targets_min": 1188
},
{
"epoch": 0.13643659711075443,
"grad_norm": 0.9596497429181713,
"learning_rate": 7.688787185354691e-06,
"loss": 0.4277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4384536147117615,
"step": 85,
"valid_targets_mean": 2762.1,
"valid_targets_min": 981
},
{
"epoch": 0.14446227929373998,
"grad_norm": 0.9854480370415547,
"learning_rate": 8.146453089244852e-06,
"loss": 0.409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4489230513572693,
"step": 90,
"valid_targets_mean": 2211.6,
"valid_targets_min": 836
},
{
"epoch": 0.15248796147672553,
"grad_norm": 0.8568389517883238,
"learning_rate": 8.604118993135013e-06,
"loss": 0.3943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38258206844329834,
"step": 95,
"valid_targets_mean": 1985.7,
"valid_targets_min": 662
},
{
"epoch": 0.16051364365971107,
"grad_norm": 0.963371139740054,
"learning_rate": 9.061784897025172e-06,
"loss": 0.3885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39598965644836426,
"step": 100,
"valid_targets_mean": 1740.9,
"valid_targets_min": 850
},
{
"epoch": 0.16853932584269662,
"grad_norm": 0.7956839523047545,
"learning_rate": 9.519450800915333e-06,
"loss": 0.3943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3456423878669739,
"step": 105,
"valid_targets_mean": 2082.3,
"valid_targets_min": 765
},
{
"epoch": 0.17656500802568217,
"grad_norm": 1.0007550081839145,
"learning_rate": 9.977116704805492e-06,
"loss": 0.3831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.386109322309494,
"step": 110,
"valid_targets_mean": 1802.2,
"valid_targets_min": 734
},
{
"epoch": 0.18459069020866772,
"grad_norm": 1.0875676039705295,
"learning_rate": 1.0434782608695653e-05,
"loss": 0.3762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.394925057888031,
"step": 115,
"valid_targets_mean": 1672.4,
"valid_targets_min": 753
},
{
"epoch": 0.1926163723916533,
"grad_norm": 0.7978089011421273,
"learning_rate": 1.0892448512585814e-05,
"loss": 0.3906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37832242250442505,
"step": 120,
"valid_targets_mean": 2175.1,
"valid_targets_min": 785
},
{
"epoch": 0.20064205457463885,
"grad_norm": 0.8058045609374141,
"learning_rate": 1.1350114416475973e-05,
"loss": 0.3619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38131511211395264,
"step": 125,
"valid_targets_mean": 2393.2,
"valid_targets_min": 780
},
{
"epoch": 0.2086677367576244,
"grad_norm": 1.0459248253632374,
"learning_rate": 1.1807780320366134e-05,
"loss": 0.361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3370898962020874,
"step": 130,
"valid_targets_mean": 2067.6,
"valid_targets_min": 778
},
{
"epoch": 0.21669341894060995,
"grad_norm": 0.815390844225969,
"learning_rate": 1.2265446224256295e-05,
"loss": 0.3776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41217032074928284,
"step": 135,
"valid_targets_mean": 2430.4,
"valid_targets_min": 533
},
{
"epoch": 0.2247191011235955,
"grad_norm": 0.7725880706273025,
"learning_rate": 1.2723112128146454e-05,
"loss": 0.3671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3731037378311157,
"step": 140,
"valid_targets_mean": 2520.3,
"valid_targets_min": 965
},
{
"epoch": 0.23274478330658105,
"grad_norm": 0.9555725515372832,
"learning_rate": 1.3180778032036615e-05,
"loss": 0.3566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37982848286628723,
"step": 145,
"valid_targets_mean": 1930.0,
"valid_targets_min": 705
},
{
"epoch": 0.24077046548956663,
"grad_norm": 0.9884623923983096,
"learning_rate": 1.3638443935926776e-05,
"loss": 0.3674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3775394856929779,
"step": 150,
"valid_targets_mean": 2116.7,
"valid_targets_min": 662
},
{
"epoch": 0.24879614767255218,
"grad_norm": 1.034002208624198,
"learning_rate": 1.4096109839816933e-05,
"loss": 0.339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28776052594184875,
"step": 155,
"valid_targets_mean": 1503.6,
"valid_targets_min": 695
},
{
"epoch": 0.2568218298555377,
"grad_norm": 0.6896418675498204,
"learning_rate": 1.4553775743707096e-05,
"loss": 0.3622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3446170687675476,
"step": 160,
"valid_targets_mean": 2950.1,
"valid_targets_min": 939
},
{
"epoch": 0.26484751203852325,
"grad_norm": 1.0577856602046278,
"learning_rate": 1.5011441647597256e-05,
"loss": 0.3664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33905932307243347,
"step": 165,
"valid_targets_mean": 1820.1,
"valid_targets_min": 1114
},
{
"epoch": 0.27287319422150885,
"grad_norm": 0.9974853998819494,
"learning_rate": 1.5469107551487414e-05,
"loss": 0.346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3451690077781677,
"step": 170,
"valid_targets_mean": 1546.1,
"valid_targets_min": 563
},
{
"epoch": 0.2808988764044944,
"grad_norm": 1.0338258108878557,
"learning_rate": 1.5926773455377575e-05,
"loss": 0.3351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31521838903427124,
"step": 175,
"valid_targets_mean": 1886.1,
"valid_targets_min": 1008
},
{
"epoch": 0.28892455858747995,
"grad_norm": 0.8727309799049142,
"learning_rate": 1.6384439359267736e-05,
"loss": 0.3715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38526463508605957,
"step": 180,
"valid_targets_mean": 2234.8,
"valid_targets_min": 824
},
{
"epoch": 0.2969502407704655,
"grad_norm": 1.0474632318062393,
"learning_rate": 1.6842105263157896e-05,
"loss": 0.3609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4184132218360901,
"step": 185,
"valid_targets_mean": 1813.5,
"valid_targets_min": 746
},
{
"epoch": 0.30497592295345105,
"grad_norm": 0.904562584347718,
"learning_rate": 1.7299771167048057e-05,
"loss": 0.3305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2930997908115387,
"step": 190,
"valid_targets_mean": 1764.8,
"valid_targets_min": 1292
},
{
"epoch": 0.3130016051364366,
"grad_norm": 1.0289326023752954,
"learning_rate": 1.7757437070938218e-05,
"loss": 0.3533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3898566663265228,
"step": 195,
"valid_targets_mean": 1837.3,
"valid_targets_min": 834
},
{
"epoch": 0.32102728731942215,
"grad_norm": 0.7975458356550457,
"learning_rate": 1.8215102974828376e-05,
"loss": 0.3667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41650494933128357,
"step": 200,
"valid_targets_mean": 2710.9,
"valid_targets_min": 631
},
{
"epoch": 0.3290529695024077,
"grad_norm": 0.8771063421172884,
"learning_rate": 1.8672768878718537e-05,
"loss": 0.362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33713459968566895,
"step": 205,
"valid_targets_mean": 1893.6,
"valid_targets_min": 703
},
{
"epoch": 0.33707865168539325,
"grad_norm": 0.9698501237808315,
"learning_rate": 1.9130434782608697e-05,
"loss": 0.327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32817181944847107,
"step": 210,
"valid_targets_mean": 1683.0,
"valid_targets_min": 923
},
{
"epoch": 0.3451043338683788,
"grad_norm": 0.9474489541649586,
"learning_rate": 1.9588100686498858e-05,
"loss": 0.3341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2981823682785034,
"step": 215,
"valid_targets_mean": 1833.7,
"valid_targets_min": 688
},
{
"epoch": 0.35313001605136435,
"grad_norm": 1.181216739010819,
"learning_rate": 2.004576659038902e-05,
"loss": 0.3472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3394661247730255,
"step": 220,
"valid_targets_mean": 1705.2,
"valid_targets_min": 762
},
{
"epoch": 0.3611556982343499,
"grad_norm": 0.8600956132450231,
"learning_rate": 2.050343249427918e-05,
"loss": 0.3324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36123359203338623,
"step": 225,
"valid_targets_mean": 2096.8,
"valid_targets_min": 611
},
{
"epoch": 0.36918138041733545,
"grad_norm": 0.882945376901777,
"learning_rate": 2.0961098398169337e-05,
"loss": 0.3306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36194247007369995,
"step": 230,
"valid_targets_mean": 1882.9,
"valid_targets_min": 740
},
{
"epoch": 0.37720706260032105,
"grad_norm": 0.8725076626948183,
"learning_rate": 2.14187643020595e-05,
"loss": 0.3493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38940614461898804,
"step": 235,
"valid_targets_mean": 2167.7,
"valid_targets_min": 827
},
{
"epoch": 0.3852327447833066,
"grad_norm": 0.7630509783880415,
"learning_rate": 2.187643020594966e-05,
"loss": 0.3471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35910847783088684,
"step": 240,
"valid_targets_mean": 2668.9,
"valid_targets_min": 728
},
{
"epoch": 0.39325842696629215,
"grad_norm": 0.8495303482377304,
"learning_rate": 2.2334096109839817e-05,
"loss": 0.328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2962149977684021,
"step": 245,
"valid_targets_mean": 1937.8,
"valid_targets_min": 692
},
{
"epoch": 0.4012841091492777,
"grad_norm": 0.7814400087970893,
"learning_rate": 2.279176201372998e-05,
"loss": 0.3436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3515506386756897,
"step": 250,
"valid_targets_mean": 3026.1,
"valid_targets_min": 1030
},
{
"epoch": 0.40930979133226325,
"grad_norm": 0.8463651123622614,
"learning_rate": 2.3249427917620138e-05,
"loss": 0.3345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3280409574508667,
"step": 255,
"valid_targets_mean": 2258.4,
"valid_targets_min": 1139
},
{
"epoch": 0.4173354735152488,
"grad_norm": 0.9681815239196544,
"learning_rate": 2.37070938215103e-05,
"loss": 0.3405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34646350145339966,
"step": 260,
"valid_targets_mean": 1639.3,
"valid_targets_min": 714
},
{
"epoch": 0.42536115569823435,
"grad_norm": 0.8245899420634851,
"learning_rate": 2.4164759725400463e-05,
"loss": 0.3234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29822391271591187,
"step": 265,
"valid_targets_mean": 2175.2,
"valid_targets_min": 807
},
{
"epoch": 0.4333868378812199,
"grad_norm": 0.8089617843516632,
"learning_rate": 2.462242562929062e-05,
"loss": 0.3253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33770427107810974,
"step": 270,
"valid_targets_mean": 2268.4,
"valid_targets_min": 694
},
{
"epoch": 0.44141252006420545,
"grad_norm": 0.9716784399381654,
"learning_rate": 2.508009153318078e-05,
"loss": 0.3199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31351184844970703,
"step": 275,
"valid_targets_mean": 1710.8,
"valid_targets_min": 721
},
{
"epoch": 0.449438202247191,
"grad_norm": 0.9572310179043315,
"learning_rate": 2.5537757437070943e-05,
"loss": 0.3171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28802695870399475,
"step": 280,
"valid_targets_mean": 1709.4,
"valid_targets_min": 754
},
{
"epoch": 0.45746388443017655,
"grad_norm": 0.9544189503916952,
"learning_rate": 2.59954233409611e-05,
"loss": 0.317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3242787718772888,
"step": 285,
"valid_targets_mean": 1835.8,
"valid_targets_min": 567
},
{
"epoch": 0.4654895666131621,
"grad_norm": 1.0011493165732186,
"learning_rate": 2.645308924485126e-05,
"loss": 0.336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30623307824134827,
"step": 290,
"valid_targets_mean": 1786.2,
"valid_targets_min": 790
},
{
"epoch": 0.47351524879614765,
"grad_norm": 0.8661555211405326,
"learning_rate": 2.6910755148741422e-05,
"loss": 0.3137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30924296379089355,
"step": 295,
"valid_targets_mean": 2096.7,
"valid_targets_min": 244
},
{
"epoch": 0.48154093097913325,
"grad_norm": 1.0988416641746142,
"learning_rate": 2.7368421052631583e-05,
"loss": 0.3165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30219322443008423,
"step": 300,
"valid_targets_mean": 2274.4,
"valid_targets_min": 801
},
{
"epoch": 0.4895666131621188,
"grad_norm": 1.0111186395980374,
"learning_rate": 2.782608695652174e-05,
"loss": 0.3342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34024935960769653,
"step": 305,
"valid_targets_mean": 1785.6,
"valid_targets_min": 859
},
{
"epoch": 0.49759229534510435,
"grad_norm": 1.1586792124415861,
"learning_rate": 2.8283752860411904e-05,
"loss": 0.3107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31047970056533813,
"step": 310,
"valid_targets_mean": 1722.4,
"valid_targets_min": 746
},
{
"epoch": 0.5056179775280899,
"grad_norm": 0.832944021979809,
"learning_rate": 2.8741418764302062e-05,
"loss": 0.307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3337301015853882,
"step": 315,
"valid_targets_mean": 2222.3,
"valid_targets_min": 851
},
{
"epoch": 0.5136436597110754,
"grad_norm": 0.8609636836160994,
"learning_rate": 2.9199084668192223e-05,
"loss": 0.2979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29694342613220215,
"step": 320,
"valid_targets_mean": 1934.9,
"valid_targets_min": 640
},
{
"epoch": 0.521669341894061,
"grad_norm": 0.8598522131098509,
"learning_rate": 2.9656750572082384e-05,
"loss": 0.3052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3284974694252014,
"step": 325,
"valid_targets_mean": 2044.1,
"valid_targets_min": 869
},
{
"epoch": 0.5296950240770465,
"grad_norm": 0.952951010741885,
"learning_rate": 3.0114416475972544e-05,
"loss": 0.3276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28754106163978577,
"step": 330,
"valid_targets_mean": 1731.6,
"valid_targets_min": 679
},
{
"epoch": 0.5377207062600321,
"grad_norm": 0.9490678253695298,
"learning_rate": 3.05720823798627e-05,
"loss": 0.2909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3454781174659729,
"step": 335,
"valid_targets_mean": 1781.4,
"valid_targets_min": 744
},
{
"epoch": 0.5457463884430177,
"grad_norm": 1.18873344442354,
"learning_rate": 3.102974828375286e-05,
"loss": 0.2988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29542940855026245,
"step": 340,
"valid_targets_mean": 1536.3,
"valid_targets_min": 621
},
{
"epoch": 0.5537720706260032,
"grad_norm": 1.1976009299731565,
"learning_rate": 3.1487414187643024e-05,
"loss": 0.3173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2791876792907715,
"step": 345,
"valid_targets_mean": 1599.9,
"valid_targets_min": 698
},
{
"epoch": 0.5617977528089888,
"grad_norm": 0.9101478694060584,
"learning_rate": 3.1945080091533184e-05,
"loss": 0.2994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2871367335319519,
"step": 350,
"valid_targets_mean": 1797.5,
"valid_targets_min": 646
},
{
"epoch": 0.5698234349919743,
"grad_norm": 0.9896692838718341,
"learning_rate": 3.240274599542334e-05,
"loss": 0.3153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2911245822906494,
"step": 355,
"valid_targets_mean": 1839.2,
"valid_targets_min": 661
},
{
"epoch": 0.5778491171749599,
"grad_norm": 0.9509341469647331,
"learning_rate": 3.2860411899313506e-05,
"loss": 0.3164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29795265197753906,
"step": 360,
"valid_targets_mean": 1844.8,
"valid_targets_min": 810
},
{
"epoch": 0.5858747993579454,
"grad_norm": 0.8552209611893014,
"learning_rate": 3.331807780320366e-05,
"loss": 0.3174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35684460401535034,
"step": 365,
"valid_targets_mean": 2129.5,
"valid_targets_min": 711
},
{
"epoch": 0.593900481540931,
"grad_norm": 0.8555759703411486,
"learning_rate": 3.377574370709382e-05,
"loss": 0.3255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28512653708457947,
"step": 370,
"valid_targets_mean": 1772.9,
"valid_targets_min": 770
},
{
"epoch": 0.6019261637239165,
"grad_norm": 0.9269879757302991,
"learning_rate": 3.423340961098399e-05,
"loss": 0.3077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25699400901794434,
"step": 375,
"valid_targets_mean": 1689.4,
"valid_targets_min": 645
},
{
"epoch": 0.6099518459069021,
"grad_norm": 1.0001088715401525,
"learning_rate": 3.469107551487414e-05,
"loss": 0.315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34773507714271545,
"step": 380,
"valid_targets_mean": 1948.1,
"valid_targets_min": 712
},
{
"epoch": 0.6179775280898876,
"grad_norm": 1.170913919890504,
"learning_rate": 3.5148741418764304e-05,
"loss": 0.2916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27243420481681824,
"step": 385,
"valid_targets_mean": 1619.1,
"valid_targets_min": 874
},
{
"epoch": 0.6260032102728732,
"grad_norm": 0.8232018782624154,
"learning_rate": 3.5606407322654464e-05,
"loss": 0.3072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32129108905792236,
"step": 390,
"valid_targets_mean": 2377.1,
"valid_targets_min": 764
},
{
"epoch": 0.6340288924558587,
"grad_norm": 0.8185543627668448,
"learning_rate": 3.6064073226544625e-05,
"loss": 0.3273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3443065881729126,
"step": 395,
"valid_targets_mean": 2255.8,
"valid_targets_min": 856
},
{
"epoch": 0.6420545746388443,
"grad_norm": 0.9722842463690324,
"learning_rate": 3.6521739130434786e-05,
"loss": 0.2939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30047857761383057,
"step": 400,
"valid_targets_mean": 1743.6,
"valid_targets_min": 822
},
{
"epoch": 0.6500802568218299,
"grad_norm": 0.7967856246753074,
"learning_rate": 3.697940503432495e-05,
"loss": 0.3206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2986922860145569,
"step": 405,
"valid_targets_mean": 2248.8,
"valid_targets_min": 776
},
{
"epoch": 0.6581059390048154,
"grad_norm": 0.8316226837505692,
"learning_rate": 3.743707093821511e-05,
"loss": 0.3035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28393733501434326,
"step": 410,
"valid_targets_mean": 1886.7,
"valid_targets_min": 668
},
{
"epoch": 0.666131621187801,
"grad_norm": 1.1649505956487092,
"learning_rate": 3.789473684210526e-05,
"loss": 0.3091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3361932039260864,
"step": 415,
"valid_targets_mean": 2057.5,
"valid_targets_min": 649
},
{
"epoch": 0.6741573033707865,
"grad_norm": 0.8674562998891178,
"learning_rate": 3.835240274599543e-05,
"loss": 0.2817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.286508172750473,
"step": 420,
"valid_targets_mean": 1988.1,
"valid_targets_min": 790
},
{
"epoch": 0.6821829855537721,
"grad_norm": 0.9171965836082356,
"learning_rate": 3.8810068649885584e-05,
"loss": 0.3252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3114051818847656,
"step": 425,
"valid_targets_mean": 1783.7,
"valid_targets_min": 940
},
{
"epoch": 0.6902086677367576,
"grad_norm": 0.8725500087205194,
"learning_rate": 3.9267734553775745e-05,
"loss": 0.2903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2869841754436493,
"step": 430,
"valid_targets_mean": 1863.4,
"valid_targets_min": 768
},
{
"epoch": 0.6982343499197432,
"grad_norm": 0.9441119652995636,
"learning_rate": 3.9725400457665905e-05,
"loss": 0.3042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2990264892578125,
"step": 435,
"valid_targets_mean": 1948.9,
"valid_targets_min": 1061
},
{
"epoch": 0.7062600321027287,
"grad_norm": 0.9405263676842486,
"learning_rate": 3.99999743609667e-05,
"loss": 0.3121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32914310693740845,
"step": 440,
"valid_targets_mean": 2115.7,
"valid_targets_min": 572
},
{
"epoch": 0.7142857142857143,
"grad_norm": 0.8453482397076572,
"learning_rate": 3.999968592259695e-05,
"loss": 0.3008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30714958906173706,
"step": 445,
"valid_targets_mean": 2305.3,
"valid_targets_min": 1354
},
{
"epoch": 0.7223113964686998,
"grad_norm": 0.7738975856001973,
"learning_rate": 3.9999077001703266e-05,
"loss": 0.3068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32613644003868103,
"step": 450,
"valid_targets_mean": 2465.8,
"valid_targets_min": 881
},
{
"epoch": 0.7303370786516854,
"grad_norm": 0.8149570285290635,
"learning_rate": 3.999814760804324e-05,
"loss": 0.3068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30127108097076416,
"step": 455,
"valid_targets_mean": 1977.8,
"valid_targets_min": 747
},
{
"epoch": 0.7383627608346709,
"grad_norm": 0.9294086272204561,
"learning_rate": 3.9996897756509806e-05,
"loss": 0.3028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27201634645462036,
"step": 460,
"valid_targets_mean": 1491.2,
"valid_targets_min": 647
},
{
"epoch": 0.7463884430176565,
"grad_norm": 0.8344262631630353,
"learning_rate": 3.9995327467131074e-05,
"loss": 0.3243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33017224073410034,
"step": 465,
"valid_targets_mean": 1846.1,
"valid_targets_min": 790
},
{
"epoch": 0.7544141252006421,
"grad_norm": 0.7829996456838156,
"learning_rate": 3.9993436765069954e-05,
"loss": 0.316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3319680094718933,
"step": 470,
"valid_targets_mean": 2419.9,
"valid_targets_min": 534
},
{
"epoch": 0.7624398073836276,
"grad_norm": 0.8771047139224807,
"learning_rate": 3.999122568062376e-05,
"loss": 0.3174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3266174793243408,
"step": 475,
"valid_targets_mean": 2624.4,
"valid_targets_min": 919
},
{
"epoch": 0.7704654895666132,
"grad_norm": 0.8858493072216881,
"learning_rate": 3.9988694249223747e-05,
"loss": 0.305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.275663822889328,
"step": 480,
"valid_targets_mean": 1647.2,
"valid_targets_min": 684
},
{
"epoch": 0.7784911717495987,
"grad_norm": 0.7689051739854088,
"learning_rate": 3.9985842511434544e-05,
"loss": 0.2923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2797590494155884,
"step": 485,
"valid_targets_mean": 2174.2,
"valid_targets_min": 982
},
{
"epoch": 0.7865168539325843,
"grad_norm": 0.8020487982931901,
"learning_rate": 3.9982670512953446e-05,
"loss": 0.3016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34576845169067383,
"step": 490,
"valid_targets_mean": 2432.9,
"valid_targets_min": 884
},
{
"epoch": 0.7945425361155698,
"grad_norm": 0.9730877600468747,
"learning_rate": 3.9979178304609777e-05,
"loss": 0.2908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27685031294822693,
"step": 495,
"valid_targets_mean": 1754.3,
"valid_targets_min": 549
},
{
"epoch": 0.8025682182985554,
"grad_norm": 0.8427811924307392,
"learning_rate": 3.9975365942364e-05,
"loss": 0.2916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26822972297668457,
"step": 500,
"valid_targets_mean": 1744.6,
"valid_targets_min": 698
},
{
"epoch": 0.8105939004815409,
"grad_norm": 0.8345994269057178,
"learning_rate": 3.997123348730685e-05,
"loss": 0.2982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2742110788822174,
"step": 505,
"valid_targets_mean": 2118.4,
"valid_targets_min": 845
},
{
"epoch": 0.8186195826645265,
"grad_norm": 0.7394141508614848,
"learning_rate": 3.9966781005658336e-05,
"loss": 0.3182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29566675424575806,
"step": 510,
"valid_targets_mean": 2393.6,
"valid_targets_min": 770
},
{
"epoch": 0.826645264847512,
"grad_norm": 0.7868169024326342,
"learning_rate": 3.996200856876671e-05,
"loss": 0.3184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31672143936157227,
"step": 515,
"valid_targets_mean": 2246.7,
"valid_targets_min": 659
},
{
"epoch": 0.8346709470304976,
"grad_norm": 0.8208599603839487,
"learning_rate": 3.9956916253107316e-05,
"loss": 0.2801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23943054676055908,
"step": 520,
"valid_targets_mean": 1570.6,
"valid_targets_min": 836
},
{
"epoch": 0.8426966292134831,
"grad_norm": 0.8304116707206449,
"learning_rate": 3.995150414028134e-05,
"loss": 0.2939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30285578966140747,
"step": 525,
"valid_targets_mean": 1989.4,
"valid_targets_min": 781
},
{
"epoch": 0.8507223113964687,
"grad_norm": 1.0277770584511348,
"learning_rate": 3.994577231701451e-05,
"loss": 0.2891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32783007621765137,
"step": 530,
"valid_targets_mean": 2061.1,
"valid_targets_min": 799
},
{
"epoch": 0.8587479935794543,
"grad_norm": 0.952928563450375,
"learning_rate": 3.993972087515574e-05,
"loss": 0.3037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34268754720687866,
"step": 535,
"valid_targets_mean": 1843.8,
"valid_targets_min": 777
},
{
"epoch": 0.8667736757624398,
"grad_norm": 0.9308129927095735,
"learning_rate": 3.9933349911675615e-05,
"loss": 0.3211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2926996052265167,
"step": 540,
"valid_targets_mean": 1644.0,
"valid_targets_min": 882
},
{
"epoch": 0.8747993579454254,
"grad_norm": 0.7426138307689881,
"learning_rate": 3.9926659528664866e-05,
"loss": 0.2915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2840152978897095,
"step": 545,
"valid_targets_mean": 2081.6,
"valid_targets_min": 668
},
{
"epoch": 0.8828250401284109,
"grad_norm": 0.7590896177179798,
"learning_rate": 3.9919649833332715e-05,
"loss": 0.2874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30055904388427734,
"step": 550,
"valid_targets_mean": 2541.2,
"valid_targets_min": 982
},
{
"epoch": 0.8908507223113965,
"grad_norm": 0.9273338134445059,
"learning_rate": 3.991232093800517e-05,
"loss": 0.2785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22772808372974396,
"step": 555,
"valid_targets_mean": 1515.6,
"valid_targets_min": 727
},
{
"epoch": 0.898876404494382,
"grad_norm": 0.7731132242138054,
"learning_rate": 3.990467296012322e-05,
"loss": 0.3127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31191396713256836,
"step": 560,
"valid_targets_mean": 2190.2,
"valid_targets_min": 757
},
{
"epoch": 0.9069020866773676,
"grad_norm": 0.8650619758973038,
"learning_rate": 3.989670602224094e-05,
"loss": 0.2988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32659170031547546,
"step": 565,
"valid_targets_mean": 1817.8,
"valid_targets_min": 869
},
{
"epoch": 0.9149277688603531,
"grad_norm": 0.8114237738910773,
"learning_rate": 3.988842025202358e-05,
"loss": 0.2936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2951407730579376,
"step": 570,
"valid_targets_mean": 2183.2,
"valid_targets_min": 1130
},
{
"epoch": 0.9229534510433387,
"grad_norm": 0.7315127957593782,
"learning_rate": 3.987981578224542e-05,
"loss": 0.3023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3168894648551941,
"step": 575,
"valid_targets_mean": 2335.3,
"valid_targets_min": 963
},
{
"epoch": 0.9309791332263242,
"grad_norm": 0.8198512266606438,
"learning_rate": 3.987089275078776e-05,
"loss": 0.2992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3281818628311157,
"step": 580,
"valid_targets_mean": 1949.1,
"valid_targets_min": 926
},
{
"epoch": 0.9390048154093098,
"grad_norm": 0.9458954789473605,
"learning_rate": 3.986165130063662e-05,
"loss": 0.2847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26376253366470337,
"step": 585,
"valid_targets_mean": 1493.2,
"valid_targets_min": 869
},
{
"epoch": 0.9470304975922953,
"grad_norm": 0.881632921637052,
"learning_rate": 3.985209157988048e-05,
"loss": 0.3026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31336453557014465,
"step": 590,
"valid_targets_mean": 1887.2,
"valid_targets_min": 803
},
{
"epoch": 0.9550561797752809,
"grad_norm": 0.8617456541273046,
"learning_rate": 3.984221374170793e-05,
"loss": 0.2898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2735736072063446,
"step": 595,
"valid_targets_mean": 1538.6,
"valid_targets_min": 638
},
{
"epoch": 0.9630818619582665,
"grad_norm": 0.8672485396619697,
"learning_rate": 3.983201794440517e-05,
"loss": 0.2968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30543556809425354,
"step": 600,
"valid_targets_mean": 2531.9,
"valid_targets_min": 699
},
{
"epoch": 0.971107544141252,
"grad_norm": 0.7590885144559714,
"learning_rate": 3.982150435135353e-05,
"loss": 0.2922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2916344702243805,
"step": 605,
"valid_targets_mean": 2051.1,
"valid_targets_min": 783
},
{
"epoch": 0.9791332263242376,
"grad_norm": 0.7718877500600386,
"learning_rate": 3.981067313102677e-05,
"loss": 0.2868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28497275710105896,
"step": 610,
"valid_targets_mean": 1904.2,
"valid_targets_min": 784
},
{
"epoch": 0.9871589085072231,
"grad_norm": 0.7608096902947907,
"learning_rate": 3.979952445698847e-05,
"loss": 0.2909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26857396960258484,
"step": 615,
"valid_targets_mean": 1962.2,
"valid_targets_min": 744
},
{
"epoch": 0.9951845906902087,
"grad_norm": 0.6228654680626398,
"learning_rate": 3.978805850788919e-05,
"loss": 0.2987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23795419931411743,
"step": 620,
"valid_targets_mean": 2535.7,
"valid_targets_min": 892
},
{
"epoch": 1.0032102728731942,
"grad_norm": 0.8226067743998671,
"learning_rate": 3.9776275467463645e-05,
"loss": 0.2819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2510879337787628,
"step": 625,
"valid_targets_mean": 1790.2,
"valid_targets_min": 940
},
{
"epoch": 1.0112359550561798,
"grad_norm": 0.9254700139665087,
"learning_rate": 3.9764175524527713e-05,
"loss": 0.2686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27632659673690796,
"step": 630,
"valid_targets_mean": 1515.6,
"valid_targets_min": 548
},
{
"epoch": 1.0192616372391654,
"grad_norm": 0.8465617431259781,
"learning_rate": 3.975175887297545e-05,
"loss": 0.2817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30026766657829285,
"step": 635,
"valid_targets_mean": 1732.3,
"valid_targets_min": 798
},
{
"epoch": 1.0272873194221508,
"grad_norm": 0.6931817861755858,
"learning_rate": 3.9739025711775984e-05,
"loss": 0.2677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27642396092414856,
"step": 640,
"valid_targets_mean": 2458.4,
"valid_targets_min": 593
},
{
"epoch": 1.0353130016051364,
"grad_norm": 0.8037354268649257,
"learning_rate": 3.972597624497029e-05,
"loss": 0.2701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27763617038726807,
"step": 645,
"valid_targets_mean": 1996.9,
"valid_targets_min": 916
},
{
"epoch": 1.043338683788122,
"grad_norm": 0.7384503118506207,
"learning_rate": 3.971261068166796e-05,
"loss": 0.2676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24708183109760284,
"step": 650,
"valid_targets_mean": 1862.0,
"valid_targets_min": 768
},
{
"epoch": 1.0513643659711076,
"grad_norm": 0.7212274419919188,
"learning_rate": 3.969892923604383e-05,
"loss": 0.2686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3036978244781494,
"step": 655,
"valid_targets_mean": 2355.9,
"valid_targets_min": 745
},
{
"epoch": 1.0593900481540932,
"grad_norm": 0.843707373832904,
"learning_rate": 3.9684932127334555e-05,
"loss": 0.2824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29731786251068115,
"step": 660,
"valid_targets_mean": 2513.6,
"valid_targets_min": 821
},
{
"epoch": 1.0674157303370786,
"grad_norm": 0.8252091123984003,
"learning_rate": 3.967061957983509e-05,
"loss": 0.2792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2805379629135132,
"step": 665,
"valid_targets_mean": 2306.0,
"valid_targets_min": 928
},
{
"epoch": 1.0754414125200642,
"grad_norm": 0.7679243083152455,
"learning_rate": 3.965599182289511e-05,
"loss": 0.2555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2966977655887604,
"step": 670,
"valid_targets_mean": 2099.9,
"valid_targets_min": 703
},
{
"epoch": 1.0834670947030498,
"grad_norm": 0.7324918129142989,
"learning_rate": 3.964104909091531e-05,
"loss": 0.2663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.273954838514328,
"step": 675,
"valid_targets_mean": 2465.0,
"valid_targets_min": 896
},
{
"epoch": 1.0914927768860354,
"grad_norm": 0.9526343036354475,
"learning_rate": 3.962579162334368e-05,
"loss": 0.2659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2664143145084381,
"step": 680,
"valid_targets_mean": 1999.2,
"valid_targets_min": 933
},
{
"epoch": 1.0995184590690208,
"grad_norm": 0.7991262471661897,
"learning_rate": 3.961021966467165e-05,
"loss": 0.2738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31175559759140015,
"step": 685,
"valid_targets_mean": 2189.3,
"valid_targets_min": 770
},
{
"epoch": 1.1075441412520064,
"grad_norm": 0.7616807096516526,
"learning_rate": 3.9594333464430155e-05,
"loss": 0.2769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2699921429157257,
"step": 690,
"valid_targets_mean": 2126.8,
"valid_targets_min": 868
},
{
"epoch": 1.115569823434992,
"grad_norm": 0.6893907566892634,
"learning_rate": 3.957813327718568e-05,
"loss": 0.2536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2612619996070862,
"step": 695,
"valid_targets_mean": 2350.4,
"valid_targets_min": 1039
},
{
"epoch": 1.1235955056179776,
"grad_norm": 0.759736214908413,
"learning_rate": 3.956161936253615e-05,
"loss": 0.2769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2773323059082031,
"step": 700,
"valid_targets_mean": 2099.1,
"valid_targets_min": 1106
},
{
"epoch": 1.131621187800963,
"grad_norm": 0.7969447025466453,
"learning_rate": 3.954479198510676e-05,
"loss": 0.2837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.284991979598999,
"step": 705,
"valid_targets_mean": 2341.9,
"valid_targets_min": 825
},
{
"epoch": 1.1396468699839486,
"grad_norm": 0.8759437781132143,
"learning_rate": 3.952765141454578e-05,
"loss": 0.2598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2301260232925415,
"step": 710,
"valid_targets_mean": 1502.1,
"valid_targets_min": 802
},
{
"epoch": 1.1476725521669342,
"grad_norm": 1.5236051002273119,
"learning_rate": 3.951019792552018e-05,
"loss": 0.2759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2769410014152527,
"step": 715,
"valid_targets_mean": 1819.7,
"valid_targets_min": 788
},
{
"epoch": 1.1556982343499198,
"grad_norm": 0.8290152147933497,
"learning_rate": 3.949243179771126e-05,
"loss": 0.2765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26144346594810486,
"step": 720,
"valid_targets_mean": 1860.0,
"valid_targets_min": 634
},
{
"epoch": 1.1637239165329052,
"grad_norm": 0.8614047618513456,
"learning_rate": 3.947435331581017e-05,
"loss": 0.264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2969715893268585,
"step": 725,
"valid_targets_mean": 1768.7,
"valid_targets_min": 660
},
{
"epoch": 1.1717495987158908,
"grad_norm": 0.8263928626213929,
"learning_rate": 3.945596276951333e-05,
"loss": 0.2614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2564338147640228,
"step": 730,
"valid_targets_mean": 1887.8,
"valid_targets_min": 799
},
{
"epoch": 1.1797752808988764,
"grad_norm": 0.7152475805264833,
"learning_rate": 3.943726045351782e-05,
"loss": 0.2745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28374791145324707,
"step": 735,
"valid_targets_mean": 2314.3,
"valid_targets_min": 666
},
{
"epoch": 1.187800963081862,
"grad_norm": 0.8571151233033966,
"learning_rate": 3.941824666751659e-05,
"loss": 0.2709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26686954498291016,
"step": 740,
"valid_targets_mean": 1607.6,
"valid_targets_min": 596
},
{
"epoch": 1.1958266452648476,
"grad_norm": 0.86405780600893,
"learning_rate": 3.939892171619375e-05,
"loss": 0.2675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2871187925338745,
"step": 745,
"valid_targets_mean": 1871.7,
"valid_targets_min": 679
},
{
"epoch": 1.203852327447833,
"grad_norm": 0.717709948229875,
"learning_rate": 3.9379285909219616e-05,
"loss": 0.2722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28010597825050354,
"step": 750,
"valid_targets_mean": 2421.4,
"valid_targets_min": 647
},
{
"epoch": 1.2118780096308186,
"grad_norm": 0.654139274364583,
"learning_rate": 3.935933956124578e-05,
"loss": 0.2486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2108229696750641,
"step": 755,
"valid_targets_mean": 1986.1,
"valid_targets_min": 504
},
{
"epoch": 1.2199036918138042,
"grad_norm": 0.7787020251350064,
"learning_rate": 3.933908299190006e-05,
"loss": 0.2538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22526943683624268,
"step": 760,
"valid_targets_mean": 1925.8,
"valid_targets_min": 782
},
{
"epoch": 1.2279293739967898,
"grad_norm": 0.6960673012286028,
"learning_rate": 3.931851652578137e-05,
"loss": 0.2691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28950342535972595,
"step": 765,
"valid_targets_mean": 2596.1,
"valid_targets_min": 715
},
{
"epoch": 1.2359550561797752,
"grad_norm": 0.7791017658890873,
"learning_rate": 3.929764049245454e-05,
"loss": 0.2731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3156774640083313,
"step": 770,
"valid_targets_mean": 2444.2,
"valid_targets_min": 859
},
{
"epoch": 1.2439807383627608,
"grad_norm": 0.7183503125932852,
"learning_rate": 3.9276455226445015e-05,
"loss": 0.2643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3058626055717468,
"step": 775,
"valid_targets_mean": 2245.4,
"valid_targets_min": 850
},
{
"epoch": 1.2520064205457464,
"grad_norm": 0.6695581705684971,
"learning_rate": 3.92549610672335e-05,
"loss": 0.2681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.289934903383255,
"step": 780,
"valid_targets_mean": 2771.9,
"valid_targets_min": 684
},
{
"epoch": 1.260032102728732,
"grad_norm": 0.6866570176470886,
"learning_rate": 3.9233158359250526e-05,
"loss": 0.2608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23689235746860504,
"step": 785,
"valid_targets_mean": 1918.2,
"valid_targets_min": 607
},
{
"epoch": 1.2680577849117176,
"grad_norm": 0.7822630337022523,
"learning_rate": 3.9211047451870925e-05,
"loss": 0.2662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2988463044166565,
"step": 790,
"valid_targets_mean": 2311.7,
"valid_targets_min": 771
},
{
"epoch": 1.276083467094703,
"grad_norm": 0.8317062530284344,
"learning_rate": 3.9188628699408226e-05,
"loss": 0.2749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31084558367729187,
"step": 795,
"valid_targets_mean": 1966.4,
"valid_targets_min": 723
},
{
"epoch": 1.2841091492776886,
"grad_norm": 0.72484686674938,
"learning_rate": 3.916590246110899e-05,
"loss": 0.2561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2934309244155884,
"step": 800,
"valid_targets_mean": 2700.1,
"valid_targets_min": 748
},
{
"epoch": 1.2921348314606742,
"grad_norm": 0.8156555683738264,
"learning_rate": 3.914286910114705e-05,
"loss": 0.2662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29776060581207275,
"step": 805,
"valid_targets_mean": 2074.9,
"valid_targets_min": 705
},
{
"epoch": 1.3001605136436596,
"grad_norm": 0.8183857431272717,
"learning_rate": 3.9119528988617676e-05,
"loss": 0.2539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25548940896987915,
"step": 810,
"valid_targets_mean": 1921.6,
"valid_targets_min": 718
},
{
"epoch": 1.3081861958266452,
"grad_norm": 0.7288663029670344,
"learning_rate": 3.909588249753164e-05,
"loss": 0.2738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2411450296640396,
"step": 815,
"valid_targets_mean": 2309.4,
"valid_targets_min": 779
},
{
"epoch": 1.3162118780096308,
"grad_norm": 0.8147197023616638,
"learning_rate": 3.907193000680924e-05,
"loss": 0.2743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29190874099731445,
"step": 820,
"valid_targets_mean": 1898.1,
"valid_targets_min": 700
},
{
"epoch": 1.3242375601926164,
"grad_norm": 0.8065187260999866,
"learning_rate": 3.9047671900274256e-05,
"loss": 0.256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2601572275161743,
"step": 825,
"valid_targets_mean": 1808.4,
"valid_targets_min": 658
},
{
"epoch": 1.332263242375602,
"grad_norm": 0.8207215518210806,
"learning_rate": 3.9023108566647746e-05,
"loss": 0.2575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2769230604171753,
"step": 830,
"valid_targets_mean": 2078.6,
"valid_targets_min": 613
},
{
"epoch": 1.3402889245585876,
"grad_norm": 0.924972736057203,
"learning_rate": 3.899824039954185e-05,
"loss": 0.2565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24372698366641998,
"step": 835,
"valid_targets_mean": 1450.0,
"valid_targets_min": 648
},
{
"epoch": 1.348314606741573,
"grad_norm": 0.714092931128622,
"learning_rate": 3.897306779745347e-05,
"loss": 0.2789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.271422415971756,
"step": 840,
"valid_targets_mean": 2285.3,
"valid_targets_min": 735
},
{
"epoch": 1.3563402889245586,
"grad_norm": 0.8417283546200632,
"learning_rate": 3.89475911637579e-05,
"loss": 0.2758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2518080770969391,
"step": 845,
"valid_targets_mean": 1609.2,
"valid_targets_min": 621
},
{
"epoch": 1.3643659711075442,
"grad_norm": 0.7852542096242522,
"learning_rate": 3.892181090670233e-05,
"loss": 0.2755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2653108239173889,
"step": 850,
"valid_targets_mean": 1744.6,
"valid_targets_min": 806
},
{
"epoch": 1.3723916532905296,
"grad_norm": 0.7958802575764924,
"learning_rate": 3.8895727439399366e-05,
"loss": 0.2567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2511981129646301,
"step": 855,
"valid_targets_mean": 1641.1,
"valid_targets_min": 1017
},
{
"epoch": 1.3804173354735152,
"grad_norm": 0.7781458043061429,
"learning_rate": 3.8869341179820314e-05,
"loss": 0.2689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2821986973285675,
"step": 860,
"valid_targets_mean": 2122.4,
"valid_targets_min": 882
},
{
"epoch": 1.3884430176565008,
"grad_norm": 0.9086989564254825,
"learning_rate": 3.884265255078859e-05,
"loss": 0.2651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2702217102050781,
"step": 865,
"valid_targets_mean": 1887.4,
"valid_targets_min": 746
},
{
"epoch": 1.3964686998394864,
"grad_norm": 0.774043855966981,
"learning_rate": 3.881566197997286e-05,
"loss": 0.2624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2534475326538086,
"step": 870,
"valid_targets_mean": 2067.0,
"valid_targets_min": 919
},
{
"epoch": 1.404494382022472,
"grad_norm": 0.7066842171984723,
"learning_rate": 3.8788369899880225e-05,
"loss": 0.2629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28810229897499084,
"step": 875,
"valid_targets_mean": 2462.9,
"valid_targets_min": 762
},
{
"epoch": 1.4125200642054574,
"grad_norm": 0.7708815207296795,
"learning_rate": 3.8760776747849303e-05,
"loss": 0.2641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26532846689224243,
"step": 880,
"valid_targets_mean": 1815.2,
"valid_targets_min": 764
},
{
"epoch": 1.420545746388443,
"grad_norm": 0.75205317271865,
"learning_rate": 3.873288296604317e-05,
"loss": 0.2761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2786597013473511,
"step": 885,
"valid_targets_mean": 1939.7,
"valid_targets_min": 894
},
{
"epoch": 1.4285714285714286,
"grad_norm": 0.672307215560877,
"learning_rate": 3.870468900144233e-05,
"loss": 0.2782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28444236516952515,
"step": 890,
"valid_targets_mean": 2277.8,
"valid_targets_min": 836
},
{
"epoch": 1.4365971107544142,
"grad_norm": 0.6608204156050805,
"learning_rate": 3.8676195305837536e-05,
"loss": 0.2557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2395007461309433,
"step": 895,
"valid_targets_mean": 2169.6,
"valid_targets_min": 656
},
{
"epoch": 1.4446227929373996,
"grad_norm": 0.7138327208605213,
"learning_rate": 3.864740233582252e-05,
"loss": 0.2817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2664600908756256,
"step": 900,
"valid_targets_mean": 2115.5,
"valid_targets_min": 467
},
{
"epoch": 1.4526484751203852,
"grad_norm": 0.6925022486252039,
"learning_rate": 3.8618310552786715e-05,
"loss": 0.2631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2339175045490265,
"step": 905,
"valid_targets_mean": 2044.7,
"valid_targets_min": 748
},
{
"epoch": 1.4606741573033708,
"grad_norm": 0.8534400357923534,
"learning_rate": 3.858892042290785e-05,
"loss": 0.2625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29541435837745667,
"step": 910,
"valid_targets_mean": 1677.3,
"valid_targets_min": 761
},
{
"epoch": 1.4686998394863564,
"grad_norm": 0.7239107539611367,
"learning_rate": 3.855923241714447e-05,
"loss": 0.268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27571260929107666,
"step": 915,
"valid_targets_mean": 2073.4,
"valid_targets_min": 675
},
{
"epoch": 1.476725521669342,
"grad_norm": 0.8487942181629813,
"learning_rate": 3.852924701122839e-05,
"loss": 0.2654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29242533445358276,
"step": 920,
"valid_targets_mean": 1567.2,
"valid_targets_min": 713
},
{
"epoch": 1.4847512038523274,
"grad_norm": 0.7010812875356174,
"learning_rate": 3.8498964685657084e-05,
"loss": 0.2678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28116998076438904,
"step": 925,
"valid_targets_mean": 2125.7,
"valid_targets_min": 797
},
{
"epoch": 1.492776886035313,
"grad_norm": 0.7241807089136368,
"learning_rate": 3.846838592568599e-05,
"loss": 0.2684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28465375304222107,
"step": 930,
"valid_targets_mean": 2401.2,
"valid_targets_min": 694
},
{
"epoch": 1.5008025682182986,
"grad_norm": 0.7316004281768466,
"learning_rate": 3.84375112213207e-05,
"loss": 0.2645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25454214215278625,
"step": 935,
"valid_targets_mean": 1856.4,
"valid_targets_min": 764
},
{
"epoch": 1.508828250401284,
"grad_norm": 0.7770880009110686,
"learning_rate": 3.840634106730915e-05,
"loss": 0.2577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24702686071395874,
"step": 940,
"valid_targets_mean": 1784.5,
"valid_targets_min": 854
},
{
"epoch": 1.5168539325842696,
"grad_norm": 0.7275439210958472,
"learning_rate": 3.837487596313366e-05,
"loss": 0.2743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28921470046043396,
"step": 945,
"valid_targets_mean": 1958.6,
"valid_targets_min": 1030
},
{
"epoch": 1.5248796147672552,
"grad_norm": 0.7295956985847399,
"learning_rate": 3.834311641300296e-05,
"loss": 0.2458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2506203055381775,
"step": 950,
"valid_targets_mean": 2109.1,
"valid_targets_min": 875
},
{
"epoch": 1.5329052969502408,
"grad_norm": 0.7788207921479691,
"learning_rate": 3.831106292584406e-05,
"loss": 0.2625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2641506493091583,
"step": 955,
"valid_targets_mean": 1837.2,
"valid_targets_min": 635
},
{
"epoch": 1.5409309791332264,
"grad_norm": 1.0545045402423714,
"learning_rate": 3.827871601529417e-05,
"loss": 0.2701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28296715021133423,
"step": 960,
"valid_targets_mean": 1895.5,
"valid_targets_min": 1085
},
{
"epoch": 1.548956661316212,
"grad_norm": 0.8057606395413027,
"learning_rate": 3.8246076199692395e-05,
"loss": 0.2581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2991617023944855,
"step": 965,
"valid_targets_mean": 2077.7,
"valid_targets_min": 722
},
{
"epoch": 1.5569823434991974,
"grad_norm": 0.6927010096471385,
"learning_rate": 3.821314400207148e-05,
"loss": 0.2614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2451082170009613,
"step": 970,
"valid_targets_mean": 1981.5,
"valid_targets_min": 898
},
{
"epoch": 1.565008025682183,
"grad_norm": 0.7110441501753103,
"learning_rate": 3.817991995014939e-05,
"loss": 0.263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29124924540519714,
"step": 975,
"valid_targets_mean": 2240.8,
"valid_targets_min": 642
},
{
"epoch": 1.5730337078651684,
"grad_norm": 0.6885281006909981,
"learning_rate": 3.8146404576320894e-05,
"loss": 0.2476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23632869124412537,
"step": 980,
"valid_targets_mean": 1979.8,
"valid_targets_min": 657
},
{
"epoch": 1.581059390048154,
"grad_norm": 0.7522169112208279,
"learning_rate": 3.8112598417649015e-05,
"loss": 0.2664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2756073772907257,
"step": 985,
"valid_targets_mean": 2060.7,
"valid_targets_min": 663
},
{
"epoch": 1.5890850722311396,
"grad_norm": 0.8786648311794397,
"learning_rate": 3.80785020158564e-05,
"loss": 0.2627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25147706270217896,
"step": 990,
"valid_targets_mean": 1561.0,
"valid_targets_min": 793
},
{
"epoch": 1.5971107544141252,
"grad_norm": 0.7195963819191232,
"learning_rate": 3.804411591731668e-05,
"loss": 0.2649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2796766459941864,
"step": 995,
"valid_targets_mean": 2145.2,
"valid_targets_min": 892
},
{
"epoch": 1.6051364365971108,
"grad_norm": 0.8812045734435614,
"learning_rate": 3.80094406730457e-05,
"loss": 0.2634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23850060999393463,
"step": 1000,
"valid_targets_mean": 2386.0,
"valid_targets_min": 732
},
{
"epoch": 1.6131621187800964,
"grad_norm": 0.7667863911451553,
"learning_rate": 3.7974476838692656e-05,
"loss": 0.2635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.268310546875,
"step": 1005,
"valid_targets_mean": 1975.6,
"valid_targets_min": 748
},
{
"epoch": 1.621187800963082,
"grad_norm": 0.7545530524527456,
"learning_rate": 3.793922497453124e-05,
"loss": 0.2479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.234517440199852,
"step": 1010,
"valid_targets_mean": 1716.2,
"valid_targets_min": 649
},
{
"epoch": 1.6292134831460674,
"grad_norm": 0.7013505596294985,
"learning_rate": 3.790368564545067e-05,
"loss": 0.2607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28479787707328796,
"step": 1015,
"valid_targets_mean": 2393.4,
"valid_targets_min": 684
},
{
"epoch": 1.637239165329053,
"grad_norm": 0.8351965152529512,
"learning_rate": 3.786785942094656e-05,
"loss": 0.2544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2289065718650818,
"step": 1020,
"valid_targets_mean": 1477.6,
"valid_targets_min": 244
},
{
"epoch": 1.6452648475120384,
"grad_norm": 0.8048989954188138,
"learning_rate": 3.783174687511188e-05,
"loss": 0.2614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24464435875415802,
"step": 1025,
"valid_targets_mean": 1876.4,
"valid_targets_min": 810
},
{
"epoch": 1.653290529695024,
"grad_norm": 0.6657920575704092,
"learning_rate": 3.7795348586627696e-05,
"loss": 0.2563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2421034723520279,
"step": 1030,
"valid_targets_mean": 2440.4,
"valid_targets_min": 704
},
{
"epoch": 1.6613162118780096,
"grad_norm": 0.6978432635250694,
"learning_rate": 3.7758665138753943e-05,
"loss": 0.2774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25340160727500916,
"step": 1035,
"valid_targets_mean": 2174.9,
"valid_targets_min": 604
},
{
"epoch": 1.6693418940609952,
"grad_norm": 0.7036409883833363,
"learning_rate": 3.7721697119320054e-05,
"loss": 0.2734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2678963541984558,
"step": 1040,
"valid_targets_mean": 2500.4,
"valid_targets_min": 750
},
{
"epoch": 1.6773675762439808,
"grad_norm": 0.7683015358822927,
"learning_rate": 3.768444512071553e-05,
"loss": 0.2525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24290819466114044,
"step": 1045,
"valid_targets_mean": 1559.9,
"valid_targets_min": 611
},
{
"epoch": 1.6853932584269664,
"grad_norm": 0.7747543733128794,
"learning_rate": 3.7646909739880486e-05,
"loss": 0.2688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3120294213294983,
"step": 1050,
"valid_targets_mean": 2086.7,
"valid_targets_min": 564
},
{
"epoch": 1.6934189406099518,
"grad_norm": 0.7582150632753363,
"learning_rate": 3.760909157829604e-05,
"loss": 0.2697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2633521556854248,
"step": 1055,
"valid_targets_mean": 1768.8,
"valid_targets_min": 700
},
{
"epoch": 1.7014446227929374,
"grad_norm": 0.782741178401804,
"learning_rate": 3.75709912419747e-05,
"loss": 0.2615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2791171669960022,
"step": 1060,
"valid_targets_mean": 1728.7,
"valid_targets_min": 909
},
{
"epoch": 1.709470304975923,
"grad_norm": 0.8113224135725746,
"learning_rate": 3.7532609341450655e-05,
"loss": 0.2662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.257160484790802,
"step": 1065,
"valid_targets_mean": 2120.3,
"valid_targets_min": 773
},
{
"epoch": 1.7174959871589084,
"grad_norm": 0.7462354824079133,
"learning_rate": 3.749394649176998e-05,
"loss": 0.2646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2856426239013672,
"step": 1070,
"valid_targets_mean": 2123.1,
"valid_targets_min": 765
},
{
"epoch": 1.725521669341894,
"grad_norm": 0.7126762615208581,
"learning_rate": 3.745500331248078e-05,
"loss": 0.2515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24018818140029907,
"step": 1075,
"valid_targets_mean": 1817.8,
"valid_targets_min": 865
},
{
"epoch": 1.7335473515248796,
"grad_norm": 0.6898127387055668,
"learning_rate": 3.741578042762329e-05,
"loss": 0.2599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26695871353149414,
"step": 1080,
"valid_targets_mean": 2342.2,
"valid_targets_min": 770
},
{
"epoch": 1.7415730337078652,
"grad_norm": 0.66757954744143,
"learning_rate": 3.737627846571982e-05,
"loss": 0.2467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22607743740081787,
"step": 1085,
"valid_targets_mean": 2161.1,
"valid_targets_min": 856
},
{
"epoch": 1.7495987158908508,
"grad_norm": 0.6652154306317639,
"learning_rate": 3.733649805976474e-05,
"loss": 0.2564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2927885055541992,
"step": 1090,
"valid_targets_mean": 2548.8,
"valid_targets_min": 715
},
{
"epoch": 1.7576243980738364,
"grad_norm": 0.7237170273830091,
"learning_rate": 3.729643984721431e-05,
"loss": 0.2477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2599429190158844,
"step": 1095,
"valid_targets_mean": 2250.6,
"valid_targets_min": 1026
},
{
"epoch": 1.7656500802568218,
"grad_norm": 0.7141988738983245,
"learning_rate": 3.725610446997646e-05,
"loss": 0.2667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2560562193393707,
"step": 1100,
"valid_targets_mean": 2340.1,
"valid_targets_min": 788
},
{
"epoch": 1.7736757624398074,
"grad_norm": 1.1500842386133312,
"learning_rate": 3.7215492574400514e-05,
"loss": 0.275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30140018463134766,
"step": 1105,
"valid_targets_mean": 2404.6,
"valid_targets_min": 691
},
{
"epoch": 1.7817014446227928,
"grad_norm": 0.6808585287726022,
"learning_rate": 3.717460481126684e-05,
"loss": 0.2703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3125297427177429,
"step": 1110,
"valid_targets_mean": 2692.1,
"valid_targets_min": 912
},
{
"epoch": 1.7897271268057784,
"grad_norm": 0.7248268534788489,
"learning_rate": 3.7133441835776386e-05,
"loss": 0.2792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2808183431625366,
"step": 1115,
"valid_targets_mean": 2375.7,
"valid_targets_min": 878
},
{
"epoch": 1.797752808988764,
"grad_norm": 0.8633733319106702,
"learning_rate": 3.7092004307540235e-05,
"loss": 0.2577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29408037662506104,
"step": 1120,
"valid_targets_mean": 1460.2,
"valid_targets_min": 750
},
{
"epoch": 1.8057784911717496,
"grad_norm": 0.7680940895196984,
"learning_rate": 3.7050292890568995e-05,
"loss": 0.2916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2827860116958618,
"step": 1125,
"valid_targets_mean": 2280.7,
"valid_targets_min": 699
},
{
"epoch": 1.8138041733547352,
"grad_norm": 0.7869442484722307,
"learning_rate": 3.700830825326218e-05,
"loss": 0.2661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26617157459259033,
"step": 1130,
"valid_targets_mean": 1957.4,
"valid_targets_min": 824
},
{
"epoch": 1.8218298555377208,
"grad_norm": 0.7696885298751593,
"learning_rate": 3.696605106839747e-05,
"loss": 0.2939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2644560933113098,
"step": 1135,
"valid_targets_mean": 1796.3,
"valid_targets_min": 715
},
{
"epoch": 1.8298555377207064,
"grad_norm": 0.8922311571098936,
"learning_rate": 3.6923522013119964e-05,
"loss": 0.2555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2608848214149475,
"step": 1140,
"valid_targets_mean": 1475.7,
"valid_targets_min": 710
},
{
"epoch": 1.8378812199036918,
"grad_norm": 0.6335228244683325,
"learning_rate": 3.688072176893132e-05,
"loss": 0.2682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.288246750831604,
"step": 1145,
"valid_targets_mean": 2936.8,
"valid_targets_min": 645
},
{
"epoch": 1.8459069020866774,
"grad_norm": 0.7476777076459231,
"learning_rate": 3.683765102167881e-05,
"loss": 0.2552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27494877576828003,
"step": 1150,
"valid_targets_mean": 2268.6,
"valid_targets_min": 698
},
{
"epoch": 1.8539325842696628,
"grad_norm": 0.7507784672507724,
"learning_rate": 3.679431046154438e-05,
"loss": 0.2557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27138835191726685,
"step": 1155,
"valid_targets_mean": 2028.2,
"valid_targets_min": 820
},
{
"epoch": 1.8619582664526484,
"grad_norm": 0.775484617594402,
"learning_rate": 3.675070078303352e-05,
"loss": 0.2617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2535039782524109,
"step": 1160,
"valid_targets_mean": 1500.2,
"valid_targets_min": 692
},
{
"epoch": 1.869983948635634,
"grad_norm": 0.7919636650285514,
"learning_rate": 3.670682268496421e-05,
"loss": 0.2554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28811001777648926,
"step": 1165,
"valid_targets_mean": 2233.0,
"valid_targets_min": 778
},
{
"epoch": 1.8780096308186196,
"grad_norm": 0.8269276141613667,
"learning_rate": 3.6662676870455676e-05,
"loss": 0.2575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22544220089912415,
"step": 1170,
"valid_targets_mean": 1450.8,
"valid_targets_min": 632
},
{
"epoch": 1.8860353130016052,
"grad_norm": 0.7176606864299451,
"learning_rate": 3.661826404691712e-05,
"loss": 0.2548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2399870753288269,
"step": 1175,
"valid_targets_mean": 1901.9,
"valid_targets_min": 703
},
{
"epoch": 1.8940609951845908,
"grad_norm": 0.6785006811736799,
"learning_rate": 3.657358492603641e-05,
"loss": 0.2719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28619182109832764,
"step": 1180,
"valid_targets_mean": 2383.9,
"valid_targets_min": 773
},
{
"epoch": 1.9020866773675762,
"grad_norm": 0.7006806520786782,
"learning_rate": 3.652864022376866e-05,
"loss": 0.2548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2502840459346771,
"step": 1185,
"valid_targets_mean": 2024.3,
"valid_targets_min": 744
},
{
"epoch": 1.9101123595505618,
"grad_norm": 0.7555474304079293,
"learning_rate": 3.648343066032476e-05,
"loss": 0.2659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22855910658836365,
"step": 1190,
"valid_targets_mean": 1711.2,
"valid_targets_min": 641
},
{
"epoch": 1.9181380417335474,
"grad_norm": 0.7676954013858329,
"learning_rate": 3.643795696015985e-05,
"loss": 0.2515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26554515957832336,
"step": 1195,
"valid_targets_mean": 1831.3,
"valid_targets_min": 675
},
{
"epoch": 1.9261637239165328,
"grad_norm": 5.5556263099749215,
"learning_rate": 3.639221985196166e-05,
"loss": 0.2483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2238149791955948,
"step": 1200,
"valid_targets_mean": 1427.6,
"valid_targets_min": 727
},
{
"epoch": 1.9341894060995184,
"grad_norm": 0.7081355832362357,
"learning_rate": 3.634622006863891e-05,
"loss": 0.2597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2723257541656494,
"step": 1205,
"valid_targets_mean": 2102.0,
"valid_targets_min": 522
},
{
"epoch": 1.942215088282504,
"grad_norm": 0.7197674750606493,
"learning_rate": 3.62999583473095e-05,
"loss": 0.272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2823481857776642,
"step": 1210,
"valid_targets_mean": 1959.4,
"valid_targets_min": 620
},
{
"epoch": 1.9502407704654896,
"grad_norm": 0.7351267896359547,
"learning_rate": 3.625343542928874e-05,
"loss": 0.2515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23494531214237213,
"step": 1215,
"valid_targets_mean": 1691.6,
"valid_targets_min": 721
},
{
"epoch": 1.9582664526484752,
"grad_norm": 0.8091637524191202,
"learning_rate": 3.620665206007744e-05,
"loss": 0.2528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2615356743335724,
"step": 1220,
"valid_targets_mean": 1755.5,
"valid_targets_min": 625
},
{
"epoch": 1.9662921348314608,
"grad_norm": 0.630617638795346,
"learning_rate": 3.615960898934999e-05,
"loss": 0.2705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2906268835067749,
"step": 1225,
"valid_targets_mean": 2880.1,
"valid_targets_min": 797
},
{
"epoch": 1.9743178170144462,
"grad_norm": 0.698026717328934,
"learning_rate": 3.6112306970942334e-05,
"loss": 0.2593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24983006715774536,
"step": 1230,
"valid_targets_mean": 1999.2,
"valid_targets_min": 822
},
{
"epoch": 1.9823434991974318,
"grad_norm": 0.7323645627563731,
"learning_rate": 3.606474676283987e-05,
"loss": 0.2657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2904243469238281,
"step": 1235,
"valid_targets_mean": 2122.1,
"valid_targets_min": 707
},
{
"epoch": 1.9903691813804172,
"grad_norm": 0.6960742489484173,
"learning_rate": 3.6016929127165365e-05,
"loss": 0.2821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2649298906326294,
"step": 1240,
"valid_targets_mean": 2274.1,
"valid_targets_min": 917
},
{
"epoch": 1.9983948635634028,
"grad_norm": 0.7269920662477591,
"learning_rate": 3.5968854830166666e-05,
"loss": 0.262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26873061060905457,
"step": 1245,
"valid_targets_mean": 2070.6,
"valid_targets_min": 677
},
{
"epoch": 2.0064205457463884,
"grad_norm": 0.6264465786385531,
"learning_rate": 3.592052464220447e-05,
"loss": 0.2386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20619434118270874,
"step": 1250,
"valid_targets_mean": 2345.5,
"valid_targets_min": 623
},
{
"epoch": 2.014446227929374,
"grad_norm": 0.8060408716572437,
"learning_rate": 3.587193933773998e-05,
"loss": 0.2143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22666709125041962,
"step": 1255,
"valid_targets_mean": 1974.3,
"valid_targets_min": 855
},
{
"epoch": 2.0224719101123596,
"grad_norm": 0.6893664644285946,
"learning_rate": 3.582309969532247e-05,
"loss": 0.217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21046797931194305,
"step": 1260,
"valid_targets_mean": 2176.0,
"valid_targets_min": 753
},
{
"epoch": 2.030497592295345,
"grad_norm": 0.7574788853071039,
"learning_rate": 3.577400649757682e-05,
"loss": 0.219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18405956029891968,
"step": 1265,
"valid_targets_mean": 1458.5,
"valid_targets_min": 570
},
{
"epoch": 2.038523274478331,
"grad_norm": 0.7882212386208145,
"learning_rate": 3.572466053119099e-05,
"loss": 0.2304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25198838114738464,
"step": 1270,
"valid_targets_mean": 1880.4,
"valid_targets_min": 753
},
{
"epoch": 2.0465489566613164,
"grad_norm": 0.8196333002543982,
"learning_rate": 3.567506258690338e-05,
"loss": 0.2222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22230197489261627,
"step": 1275,
"valid_targets_mean": 1761.6,
"valid_targets_min": 819
},
{
"epoch": 2.0545746388443016,
"grad_norm": 0.848915909008126,
"learning_rate": 3.562521345949018e-05,
"loss": 0.223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2496098428964615,
"step": 1280,
"valid_targets_mean": 2336.7,
"valid_targets_min": 627
},
{
"epoch": 2.062600321027287,
"grad_norm": 0.8863737442776473,
"learning_rate": 3.5575113947752666e-05,
"loss": 0.2352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24262848496437073,
"step": 1285,
"valid_targets_mean": 1759.6,
"valid_targets_min": 695
},
{
"epoch": 2.070626003210273,
"grad_norm": 0.7589911362614817,
"learning_rate": 3.552476485450434e-05,
"loss": 0.2256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22207708656787872,
"step": 1290,
"valid_targets_mean": 1856.1,
"valid_targets_min": 646
},
{
"epoch": 2.0786516853932584,
"grad_norm": 0.9495179896994681,
"learning_rate": 3.547416698655807e-05,
"loss": 0.219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25257399678230286,
"step": 1295,
"valid_targets_mean": 2386.2,
"valid_targets_min": 639
},
{
"epoch": 2.086677367576244,
"grad_norm": 0.7221290673835988,
"learning_rate": 3.5423321154713245e-05,
"loss": 0.2224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22047732770442963,
"step": 1300,
"valid_targets_mean": 2135.1,
"valid_targets_min": 742
},
{
"epoch": 2.0947030497592296,
"grad_norm": 0.8574890872992614,
"learning_rate": 3.537222817374266e-05,
"loss": 0.2212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18799078464508057,
"step": 1305,
"valid_targets_mean": 1523.1,
"valid_targets_min": 785
},
{
"epoch": 2.102728731942215,
"grad_norm": 0.7745571983724101,
"learning_rate": 3.532088886237956e-05,
"loss": 0.227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2367406189441681,
"step": 1310,
"valid_targets_mean": 1826.2,
"valid_targets_min": 819
},
{
"epoch": 2.110754414125201,
"grad_norm": 0.7807741896820481,
"learning_rate": 3.526930404330447e-05,
"loss": 0.2226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2241775095462799,
"step": 1315,
"valid_targets_mean": 1756.4,
"valid_targets_min": 919
},
{
"epoch": 2.1187800963081864,
"grad_norm": 0.8548618903538644,
"learning_rate": 3.521747454313201e-05,
"loss": 0.2225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2160843312740326,
"step": 1320,
"valid_targets_mean": 1812.9,
"valid_targets_min": 1086
},
{
"epoch": 2.1268057784911716,
"grad_norm": 0.776344012436439,
"learning_rate": 3.516540119239769e-05,
"loss": 0.2167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22034770250320435,
"step": 1325,
"valid_targets_mean": 1766.5,
"valid_targets_min": 801
},
{
"epoch": 2.134831460674157,
"grad_norm": 1.2889351825397468,
"learning_rate": 3.511308482554454e-05,
"loss": 0.2266,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24177859723567963,
"step": 1330,
"valid_targets_mean": 2334.4,
"valid_targets_min": 572
},
{
"epoch": 2.142857142857143,
"grad_norm": 0.8008461502115394,
"learning_rate": 3.506052628090981e-05,
"loss": 0.22,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21476683020591736,
"step": 1335,
"valid_targets_mean": 2030.2,
"valid_targets_min": 661
},
{
"epoch": 2.1508828250401284,
"grad_norm": 0.810451115473788,
"learning_rate": 3.500772640071145e-05,
"loss": 0.2349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22298628091812134,
"step": 1340,
"valid_targets_mean": 1712.6,
"valid_targets_min": 850
},
{
"epoch": 2.158908507223114,
"grad_norm": 0.7573148185013651,
"learning_rate": 3.495468603103472e-05,
"loss": 0.2469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24540317058563232,
"step": 1345,
"valid_targets_mean": 2262.4,
"valid_targets_min": 1157
},
{
"epoch": 2.1669341894060996,
"grad_norm": 0.7168592022709548,
"learning_rate": 3.4901406021818526e-05,
"loss": 0.2104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22075840830802917,
"step": 1350,
"valid_targets_mean": 2246.2,
"valid_targets_min": 776
},
{
"epoch": 2.174959871589085,
"grad_norm": 0.8065302620751352,
"learning_rate": 3.4847887226841874e-05,
"loss": 0.2149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21199846267700195,
"step": 1355,
"valid_targets_mean": 1803.8,
"valid_targets_min": 740
},
{
"epoch": 2.182985553772071,
"grad_norm": 0.6668455625016351,
"learning_rate": 3.479413050371016e-05,
"loss": 0.2101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20517484843730927,
"step": 1360,
"valid_targets_mean": 2204.4,
"valid_targets_min": 714
},
{
"epoch": 2.191011235955056,
"grad_norm": 0.7616659943300983,
"learning_rate": 3.4740136713841416e-05,
"loss": 0.238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22425301373004913,
"step": 1365,
"valid_targets_mean": 1955.1,
"valid_targets_min": 692
},
{
"epoch": 2.1990369181380416,
"grad_norm": 0.765106380987224,
"learning_rate": 3.4685906722452537e-05,
"loss": 0.226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20790395140647888,
"step": 1370,
"valid_targets_mean": 2030.4,
"valid_targets_min": 873
},
{
"epoch": 2.207062600321027,
"grad_norm": 0.8408989245850991,
"learning_rate": 3.4631441398545394e-05,
"loss": 0.2069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20086929202079773,
"step": 1375,
"valid_targets_mean": 1581.3,
"valid_targets_min": 635
},
{
"epoch": 2.215088282504013,
"grad_norm": 0.7954396264203275,
"learning_rate": 3.4576741614892925e-05,
"loss": 0.2278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23235668241977692,
"step": 1380,
"valid_targets_mean": 2279.1,
"valid_targets_min": 950
},
{
"epoch": 2.2231139646869984,
"grad_norm": 0.7874064449767312,
"learning_rate": 3.452180824802512e-05,
"loss": 0.2374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2614269554615021,
"step": 1385,
"valid_targets_mean": 2237.8,
"valid_targets_min": 681
},
{
"epoch": 2.231139646869984,
"grad_norm": 0.7379527533621459,
"learning_rate": 3.4466642178215015e-05,
"loss": 0.2221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24073539674282074,
"step": 1390,
"valid_targets_mean": 2265.8,
"valid_targets_min": 774
},
{
"epoch": 2.2391653290529696,
"grad_norm": 0.683724568782726,
"learning_rate": 3.441124428946455e-05,
"loss": 0.2207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2088882178068161,
"step": 1395,
"valid_targets_mean": 2312.8,
"valid_targets_min": 661
},
{
"epoch": 2.247191011235955,
"grad_norm": 0.697858810104743,
"learning_rate": 3.435561546949043e-05,
"loss": 0.2199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25173261761665344,
"step": 1400,
"valid_targets_mean": 2850.9,
"valid_targets_min": 1085
},
{
"epoch": 2.255216693418941,
"grad_norm": 0.7114309986626526,
"learning_rate": 3.429975660970988e-05,
"loss": 0.213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.234367236495018,
"step": 1405,
"valid_targets_mean": 2420.1,
"valid_targets_min": 823
},
{
"epoch": 2.263242375601926,
"grad_norm": 0.7461264034166555,
"learning_rate": 3.424366860522638e-05,
"loss": 0.2182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23270238935947418,
"step": 1410,
"valid_targets_mean": 1986.1,
"valid_targets_min": 793
},
{
"epoch": 2.2712680577849116,
"grad_norm": 0.6975362183207242,
"learning_rate": 3.41873523548153e-05,
"loss": 0.2333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19744381308555603,
"step": 1415,
"valid_targets_mean": 1985.9,
"valid_targets_min": 1006
},
{
"epoch": 2.279293739967897,
"grad_norm": 0.7633475145958678,
"learning_rate": 3.413080876090952e-05,
"loss": 0.223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2305845320224762,
"step": 1420,
"valid_targets_mean": 2110.4,
"valid_targets_min": 1051
},
{
"epoch": 2.287319422150883,
"grad_norm": 0.6987877696053163,
"learning_rate": 3.4074038729584955e-05,
"loss": 0.2212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18873882293701172,
"step": 1425,
"valid_targets_mean": 2079.9,
"valid_targets_min": 748
},
{
"epoch": 2.2953451043338684,
"grad_norm": 0.8229960285752915,
"learning_rate": 3.401704317054604e-05,
"loss": 0.2279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22099998593330383,
"step": 1430,
"valid_targets_mean": 1742.9,
"valid_targets_min": 709
},
{
"epoch": 2.303370786516854,
"grad_norm": 0.7979213067997468,
"learning_rate": 3.395982299711114e-05,
"loss": 0.2241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23837853968143463,
"step": 1435,
"valid_targets_mean": 2065.1,
"valid_targets_min": 734
},
{
"epoch": 2.3113964686998396,
"grad_norm": 0.7410217576693533,
"learning_rate": 3.390237912619793e-05,
"loss": 0.2278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19628407061100006,
"step": 1440,
"valid_targets_mean": 1947.8,
"valid_targets_min": 725
},
{
"epoch": 2.319422150882825,
"grad_norm": 0.725538489703123,
"learning_rate": 3.384471247830872e-05,
"loss": 0.2319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22274473309516907,
"step": 1445,
"valid_targets_mean": 2046.8,
"valid_targets_min": 846
},
{
"epoch": 2.3274478330658104,
"grad_norm": 0.7718380143410368,
"learning_rate": 3.378682397751565e-05,
"loss": 0.2265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2532963156700134,
"step": 1450,
"valid_targets_mean": 2101.1,
"valid_targets_min": 737
},
{
"epoch": 2.335473515248796,
"grad_norm": 0.8011655529732985,
"learning_rate": 3.372871455144593e-05,
"loss": 0.2219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23601312935352325,
"step": 1455,
"valid_targets_mean": 1879.2,
"valid_targets_min": 822
},
{
"epoch": 2.3434991974317816,
"grad_norm": 0.9443935694282609,
"learning_rate": 3.367038513126697e-05,
"loss": 0.2262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.206557959318161,
"step": 1460,
"valid_targets_mean": 1639.8,
"valid_targets_min": 648
},
{
"epoch": 2.351524879614767,
"grad_norm": 0.7339382552691981,
"learning_rate": 3.3611836651671426e-05,
"loss": 0.2255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23191966116428375,
"step": 1465,
"valid_targets_mean": 2068.2,
"valid_targets_min": 670
},
{
"epoch": 2.359550561797753,
"grad_norm": 0.7882153069080308,
"learning_rate": 3.355307005086226e-05,
"loss": 0.2284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20615904033184052,
"step": 1470,
"valid_targets_mean": 1522.9,
"valid_targets_min": 760
},
{
"epoch": 2.3675762439807384,
"grad_norm": 0.7562840977782597,
"learning_rate": 3.34940862705377e-05,
"loss": 0.2126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1904546320438385,
"step": 1475,
"valid_targets_mean": 1568.2,
"valid_targets_min": 696
},
{
"epoch": 2.375601926163724,
"grad_norm": 0.8538351538237444,
"learning_rate": 3.3434886255876106e-05,
"loss": 0.2375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25030791759490967,
"step": 1480,
"valid_targets_mean": 2046.1,
"valid_targets_min": 790
},
{
"epoch": 2.3836276083467096,
"grad_norm": 0.7220287827741136,
"learning_rate": 3.33754709555209e-05,
"loss": 0.23,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2569080591201782,
"step": 1485,
"valid_targets_mean": 2494.1,
"valid_targets_min": 788
},
{
"epoch": 2.391653290529695,
"grad_norm": 0.7818531275905918,
"learning_rate": 3.33158413215653e-05,
"loss": 0.2294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2130444347858429,
"step": 1490,
"valid_targets_mean": 1575.5,
"valid_targets_min": 652
},
{
"epoch": 2.399678972712681,
"grad_norm": 0.7625675101581627,
"learning_rate": 3.325599830953708e-05,
"loss": 0.2155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21467597782611847,
"step": 1495,
"valid_targets_mean": 2187.6,
"valid_targets_min": 722
},
{
"epoch": 2.407704654895666,
"grad_norm": 0.7704348694195301,
"learning_rate": 3.31959428783833e-05,
"loss": 0.2318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2410392463207245,
"step": 1500,
"valid_targets_mean": 2143.1,
"valid_targets_min": 785
},
{
"epoch": 2.4157303370786516,
"grad_norm": 0.6834706733838948,
"learning_rate": 3.3135675990454856e-05,
"loss": 0.2332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22266864776611328,
"step": 1505,
"valid_targets_mean": 2381.1,
"valid_targets_min": 671
},
{
"epoch": 2.423756019261637,
"grad_norm": 0.7632035756467823,
"learning_rate": 3.307519861149114e-05,
"loss": 0.2259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25074198842048645,
"step": 1510,
"valid_targets_mean": 2307.4,
"valid_targets_min": 704
},
{
"epoch": 2.431781701444623,
"grad_norm": 0.7796558920418386,
"learning_rate": 3.3014511710604526e-05,
"loss": 0.2185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2310362160205841,
"step": 1515,
"valid_targets_mean": 2021.8,
"valid_targets_min": 670
},
{
"epoch": 2.4398073836276084,
"grad_norm": 0.8050959296365663,
"learning_rate": 3.295361626026484e-05,
"loss": 0.2154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22600339353084564,
"step": 1520,
"valid_targets_mean": 1891.7,
"valid_targets_min": 589
},
{
"epoch": 2.447833065810594,
"grad_norm": 0.7172384753459945,
"learning_rate": 3.28925132362838e-05,
"loss": 0.223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21628597378730774,
"step": 1525,
"valid_targets_mean": 1877.1,
"valid_targets_min": 826
},
{
"epoch": 2.4558587479935796,
"grad_norm": 0.6974119595402761,
"learning_rate": 3.2831203617799316e-05,
"loss": 0.2363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23294216394424438,
"step": 1530,
"valid_targets_mean": 2408.9,
"valid_targets_min": 875
},
{
"epoch": 2.4638844301765648,
"grad_norm": 0.7841982652104295,
"learning_rate": 3.276968838725992e-05,
"loss": 0.2192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23504158854484558,
"step": 1535,
"valid_targets_mean": 1922.0,
"valid_targets_min": 856
},
{
"epoch": 2.4719101123595504,
"grad_norm": 0.7111349004760731,
"learning_rate": 3.2707968530408886e-05,
"loss": 0.2259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2083408683538437,
"step": 1540,
"valid_targets_mean": 2066.4,
"valid_targets_min": 714
},
{
"epoch": 2.479935794542536,
"grad_norm": 0.7365161685746568,
"learning_rate": 3.264604503626853e-05,
"loss": 0.2174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.235595241189003,
"step": 1545,
"valid_targets_mean": 2078.4,
"valid_targets_min": 776
},
{
"epoch": 2.4879614767255216,
"grad_norm": 0.7269740343287259,
"learning_rate": 3.2583918897124315e-05,
"loss": 0.2163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2562892735004425,
"step": 1550,
"valid_targets_mean": 2318.0,
"valid_targets_min": 617
},
{
"epoch": 2.495987158908507,
"grad_norm": 0.758066997386104,
"learning_rate": 3.2521591108508965e-05,
"loss": 0.2234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23280540108680725,
"step": 1555,
"valid_targets_mean": 1912.3,
"valid_targets_min": 892
},
{
"epoch": 2.504012841091493,
"grad_norm": 0.6629939180933154,
"learning_rate": 3.245906266918651e-05,
"loss": 0.2249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19812926650047302,
"step": 1560,
"valid_targets_mean": 2150.6,
"valid_targets_min": 903
},
{
"epoch": 2.5120385232744784,
"grad_norm": 0.7017031358542662,
"learning_rate": 3.2396334581136315e-05,
"loss": 0.2246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19861991703510284,
"step": 1565,
"valid_targets_mean": 1771.2,
"valid_targets_min": 797
},
{
"epoch": 2.520064205457464,
"grad_norm": 0.7456695638200225,
"learning_rate": 3.2333407849536936e-05,
"loss": 0.2306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2588405907154083,
"step": 1570,
"valid_targets_mean": 2140.0,
"valid_targets_min": 548
},
{
"epoch": 2.5280898876404496,
"grad_norm": 0.6842578186040127,
"learning_rate": 3.2270283482750106e-05,
"loss": 0.2307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23806709051132202,
"step": 1575,
"valid_targets_mean": 2214.6,
"valid_targets_min": 780
},
{
"epoch": 2.5361155698234352,
"grad_norm": 0.7163287836668685,
"learning_rate": 3.220696249230453e-05,
"loss": 0.2295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2398744523525238,
"step": 1580,
"valid_targets_mean": 2410.4,
"valid_targets_min": 1246
},
{
"epoch": 2.5441412520064204,
"grad_norm": 0.7034472910128594,
"learning_rate": 3.214344589287969e-05,
"loss": 0.2373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24632596969604492,
"step": 1585,
"valid_targets_mean": 2491.1,
"valid_targets_min": 875
},
{
"epoch": 2.552166934189406,
"grad_norm": 0.7470426673989888,
"learning_rate": 3.2079734702289555e-05,
"loss": 0.2241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23413334786891937,
"step": 1590,
"valid_targets_mean": 2035.4,
"valid_targets_min": 1093
},
{
"epoch": 2.5601926163723916,
"grad_norm": 0.6695700379125197,
"learning_rate": 3.201582994146633e-05,
"loss": 0.2195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.220213383436203,
"step": 1595,
"valid_targets_mean": 2228.4,
"valid_targets_min": 832
},
{
"epoch": 2.568218298555377,
"grad_norm": 0.6398428853902913,
"learning_rate": 3.195173263444405e-05,
"loss": 0.2253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2369084358215332,
"step": 1600,
"valid_targets_mean": 2804.1,
"valid_targets_min": 1139
},
{
"epoch": 2.576243980738363,
"grad_norm": 0.7976580250915132,
"learning_rate": 3.188744380834218e-05,
"loss": 0.2327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25882312655448914,
"step": 1605,
"valid_targets_mean": 1818.9,
"valid_targets_min": 758
},
{
"epoch": 2.5842696629213484,
"grad_norm": 0.738638803709468,
"learning_rate": 3.182296449334916e-05,
"loss": 0.2248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2369651198387146,
"step": 1610,
"valid_targets_mean": 2066.5,
"valid_targets_min": 1206
},
{
"epoch": 2.592295345104334,
"grad_norm": 0.8660756736906835,
"learning_rate": 3.1758295722705895e-05,
"loss": 0.2251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22791454195976257,
"step": 1615,
"valid_targets_mean": 1701.2,
"valid_targets_min": 787
},
{
"epoch": 2.600321027287319,
"grad_norm": 0.7304793227556174,
"learning_rate": 3.1693438532689196e-05,
"loss": 0.2252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16894668340682983,
"step": 1620,
"valid_targets_mean": 1490.4,
"valid_targets_min": 567
},
{
"epoch": 2.608346709470305,
"grad_norm": 0.7316882732876415,
"learning_rate": 3.162839396259519e-05,
"loss": 0.2194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17454849183559418,
"step": 1625,
"valid_targets_mean": 1789.1,
"valid_targets_min": 734
},
{
"epoch": 2.6163723916532904,
"grad_norm": 0.8293784310074404,
"learning_rate": 3.156316305472263e-05,
"loss": 0.2214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22549498081207275,
"step": 1630,
"valid_targets_mean": 1512.9,
"valid_targets_min": 713
},
{
"epoch": 2.624398073836276,
"grad_norm": 0.7732588913978171,
"learning_rate": 3.149774685435626e-05,
"loss": 0.2293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23763619363307953,
"step": 1635,
"valid_targets_mean": 1928.6,
"valid_targets_min": 714
},
{
"epoch": 2.6324237560192616,
"grad_norm": 0.6863872080427466,
"learning_rate": 3.143214640974996e-05,
"loss": 0.2135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19767194986343384,
"step": 1640,
"valid_targets_mean": 1965.4,
"valid_targets_min": 960
},
{
"epoch": 2.640449438202247,
"grad_norm": 0.7870511412965953,
"learning_rate": 3.136636277211005e-05,
"loss": 0.2229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23969687521457672,
"step": 1645,
"valid_targets_mean": 1663.8,
"valid_targets_min": 721
},
{
"epoch": 2.648475120385233,
"grad_norm": 0.7980891149995513,
"learning_rate": 3.13003969955784e-05,
"loss": 0.2094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19080209732055664,
"step": 1650,
"valid_targets_mean": 1481.9,
"valid_targets_min": 731
},
{
"epoch": 2.6565008025682184,
"grad_norm": 0.7955277559817313,
"learning_rate": 3.1234250137215546e-05,
"loss": 0.2225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21440812945365906,
"step": 1655,
"valid_targets_mean": 1468.8,
"valid_targets_min": 723
},
{
"epoch": 2.664526484751204,
"grad_norm": 0.7368668559606313,
"learning_rate": 3.1167923256983724e-05,
"loss": 0.2188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19377027451992035,
"step": 1660,
"valid_targets_mean": 1893.8,
"valid_targets_min": 686
},
{
"epoch": 2.6725521669341896,
"grad_norm": 0.8011351264520532,
"learning_rate": 3.110141741772994e-05,
"loss": 0.2444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2542601227760315,
"step": 1665,
"valid_targets_mean": 1760.2,
"valid_targets_min": 667
},
{
"epoch": 2.6805778491171752,
"grad_norm": 0.6620763926446247,
"learning_rate": 3.103473368516887e-05,
"loss": 0.2304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2350524365901947,
"step": 1670,
"valid_targets_mean": 2464.2,
"valid_targets_min": 788
},
{
"epoch": 2.6886035313001604,
"grad_norm": 0.7931697359506537,
"learning_rate": 3.0967873127865856e-05,
"loss": 0.2273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22060030698776245,
"step": 1675,
"valid_targets_mean": 1841.6,
"valid_targets_min": 700
},
{
"epoch": 2.696629213483146,
"grad_norm": 0.7023736927777215,
"learning_rate": 3.090083681721972e-05,
"loss": 0.2323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21952059864997864,
"step": 1680,
"valid_targets_mean": 2159.6,
"valid_targets_min": 899
},
{
"epoch": 2.7046548956661316,
"grad_norm": 0.7025168140845389,
"learning_rate": 3.083362582744564e-05,
"loss": 0.2272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2323223054409027,
"step": 1685,
"valid_targets_mean": 2033.8,
"valid_targets_min": 696
},
{
"epoch": 2.712680577849117,
"grad_norm": 0.6589820080202528,
"learning_rate": 3.0766241235557914e-05,
"loss": 0.2212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20285199582576752,
"step": 1690,
"valid_targets_mean": 2020.0,
"valid_targets_min": 703
},
{
"epoch": 2.720706260032103,
"grad_norm": 0.6509308612016727,
"learning_rate": 3.0698684121352704e-05,
"loss": 0.2244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20531073212623596,
"step": 1695,
"valid_targets_mean": 2438.1,
"valid_targets_min": 847
},
{
"epoch": 2.7287319422150884,
"grad_norm": 0.7373126457209139,
"learning_rate": 3.0630955567390714e-05,
"loss": 0.2288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22566135227680206,
"step": 1700,
"valid_targets_mean": 2027.4,
"valid_targets_min": 671
},
{
"epoch": 2.7367576243980736,
"grad_norm": 0.8219020871621718,
"learning_rate": 3.0563056658979915e-05,
"loss": 0.248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2077377736568451,
"step": 1705,
"valid_targets_mean": 1601.4,
"valid_targets_min": 522
},
{
"epoch": 2.744783306581059,
"grad_norm": 0.6685564666402026,
"learning_rate": 3.0494988484158048e-05,
"loss": 0.2166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21543152630329132,
"step": 1710,
"valid_targets_mean": 2170.0,
"valid_targets_min": 870
},
{
"epoch": 2.752808988764045,
"grad_norm": 0.8026549087712966,
"learning_rate": 3.0426752133675274e-05,
"loss": 0.2071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22285577654838562,
"step": 1715,
"valid_targets_mean": 1749.9,
"valid_targets_min": 814
},
{
"epoch": 2.7608346709470304,
"grad_norm": 0.690495095349738,
"learning_rate": 3.035834870097665e-05,
"loss": 0.2331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21550163626670837,
"step": 1720,
"valid_targets_mean": 2140.2,
"valid_targets_min": 662
},
{
"epoch": 2.768860353130016,
"grad_norm": 0.7360103068007144,
"learning_rate": 3.0289779282184627e-05,
"loss": 0.222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24632824957370758,
"step": 1725,
"valid_targets_mean": 2156.0,
"valid_targets_min": 732
},
{
"epoch": 2.7768860353130016,
"grad_norm": 0.7527366517311297,
"learning_rate": 3.0221044976081484e-05,
"loss": 0.237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2297508716583252,
"step": 1730,
"valid_targets_mean": 1963.5,
"valid_targets_min": 785
},
{
"epoch": 2.784911717495987,
"grad_norm": 0.7821248977519579,
"learning_rate": 3.0152146884091714e-05,
"loss": 0.2182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22388526797294617,
"step": 1735,
"valid_targets_mean": 2456.3,
"valid_targets_min": 1014
},
{
"epoch": 2.792937399678973,
"grad_norm": 0.7248411712033483,
"learning_rate": 3.0083086110264372e-05,
"loss": 0.2188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20279636979103088,
"step": 1740,
"valid_targets_mean": 1725.7,
"valid_targets_min": 822
},
{
"epoch": 2.8009630818619584,
"grad_norm": 0.7719057875204387,
"learning_rate": 3.0013863761255394e-05,
"loss": 0.226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22379055619239807,
"step": 1745,
"valid_targets_mean": 1751.1,
"valid_targets_min": 595
},
{
"epoch": 2.808988764044944,
"grad_norm": 0.7078438529016131,
"learning_rate": 2.9944480946309857e-05,
"loss": 0.2099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2104533314704895,
"step": 1750,
"valid_targets_mean": 2152.8,
"valid_targets_min": 677
},
{
"epoch": 2.8170144462279296,
"grad_norm": 0.7421779901837455,
"learning_rate": 2.9874938777244203e-05,
"loss": 0.2209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2339702844619751,
"step": 1755,
"valid_targets_mean": 2193.9,
"valid_targets_min": 1060
},
{
"epoch": 2.825040128410915,
"grad_norm": 0.6791983094516799,
"learning_rate": 2.9805238368428417e-05,
"loss": 0.2323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23603284358978271,
"step": 1760,
"valid_targets_mean": 2690.4,
"valid_targets_min": 789
},
{
"epoch": 2.8330658105939004,
"grad_norm": 0.7641709144274127,
"learning_rate": 2.9735380836768194e-05,
"loss": 0.2216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2092696875333786,
"step": 1765,
"valid_targets_mean": 1717.9,
"valid_targets_min": 770
},
{
"epoch": 2.841091492776886,
"grad_norm": 0.6388373211209032,
"learning_rate": 2.966536730168702e-05,
"loss": 0.2211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23387748003005981,
"step": 1770,
"valid_targets_mean": 2613.9,
"valid_targets_min": 700
},
{
"epoch": 2.8491171749598716,
"grad_norm": 0.7037310466747174,
"learning_rate": 2.9595198885108222e-05,
"loss": 0.2351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24809247255325317,
"step": 1775,
"valid_targets_mean": 2320.5,
"valid_targets_min": 765
},
{
"epoch": 2.857142857142857,
"grad_norm": 0.7618055649190782,
"learning_rate": 2.9524876711437027e-05,
"loss": 0.2283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23056885600090027,
"step": 1780,
"valid_targets_mean": 2268.4,
"valid_targets_min": 780
},
{
"epoch": 2.865168539325843,
"grad_norm": 0.7549506776491252,
"learning_rate": 2.945440190754252e-05,
"loss": 0.2393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2515849471092224,
"step": 1785,
"valid_targets_mean": 2207.3,
"valid_targets_min": 837
},
{
"epoch": 2.8731942215088284,
"grad_norm": 0.7470019603913977,
"learning_rate": 2.9383775602739585e-05,
"loss": 0.2308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23992541432380676,
"step": 1790,
"valid_targets_mean": 2084.7,
"valid_targets_min": 777
},
{
"epoch": 2.8812199036918136,
"grad_norm": 0.7337045498667797,
"learning_rate": 2.931299892877081e-05,
"loss": 0.2292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2097863256931305,
"step": 1795,
"valid_targets_mean": 1751.9,
"valid_targets_min": 760
},
{
"epoch": 2.889245585874799,
"grad_norm": 0.7475735728231748,
"learning_rate": 2.924207301978837e-05,
"loss": 0.2208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22301986813545227,
"step": 1800,
"valid_targets_mean": 1816.0,
"valid_targets_min": 711
},
{
"epoch": 2.897271268057785,
"grad_norm": 0.8609335895996135,
"learning_rate": 2.917099901233582e-05,
"loss": 0.2255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24170774221420288,
"step": 1805,
"valid_targets_mean": 1630.4,
"valid_targets_min": 814
},
{
"epoch": 2.9052969502407704,
"grad_norm": 0.8836714454451741,
"learning_rate": 2.9099778045329915e-05,
"loss": 0.2112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2119920253753662,
"step": 1810,
"valid_targets_mean": 1986.5,
"valid_targets_min": 738
},
{
"epoch": 2.913322632423756,
"grad_norm": 1.3175708087375508,
"learning_rate": 2.902841126004234e-05,
"loss": 0.2321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26432716846466064,
"step": 1815,
"valid_targets_mean": 2028.9,
"valid_targets_min": 874
},
{
"epoch": 2.9213483146067416,
"grad_norm": 0.7616325494153396,
"learning_rate": 2.8956899800081434e-05,
"loss": 0.2161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22558796405792236,
"step": 1820,
"valid_targets_mean": 1613.9,
"valid_targets_min": 548
},
{
"epoch": 2.929373996789727,
"grad_norm": 0.7367382610423877,
"learning_rate": 2.888524481137384e-05,
"loss": 0.2248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23133790493011475,
"step": 1825,
"valid_targets_mean": 2021.1,
"valid_targets_min": 777
},
{
"epoch": 2.937399678972713,
"grad_norm": 0.6844977955140614,
"learning_rate": 2.8813447442146177e-05,
"loss": 0.2362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21383780241012573,
"step": 1830,
"valid_targets_mean": 1867.3,
"valid_targets_min": 504
},
{
"epoch": 2.9454253611556984,
"grad_norm": 0.7558744597489246,
"learning_rate": 2.8741508842906617e-05,
"loss": 0.2277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21160289645195007,
"step": 1835,
"valid_targets_mean": 1775.3,
"valid_targets_min": 729
},
{
"epoch": 2.953451043338684,
"grad_norm": 0.7825251274320609,
"learning_rate": 2.8669430166426452e-05,
"loss": 0.2079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22142228484153748,
"step": 1840,
"valid_targets_mean": 1709.3,
"valid_targets_min": 684
},
{
"epoch": 2.961476725521669,
"grad_norm": 0.8621972624844769,
"learning_rate": 2.8597212567721638e-05,
"loss": 0.2277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20812058448791504,
"step": 1845,
"valid_targets_mean": 1360.6,
"valid_targets_min": 743
},
{
"epoch": 2.969502407704655,
"grad_norm": 0.716293562577063,
"learning_rate": 2.8524857204034256e-05,
"loss": 0.2182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24998609721660614,
"step": 1850,
"valid_targets_mean": 1911.3,
"valid_targets_min": 885
},
{
"epoch": 2.9775280898876404,
"grad_norm": 0.6539894083962282,
"learning_rate": 2.8452365234813992e-05,
"loss": 0.2269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24071596562862396,
"step": 1855,
"valid_targets_mean": 2464.8,
"valid_targets_min": 734
},
{
"epoch": 2.985553772070626,
"grad_norm": 0.7537202116782218,
"learning_rate": 2.8379737821699557e-05,
"loss": 0.2218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2464880496263504,
"step": 1860,
"valid_targets_mean": 2069.2,
"valid_targets_min": 714
},
{
"epoch": 2.9935794542536116,
"grad_norm": 0.7507065541075459,
"learning_rate": 2.8306976128500054e-05,
"loss": 0.2269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2356579601764679,
"step": 1865,
"valid_targets_mean": 2693.5,
"valid_targets_min": 725
},
{
"epoch": 3.001605136436597,
"grad_norm": 0.6923513946863307,
"learning_rate": 2.823408132117635e-05,
"loss": 0.2151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20384138822555542,
"step": 1870,
"valid_targets_mean": 2270.1,
"valid_targets_min": 695
},
{
"epoch": 3.009630818619583,
"grad_norm": 0.7149443578899167,
"learning_rate": 2.8161054567822375e-05,
"loss": 0.1878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18554896116256714,
"step": 1875,
"valid_targets_mean": 2369.7,
"valid_targets_min": 806
},
{
"epoch": 3.0176565008025684,
"grad_norm": 0.7734688939301865,
"learning_rate": 2.8087897038646428e-05,
"loss": 0.1891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19679996371269226,
"step": 1880,
"valid_targets_mean": 2192.3,
"valid_targets_min": 743
},
{
"epoch": 3.0256821829855536,
"grad_norm": 0.7653501614317052,
"learning_rate": 2.801460990595239e-05,
"loss": 0.2005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20114630460739136,
"step": 1885,
"valid_targets_mean": 1874.9,
"valid_targets_min": 765
},
{
"epoch": 3.033707865168539,
"grad_norm": 0.830666272441702,
"learning_rate": 2.7941194344120965e-05,
"loss": 0.1876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1925143003463745,
"step": 1890,
"valid_targets_mean": 1578.1,
"valid_targets_min": 727
},
{
"epoch": 3.041733547351525,
"grad_norm": 1.2399862833715765,
"learning_rate": 2.7867651529590864e-05,
"loss": 0.1867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17397508025169373,
"step": 1895,
"valid_targets_mean": 1400.1,
"valid_targets_min": 693
},
{
"epoch": 3.0497592295345104,
"grad_norm": 0.8087269986100477,
"learning_rate": 2.7793982640839933e-05,
"loss": 0.1783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1715751439332962,
"step": 1900,
"valid_targets_mean": 1782.9,
"valid_targets_min": 689
},
{
"epoch": 3.057784911717496,
"grad_norm": 0.6281749949063277,
"learning_rate": 2.7720188858366275e-05,
"loss": 0.195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18476352095603943,
"step": 1905,
"valid_targets_mean": 2993.0,
"valid_targets_min": 740
},
{
"epoch": 3.0658105939004816,
"grad_norm": 0.635189484478004,
"learning_rate": 2.7646271364669338e-05,
"loss": 0.1818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15959222614765167,
"step": 1910,
"valid_targets_mean": 2513.0,
"valid_targets_min": 650
},
{
"epoch": 3.073836276083467,
"grad_norm": 0.7011950467502195,
"learning_rate": 2.7572231344230983e-05,
"loss": 0.1967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1984846293926239,
"step": 1915,
"valid_targets_mean": 2431.4,
"valid_targets_min": 722
},
{
"epoch": 3.081861958266453,
"grad_norm": 0.8410097906484902,
"learning_rate": 2.7498069983496466e-05,
"loss": 0.1957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20174948871135712,
"step": 1920,
"valid_targets_mean": 1798.1,
"valid_targets_min": 694
},
{
"epoch": 3.0898876404494384,
"grad_norm": 0.7073569345794174,
"learning_rate": 2.7423788470855455e-05,
"loss": 0.2015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19382837414741516,
"step": 1925,
"valid_targets_mean": 2452.8,
"valid_targets_min": 843
},
{
"epoch": 3.0979133226324236,
"grad_norm": 0.8179807578648297,
"learning_rate": 2.734938799662297e-05,
"loss": 0.1936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16232554614543915,
"step": 1930,
"valid_targets_mean": 1700.2,
"valid_targets_min": 827
},
{
"epoch": 3.105939004815409,
"grad_norm": 0.7858838266351695,
"learning_rate": 2.727486975302032e-05,
"loss": 0.1876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19014039635658264,
"step": 1935,
"valid_targets_mean": 1804.1,
"valid_targets_min": 730
},
{
"epoch": 3.113964686998395,
"grad_norm": 0.7209047591018296,
"learning_rate": 2.7200234934156012e-05,
"loss": 0.1953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17354069650173187,
"step": 1940,
"valid_targets_mean": 1919.5,
"valid_targets_min": 756
},
{
"epoch": 3.1219903691813804,
"grad_norm": 0.8428897718911152,
"learning_rate": 2.712548473600657e-05,
"loss": 0.1995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19806596636772156,
"step": 1945,
"valid_targets_mean": 1813.6,
"valid_targets_min": 632
},
{
"epoch": 3.130016051364366,
"grad_norm": 0.809920682857247,
"learning_rate": 2.7050620356397413e-05,
"loss": 0.1916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18115901947021484,
"step": 1950,
"valid_targets_mean": 1606.6,
"valid_targets_min": 819
},
{
"epoch": 3.1380417335473516,
"grad_norm": 0.893305519656849,
"learning_rate": 2.6975642994983658e-05,
"loss": 0.1908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1924627125263214,
"step": 1955,
"valid_targets_mean": 1423.1,
"valid_targets_min": 554
},
{
"epoch": 3.146067415730337,
"grad_norm": 0.751617349429226,
"learning_rate": 2.6900553853230856e-05,
"loss": 0.194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19373275339603424,
"step": 1960,
"valid_targets_mean": 2145.9,
"valid_targets_min": 912
},
{
"epoch": 3.154093097913323,
"grad_norm": 0.8000049867410969,
"learning_rate": 2.6825354134395804e-05,
"loss": 0.195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18756906688213348,
"step": 1965,
"valid_targets_mean": 1920.1,
"valid_targets_min": 734
},
{
"epoch": 3.162118780096308,
"grad_norm": 0.7061336594749047,
"learning_rate": 2.6750045043507196e-05,
"loss": 0.1794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18700531125068665,
"step": 1970,
"valid_targets_mean": 1959.3,
"valid_targets_min": 869
},
{
"epoch": 3.1701444622792936,
"grad_norm": 0.6065987384881834,
"learning_rate": 2.667462778734637e-05,
"loss": 0.1818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15520010888576508,
"step": 1975,
"valid_targets_mean": 2880.4,
"valid_targets_min": 623
},
{
"epoch": 3.178170144462279,
"grad_norm": 0.7999447629388277,
"learning_rate": 2.6599103574427928e-05,
"loss": 0.1758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1867016702890396,
"step": 1980,
"valid_targets_mean": 1824.9,
"valid_targets_min": 777
},
{
"epoch": 3.186195826645265,
"grad_norm": 0.797199335886302,
"learning_rate": 2.6523473614980395e-05,
"loss": 0.1982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20053572952747345,
"step": 1985,
"valid_targets_mean": 1946.2,
"valid_targets_min": 725
},
{
"epoch": 3.1942215088282504,
"grad_norm": 0.7659734706627166,
"learning_rate": 2.6447739120926815e-05,
"loss": 0.1745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17469337582588196,
"step": 1990,
"valid_targets_mean": 1612.2,
"valid_targets_min": 684
},
{
"epoch": 3.202247191011236,
"grad_norm": 0.7701645192834687,
"learning_rate": 2.6371901305865346e-05,
"loss": 0.1939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21454013884067535,
"step": 1995,
"valid_targets_mean": 2100.4,
"valid_targets_min": 835
},
{
"epoch": 3.2102728731942216,
"grad_norm": 0.8125509864840708,
"learning_rate": 2.629596138504978e-05,
"loss": 0.2023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19029833376407623,
"step": 2000,
"valid_targets_mean": 1778.3,
"valid_targets_min": 648
},
{
"epoch": 3.218298555377207,
"grad_norm": 0.7175888565554096,
"learning_rate": 2.6219920575370115e-05,
"loss": 0.1862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18968114256858826,
"step": 2005,
"valid_targets_mean": 2400.2,
"valid_targets_min": 1284
},
{
"epoch": 3.226324237560193,
"grad_norm": 0.774431761352013,
"learning_rate": 2.6143780095332996e-05,
"loss": 0.1995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22374089062213898,
"step": 2010,
"valid_targets_mean": 2418.2,
"valid_targets_min": 745
},
{
"epoch": 3.234349919743178,
"grad_norm": 0.7366934183831256,
"learning_rate": 2.6067541165042262e-05,
"loss": 0.1891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1646566092967987,
"step": 2015,
"valid_targets_mean": 1817.9,
"valid_targets_min": 880
},
{
"epoch": 3.2423756019261636,
"grad_norm": 0.9085528020394846,
"learning_rate": 2.5991205006179332e-05,
"loss": 0.1866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2022278755903244,
"step": 2020,
"valid_targets_mean": 1888.2,
"valid_targets_min": 638
},
{
"epoch": 3.250401284109149,
"grad_norm": 0.8496667981008769,
"learning_rate": 2.5914772841983653e-05,
"loss": 0.1974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20533272624015808,
"step": 2025,
"valid_targets_mean": 1874.3,
"valid_targets_min": 790
},
{
"epoch": 3.258426966292135,
"grad_norm": 0.7969748922112211,
"learning_rate": 2.5838245897233113e-05,
"loss": 0.1993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1906946450471878,
"step": 2030,
"valid_targets_mean": 1718.5,
"valid_targets_min": 549
},
{
"epoch": 3.2664526484751204,
"grad_norm": 0.6925975178805427,
"learning_rate": 2.5761625398224387e-05,
"loss": 0.1947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18433983623981476,
"step": 2035,
"valid_targets_mean": 2462.9,
"valid_targets_min": 686
},
{
"epoch": 3.274478330658106,
"grad_norm": 0.7245709850282777,
"learning_rate": 2.56849125727533e-05,
"loss": 0.1907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16477423906326294,
"step": 2040,
"valid_targets_mean": 2091.6,
"valid_targets_min": 744
},
{
"epoch": 3.2825040128410916,
"grad_norm": 0.7771087868403446,
"learning_rate": 2.560810865009515e-05,
"loss": 0.1835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.193090558052063,
"step": 2045,
"valid_targets_mean": 1966.6,
"valid_targets_min": 631
},
{
"epoch": 3.290529695024077,
"grad_norm": 0.7254301119297374,
"learning_rate": 2.5531214860985015e-05,
"loss": 0.1944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1945345103740692,
"step": 2050,
"valid_targets_mean": 2402.4,
"valid_targets_min": 889
},
{
"epoch": 3.2985553772070624,
"grad_norm": 0.8027092204852169,
"learning_rate": 2.5454232437598032e-05,
"loss": 0.1959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20133385062217712,
"step": 2055,
"valid_targets_mean": 1915.6,
"valid_targets_min": 739
},
{
"epoch": 3.306581059390048,
"grad_norm": 0.7363037186006427,
"learning_rate": 2.537716261352963e-05,
"loss": 0.1923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2043621689081192,
"step": 2060,
"valid_targets_mean": 2254.2,
"valid_targets_min": 762
},
{
"epoch": 3.3146067415730336,
"grad_norm": 0.7744385014125538,
"learning_rate": 2.53000066237758e-05,
"loss": 0.1982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1948285698890686,
"step": 2065,
"valid_targets_mean": 1942.2,
"valid_targets_min": 607
},
{
"epoch": 3.322632423756019,
"grad_norm": 0.7687870461284612,
"learning_rate": 2.5222765704713265e-05,
"loss": 0.1833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18752048909664154,
"step": 2070,
"valid_targets_mean": 1865.8,
"valid_targets_min": 985
},
{
"epoch": 3.330658105939005,
"grad_norm": 0.7263395997338279,
"learning_rate": 2.5145441094079702e-05,
"loss": 0.1907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19827114045619965,
"step": 2075,
"valid_targets_mean": 2504.3,
"valid_targets_min": 920
},
{
"epoch": 3.3386837881219904,
"grad_norm": 0.7381187748986383,
"learning_rate": 2.5068034030953888e-05,
"loss": 0.1885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17457011342048645,
"step": 2080,
"valid_targets_mean": 2321.3,
"valid_targets_min": 867
},
{
"epoch": 3.346709470304976,
"grad_norm": 0.7334484973637228,
"learning_rate": 2.499054575573585e-05,
"loss": 0.1921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16836518049240112,
"step": 2085,
"valid_targets_mean": 2020.1,
"valid_targets_min": 662
},
{
"epoch": 3.3547351524879616,
"grad_norm": 0.8336487761249294,
"learning_rate": 2.491297751012699e-05,
"loss": 0.1967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18217214941978455,
"step": 2090,
"valid_targets_mean": 1471.1,
"valid_targets_min": 713
},
{
"epoch": 3.362760834670947,
"grad_norm": 0.7231447723601349,
"learning_rate": 2.483533053711018e-05,
"loss": 0.181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19125714898109436,
"step": 2095,
"valid_targets_mean": 2079.2,
"valid_targets_min": 818
},
{
"epoch": 3.370786516853933,
"grad_norm": 0.7871767792479442,
"learning_rate": 2.4757606080929856e-05,
"loss": 0.1897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19560378789901733,
"step": 2100,
"valid_targets_mean": 1715.2,
"valid_targets_min": 722
},
{
"epoch": 3.378812199036918,
"grad_norm": 0.7353603707138118,
"learning_rate": 2.467980538707207e-05,
"loss": 0.193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1874968260526657,
"step": 2105,
"valid_targets_mean": 2198.7,
"valid_targets_min": 995
},
{
"epoch": 3.3868378812199036,
"grad_norm": 0.8102308981966291,
"learning_rate": 2.460192970224454e-05,
"loss": 0.2001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2087075412273407,
"step": 2110,
"valid_targets_mean": 1647.7,
"valid_targets_min": 659
},
{
"epoch": 3.394863563402889,
"grad_norm": 0.7431520066152951,
"learning_rate": 2.4523980274356665e-05,
"loss": 0.1914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21111366152763367,
"step": 2115,
"valid_targets_mean": 2318.9,
"valid_targets_min": 467
},
{
"epoch": 3.402889245585875,
"grad_norm": 0.6583964122894566,
"learning_rate": 2.444595835249952e-05,
"loss": 0.1853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17443379759788513,
"step": 2120,
"valid_targets_mean": 2557.6,
"valid_targets_min": 923
},
{
"epoch": 3.4109149277688604,
"grad_norm": 0.9040657902276791,
"learning_rate": 2.436786518692587e-05,
"loss": 0.1958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18719065189361572,
"step": 2125,
"valid_targets_mean": 2413.8,
"valid_targets_min": 734
},
{
"epoch": 3.418940609951846,
"grad_norm": 0.730483546474811,
"learning_rate": 2.428970202903011e-05,
"loss": 0.1963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19034501910209656,
"step": 2130,
"valid_targets_mean": 2162.1,
"valid_targets_min": 825
},
{
"epoch": 3.4269662921348316,
"grad_norm": 0.8290450345988953,
"learning_rate": 2.4211470131328208e-05,
"loss": 0.1932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20703352987766266,
"step": 2135,
"valid_targets_mean": 1847.6,
"valid_targets_min": 725
},
{
"epoch": 3.4349919743178168,
"grad_norm": 0.6912484043662559,
"learning_rate": 2.4133170747437657e-05,
"loss": 0.1943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2027449905872345,
"step": 2140,
"valid_targets_mean": 2536.1,
"valid_targets_min": 612
},
{
"epoch": 3.4430176565008024,
"grad_norm": 0.748348272526716,
"learning_rate": 2.4054805132057362e-05,
"loss": 0.1935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1785166710615158,
"step": 2145,
"valid_targets_mean": 1872.3,
"valid_targets_min": 750
},
{
"epoch": 3.451043338683788,
"grad_norm": 0.8392457980303076,
"learning_rate": 2.397637454094756e-05,
"loss": 0.1857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19250713288784027,
"step": 2150,
"valid_targets_mean": 1665.8,
"valid_targets_min": 692
},
{
"epoch": 3.4590690208667736,
"grad_norm": 0.7956502741744578,
"learning_rate": 2.3897880230909678e-05,
"loss": 0.1936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1779821813106537,
"step": 2155,
"valid_targets_mean": 1863.2,
"valid_targets_min": 639
},
{
"epoch": 3.467094703049759,
"grad_norm": 0.6735272716108055,
"learning_rate": 2.3819323459766194e-05,
"loss": 0.1911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18678349256515503,
"step": 2160,
"valid_targets_mean": 2579.4,
"valid_targets_min": 1288
},
{
"epoch": 3.475120385232745,
"grad_norm": 0.781264193277655,
"learning_rate": 2.3740705486340492e-05,
"loss": 0.178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16642053425312042,
"step": 2165,
"valid_targets_mean": 2064.8,
"valid_targets_min": 692
},
{
"epoch": 3.4831460674157304,
"grad_norm": 0.8509728426922071,
"learning_rate": 2.366202757043668e-05,
"loss": 0.1814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1804889738559723,
"step": 2170,
"valid_targets_mean": 1531.1,
"valid_targets_min": 820
},
{
"epoch": 3.491171749598716,
"grad_norm": 0.7681030716681042,
"learning_rate": 2.358329097281942e-05,
"loss": 0.2023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21239528059959412,
"step": 2175,
"valid_targets_mean": 2224.4,
"valid_targets_min": 734
},
{
"epoch": 3.4991974317817016,
"grad_norm": 0.6875253594702069,
"learning_rate": 2.3504496955193695e-05,
"loss": 0.188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17239797115325928,
"step": 2180,
"valid_targets_mean": 1882.8,
"valid_targets_min": 933
},
{
"epoch": 3.5072231139646872,
"grad_norm": 0.7423496773042868,
"learning_rate": 2.342564678018462e-05,
"loss": 0.2018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19619911909103394,
"step": 2185,
"valid_targets_mean": 2109.4,
"valid_targets_min": 793
},
{
"epoch": 3.515248796147673,
"grad_norm": 0.6599800958836226,
"learning_rate": 2.3346741711317185e-05,
"loss": 0.1857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1889185905456543,
"step": 2190,
"valid_targets_mean": 2660.3,
"valid_targets_min": 888
},
{
"epoch": 3.523274478330658,
"grad_norm": 0.8332035412792131,
"learning_rate": 2.326778301299603e-05,
"loss": 0.1922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1888495832681656,
"step": 2195,
"valid_targets_mean": 1617.4,
"valid_targets_min": 682
},
{
"epoch": 3.5313001605136436,
"grad_norm": 0.7422726313573247,
"learning_rate": 2.3188771950485172e-05,
"loss": 0.1885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16541287302970886,
"step": 2200,
"valid_targets_mean": 1771.2,
"valid_targets_min": 723
},
{
"epoch": 3.539325842696629,
"grad_norm": 0.7751086907387414,
"learning_rate": 2.3109709789887732e-05,
"loss": 0.2092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2171766757965088,
"step": 2205,
"valid_targets_mean": 2355.4,
"valid_targets_min": 790
},
{
"epoch": 3.547351524879615,
"grad_norm": 0.7959173282766169,
"learning_rate": 2.3030597798125642e-05,
"loss": 0.1955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20218120515346527,
"step": 2210,
"valid_targets_mean": 1999.3,
"valid_targets_min": 567
},
{
"epoch": 3.5553772070626004,
"grad_norm": 0.7123208491374362,
"learning_rate": 2.295143724291935e-05,
"loss": 0.1871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18248684704303741,
"step": 2215,
"valid_targets_mean": 1983.6,
"valid_targets_min": 861
},
{
"epoch": 3.563402889245586,
"grad_norm": 0.7239156258883958,
"learning_rate": 2.2872229392767497e-05,
"loss": 0.1977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18239015340805054,
"step": 2220,
"valid_targets_mean": 2137.5,
"valid_targets_min": 845
},
{
"epoch": 3.571428571428571,
"grad_norm": 0.8073709827317045,
"learning_rate": 2.2792975516926615e-05,
"loss": 0.1908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20157527923583984,
"step": 2225,
"valid_targets_mean": 2178.2,
"valid_targets_min": 947
},
{
"epoch": 3.579454253611557,
"grad_norm": 0.9561614899504988,
"learning_rate": 2.271367688539075e-05,
"loss": 0.1909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18683037161827087,
"step": 2230,
"valid_targets_mean": 2166.1,
"valid_targets_min": 720
},
{
"epoch": 3.5874799357945424,
"grad_norm": 0.7468302593032567,
"learning_rate": 2.2634334768871133e-05,
"loss": 0.188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1675512194633484,
"step": 2235,
"valid_targets_mean": 1832.1,
"valid_targets_min": 666
},
{
"epoch": 3.595505617977528,
"grad_norm": 0.7591043916830319,
"learning_rate": 2.2554950438775813e-05,
"loss": 0.1904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19787640869617462,
"step": 2240,
"valid_targets_mean": 2119.7,
"valid_targets_min": 646
},
{
"epoch": 3.6035313001605136,
"grad_norm": 0.7812103358035377,
"learning_rate": 2.2475525167189298e-05,
"loss": 0.1916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18840080499649048,
"step": 2245,
"valid_targets_mean": 1717.6,
"valid_targets_min": 797
},
{
"epoch": 3.611556982343499,
"grad_norm": 0.8048037305797138,
"learning_rate": 2.2396060226852148e-05,
"loss": 0.1911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17736947536468506,
"step": 2250,
"valid_targets_mean": 1519.2,
"valid_targets_min": 713
},
{
"epoch": 3.619582664526485,
"grad_norm": 0.7382055576071299,
"learning_rate": 2.2316556891140594e-05,
"loss": 0.1989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18542557954788208,
"step": 2255,
"valid_targets_mean": 1981.1,
"valid_targets_min": 658
},
{
"epoch": 3.6276083467094704,
"grad_norm": 0.8117240899793563,
"learning_rate": 2.2237016434046124e-05,
"loss": 0.1885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.199208065867424,
"step": 2260,
"valid_targets_mean": 2017.4,
"valid_targets_min": 694
},
{
"epoch": 3.635634028892456,
"grad_norm": 0.7814089947481103,
"learning_rate": 2.2157440130155084e-05,
"loss": 0.1778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2004736363887787,
"step": 2265,
"valid_targets_mean": 2167.4,
"valid_targets_min": 648
},
{
"epoch": 3.6436597110754416,
"grad_norm": 0.8313337224306722,
"learning_rate": 2.2077829254628224e-05,
"loss": 0.205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19507341086864471,
"step": 2270,
"valid_targets_mean": 1738.1,
"valid_targets_min": 776
},
{
"epoch": 3.6516853932584272,
"grad_norm": 0.736982749910831,
"learning_rate": 2.1998185083180297e-05,
"loss": 0.197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17966896295547485,
"step": 2275,
"valid_targets_mean": 1906.8,
"valid_targets_min": 676
},
{
"epoch": 3.6597110754414124,
"grad_norm": 0.7529274800924642,
"learning_rate": 2.1918508892059608e-05,
"loss": 0.1751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1658572107553482,
"step": 2280,
"valid_targets_mean": 1714.2,
"valid_targets_min": 667
},
{
"epoch": 3.667736757624398,
"grad_norm": 0.8232143722363245,
"learning_rate": 2.1838801958027533e-05,
"loss": 0.1974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21375055611133575,
"step": 2285,
"valid_targets_mean": 1926.2,
"valid_targets_min": 723
},
{
"epoch": 3.6757624398073836,
"grad_norm": 0.7437594523483552,
"learning_rate": 2.175906555833811e-05,
"loss": 0.1793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14584185183048248,
"step": 2290,
"valid_targets_mean": 1485.8,
"valid_targets_min": 660
},
{
"epoch": 3.683788121990369,
"grad_norm": 0.8253400566984553,
"learning_rate": 2.1679300970717526e-05,
"loss": 0.1862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.198220357298851,
"step": 2295,
"valid_targets_mean": 1756.6,
"valid_targets_min": 687
},
{
"epoch": 3.691813804173355,
"grad_norm": 0.7631981257736214,
"learning_rate": 2.1599509473343688e-05,
"loss": 0.1899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1921335756778717,
"step": 2300,
"valid_targets_mean": 1836.2,
"valid_targets_min": 809
},
{
"epoch": 3.6998394863563404,
"grad_norm": 0.8125231968272838,
"learning_rate": 2.1519692344825684e-05,
"loss": 0.1975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19826048612594604,
"step": 2305,
"valid_targets_mean": 2303.0,
"valid_targets_min": 810
},
{
"epoch": 3.7078651685393256,
"grad_norm": 0.796754649081973,
"learning_rate": 2.1439850864183343e-05,
"loss": 0.1828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18836288154125214,
"step": 2310,
"valid_targets_mean": 1845.9,
"valid_targets_min": 682
},
{
"epoch": 3.715890850722311,
"grad_norm": 0.7011535417327573,
"learning_rate": 2.1359986310826723e-05,
"loss": 0.1818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15693524479866028,
"step": 2315,
"valid_targets_mean": 1808.2,
"valid_targets_min": 692
},
{
"epoch": 3.723916532905297,
"grad_norm": 0.6745982102974377,
"learning_rate": 2.1280099964535594e-05,
"loss": 0.2062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20702672004699707,
"step": 2320,
"valid_targets_mean": 2588.8,
"valid_targets_min": 594
},
{
"epoch": 3.7319422150882824,
"grad_norm": 0.7036120650208736,
"learning_rate": 2.120019310543896e-05,
"loss": 0.1977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2342701256275177,
"step": 2325,
"valid_targets_mean": 2742.9,
"valid_targets_min": 718
},
{
"epoch": 3.739967897271268,
"grad_norm": 0.6978119100165123,
"learning_rate": 2.1120267013994527e-05,
"loss": 0.1859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19557003676891327,
"step": 2330,
"valid_targets_mean": 2265.5,
"valid_targets_min": 839
},
{
"epoch": 3.7479935794542536,
"grad_norm": 1.1106527175621144,
"learning_rate": 2.104032297096817e-05,
"loss": 0.1919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19205822050571442,
"step": 2335,
"valid_targets_mean": 2021.2,
"valid_targets_min": 819
},
{
"epoch": 3.756019261637239,
"grad_norm": 0.6649212142267416,
"learning_rate": 2.096036225741346e-05,
"loss": 0.1927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1821729838848114,
"step": 2340,
"valid_targets_mean": 2483.3,
"valid_targets_min": 754
},
{
"epoch": 3.764044943820225,
"grad_norm": 0.8682584189157655,
"learning_rate": 2.088038615465107e-05,
"loss": 0.1993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2323881983757019,
"step": 2345,
"valid_targets_mean": 2172.1,
"valid_targets_min": 914
},
{
"epoch": 3.7720706260032104,
"grad_norm": 0.7059973626007631,
"learning_rate": 2.080039594424829e-05,
"loss": 0.194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19035211205482483,
"step": 2350,
"valid_targets_mean": 2238.2,
"valid_targets_min": 647
},
{
"epoch": 3.780096308186196,
"grad_norm": 0.7025817999562849,
"learning_rate": 2.0720392907998473e-05,
"loss": 0.1838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16978096961975098,
"step": 2355,
"valid_targets_mean": 1907.9,
"valid_targets_min": 830
},
{
"epoch": 3.7881219903691816,
"grad_norm": 0.7720895482426217,
"learning_rate": 2.0640378327900507e-05,
"loss": 0.1831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18614491820335388,
"step": 2360,
"valid_targets_mean": 1797.3,
"valid_targets_min": 620
},
{
"epoch": 3.796147672552167,
"grad_norm": 0.7448908723180842,
"learning_rate": 2.0560353486138255e-05,
"loss": 0.1864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1888936161994934,
"step": 2365,
"valid_targets_mean": 2135.0,
"valid_targets_min": 651
},
{
"epoch": 3.8041733547351524,
"grad_norm": 0.7293585089215756,
"learning_rate": 2.0480319665060014e-05,
"loss": 0.1881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17815639078617096,
"step": 2370,
"valid_targets_mean": 1993.8,
"valid_targets_min": 916
},
{
"epoch": 3.812199036918138,
"grad_norm": 0.8436319534001945,
"learning_rate": 2.0400278147157973e-05,
"loss": 0.1924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19632424414157867,
"step": 2375,
"valid_targets_mean": 1567.9,
"valid_targets_min": 700
},
{
"epoch": 3.8202247191011236,
"grad_norm": 0.762177401689057,
"learning_rate": 2.0320230215047667e-05,
"loss": 0.1783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17414651811122894,
"step": 2380,
"valid_targets_mean": 1993.4,
"valid_targets_min": 805
},
{
"epoch": 3.828250401284109,
"grad_norm": 0.7862690373739996,
"learning_rate": 2.0240177151447397e-05,
"loss": 0.1902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1997125893831253,
"step": 2385,
"valid_targets_mean": 1752.0,
"valid_targets_min": 824
},
{
"epoch": 3.836276083467095,
"grad_norm": 0.7671200606374088,
"learning_rate": 2.0160120239157705e-05,
"loss": 0.1862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19353365898132324,
"step": 2390,
"valid_targets_mean": 1993.4,
"valid_targets_min": 926
},
{
"epoch": 3.8443017656500804,
"grad_norm": 0.7497960536151272,
"learning_rate": 2.0080060761040795e-05,
"loss": 0.1923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18841297924518585,
"step": 2395,
"valid_targets_mean": 2027.2,
"valid_targets_min": 805
},
{
"epoch": 3.8523274478330656,
"grad_norm": 0.6984086156626323,
"learning_rate": 2e-05,
"loss": 0.1921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17640450596809387,
"step": 2400,
"valid_targets_mean": 2163.6,
"valid_targets_min": 731
},
{
"epoch": 3.860353130016051,
"grad_norm": 0.6985420493366072,
"learning_rate": 1.991993923895921e-05,
"loss": 0.1912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1724482774734497,
"step": 2405,
"valid_targets_mean": 2245.6,
"valid_targets_min": 689
},
{
"epoch": 3.868378812199037,
"grad_norm": 0.7664827628096461,
"learning_rate": 1.9839879760842302e-05,
"loss": 0.1933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17965087294578552,
"step": 2410,
"valid_targets_mean": 1988.3,
"valid_targets_min": 669
},
{
"epoch": 3.8764044943820224,
"grad_norm": 0.8574637628450187,
"learning_rate": 1.975982284855261e-05,
"loss": 0.1853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17706872522830963,
"step": 2415,
"valid_targets_mean": 1429.2,
"valid_targets_min": 826
},
{
"epoch": 3.884430176565008,
"grad_norm": 0.8159684403134524,
"learning_rate": 1.967976978495234e-05,
"loss": 0.193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2066316157579422,
"step": 2420,
"valid_targets_mean": 1944.9,
"valid_targets_min": 578
},
{
"epoch": 3.8924558587479936,
"grad_norm": 0.7653474014396054,
"learning_rate": 1.959972185284203e-05,
"loss": 0.1873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20480495691299438,
"step": 2425,
"valid_targets_mean": 2137.4,
"valid_targets_min": 711
},
{
"epoch": 3.900481540930979,
"grad_norm": 0.7119154640913655,
"learning_rate": 1.951968033493999e-05,
"loss": 0.1916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22431352734565735,
"step": 2430,
"valid_targets_mean": 2569.9,
"valid_targets_min": 922
},
{
"epoch": 3.908507223113965,
"grad_norm": 0.6933243254616628,
"learning_rate": 1.9439646513861748e-05,
"loss": 0.189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1814383864402771,
"step": 2435,
"valid_targets_mean": 2834.9,
"valid_targets_min": 721
},
{
"epoch": 3.9165329052969504,
"grad_norm": 0.7003573100002531,
"learning_rate": 1.93596216720995e-05,
"loss": 0.1975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1896560937166214,
"step": 2440,
"valid_targets_mean": 2383.5,
"valid_targets_min": 703
},
{
"epoch": 3.924558587479936,
"grad_norm": 0.7987554233995582,
"learning_rate": 1.9279607092001534e-05,
"loss": 0.1912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17562270164489746,
"step": 2445,
"valid_targets_mean": 1630.9,
"valid_targets_min": 812
},
{
"epoch": 3.932584269662921,
"grad_norm": 0.7727774163624671,
"learning_rate": 1.9199604055751718e-05,
"loss": 0.1937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2166813164949417,
"step": 2450,
"valid_targets_mean": 2261.4,
"valid_targets_min": 881
},
{
"epoch": 3.940609951845907,
"grad_norm": 0.8131949994370706,
"learning_rate": 1.9119613845348935e-05,
"loss": 0.1931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1931370496749878,
"step": 2455,
"valid_targets_mean": 2146.0,
"valid_targets_min": 665
},
{
"epoch": 3.9486356340288924,
"grad_norm": 0.7543765118463652,
"learning_rate": 1.9039637742586545e-05,
"loss": 0.1935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18845586478710175,
"step": 2460,
"valid_targets_mean": 1944.2,
"valid_targets_min": 990
},
{
"epoch": 3.956661316211878,
"grad_norm": 0.8095687971348281,
"learning_rate": 1.8959677029031832e-05,
"loss": 0.1764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19238343834877014,
"step": 2465,
"valid_targets_mean": 2164.7,
"valid_targets_min": 890
},
{
"epoch": 3.9646869983948636,
"grad_norm": 0.8236185986919573,
"learning_rate": 1.8879732986005476e-05,
"loss": 0.2015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19786785542964935,
"step": 2470,
"valid_targets_mean": 1725.6,
"valid_targets_min": 744
},
{
"epoch": 3.972712680577849,
"grad_norm": 0.9277927282461786,
"learning_rate": 1.8799806894561042e-05,
"loss": 0.1974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2078876495361328,
"step": 2475,
"valid_targets_mean": 2197.4,
"valid_targets_min": 1186
},
{
"epoch": 3.980738362760835,
"grad_norm": 0.7514885129339864,
"learning_rate": 1.8719900035464412e-05,
"loss": 0.1936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16057060658931732,
"step": 2480,
"valid_targets_mean": 1605.2,
"valid_targets_min": 645
},
{
"epoch": 3.98876404494382,
"grad_norm": 0.6523845582349944,
"learning_rate": 1.864001368917328e-05,
"loss": 0.1882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19543814659118652,
"step": 2485,
"valid_targets_mean": 2637.5,
"valid_targets_min": 689
},
{
"epoch": 3.9967897271268056,
"grad_norm": 0.7614952279373743,
"learning_rate": 1.856014913581666e-05,
"loss": 0.1922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19684013724327087,
"step": 2490,
"valid_targets_mean": 2091.9,
"valid_targets_min": 786
},
{
"epoch": 4.004815409309791,
"grad_norm": 0.7598894989729227,
"learning_rate": 1.8480307655174322e-05,
"loss": 0.1732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16470491886138916,
"step": 2495,
"valid_targets_mean": 1833.8,
"valid_targets_min": 567
},
{
"epoch": 4.012841091492777,
"grad_norm": 0.7220917183884463,
"learning_rate": 1.8400490526656322e-05,
"loss": 0.1642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1639862060546875,
"step": 2500,
"valid_targets_mean": 2315.0,
"valid_targets_min": 835
},
{
"epoch": 4.020866773675762,
"grad_norm": 0.7146247317400145,
"learning_rate": 1.8320699029282477e-05,
"loss": 0.1459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1569473147392273,
"step": 2505,
"valid_targets_mean": 2658.7,
"valid_targets_min": 617
},
{
"epoch": 4.028892455858748,
"grad_norm": 0.7357502371403062,
"learning_rate": 1.8240934441661898e-05,
"loss": 0.1693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15852639079093933,
"step": 2510,
"valid_targets_mean": 2141.9,
"valid_targets_min": 551
},
{
"epoch": 4.036918138041734,
"grad_norm": 0.9021773647071464,
"learning_rate": 1.8161198041972478e-05,
"loss": 0.1611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15807832777500153,
"step": 2515,
"valid_targets_mean": 1685.3,
"valid_targets_min": 687
},
{
"epoch": 4.044943820224719,
"grad_norm": 0.8267907751505533,
"learning_rate": 1.8081491107940405e-05,
"loss": 0.157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1717631220817566,
"step": 2520,
"valid_targets_mean": 1869.8,
"valid_targets_min": 922
},
{
"epoch": 4.052969502407705,
"grad_norm": 0.8272280336042476,
"learning_rate": 1.8001814916819706e-05,
"loss": 0.1633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15036287903785706,
"step": 2525,
"valid_targets_mean": 2030.8,
"valid_targets_min": 660
},
{
"epoch": 4.06099518459069,
"grad_norm": 0.750320928818136,
"learning_rate": 1.7922170745371782e-05,
"loss": 0.1631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15992726385593414,
"step": 2530,
"valid_targets_mean": 2341.8,
"valid_targets_min": 752
},
{
"epoch": 4.069020866773676,
"grad_norm": 0.710265161172677,
"learning_rate": 1.7842559869844926e-05,
"loss": 0.1616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16481420397758484,
"step": 2535,
"valid_targets_mean": 2390.8,
"valid_targets_min": 879
},
{
"epoch": 4.077046548956662,
"grad_norm": 0.6932511885249728,
"learning_rate": 1.7762983565953882e-05,
"loss": 0.1604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15228337049484253,
"step": 2540,
"valid_targets_mean": 2558.4,
"valid_targets_min": 1005
},
{
"epoch": 4.085072231139647,
"grad_norm": 0.9665904156345935,
"learning_rate": 1.768344310885941e-05,
"loss": 0.1585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1605364829301834,
"step": 2545,
"valid_targets_mean": 1897.4,
"valid_targets_min": 619
},
{
"epoch": 4.093097913322633,
"grad_norm": 0.8370869748032498,
"learning_rate": 1.760393977314786e-05,
"loss": 0.1582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1575726568698883,
"step": 2550,
"valid_targets_mean": 1763.5,
"valid_targets_min": 697
},
{
"epoch": 4.101123595505618,
"grad_norm": 0.851361799332316,
"learning_rate": 1.7524474832810715e-05,
"loss": 0.1517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15234051644802094,
"step": 2555,
"valid_targets_mean": 1794.1,
"valid_targets_min": 759
},
{
"epoch": 4.109149277688603,
"grad_norm": 0.8670710844035465,
"learning_rate": 1.7445049561224197e-05,
"loss": 0.158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18183620274066925,
"step": 2560,
"valid_targets_mean": 1944.7,
"valid_targets_min": 802
},
{
"epoch": 4.117174959871589,
"grad_norm": 0.8008124802397306,
"learning_rate": 1.736566523112888e-05,
"loss": 0.1617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1569271683692932,
"step": 2565,
"valid_targets_mean": 1758.4,
"valid_targets_min": 963
},
{
"epoch": 4.125200642054574,
"grad_norm": 0.7244247443223619,
"learning_rate": 1.7286323114609264e-05,
"loss": 0.1652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16013914346694946,
"step": 2570,
"valid_targets_mean": 2266.8,
"valid_targets_min": 695
},
{
"epoch": 4.13322632423756,
"grad_norm": 0.7258758426401232,
"learning_rate": 1.7207024483073395e-05,
"loss": 0.1528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1507132351398468,
"step": 2575,
"valid_targets_mean": 2195.1,
"valid_targets_min": 797
},
{
"epoch": 4.141252006420546,
"grad_norm": 0.7747021374459989,
"learning_rate": 1.7127770607232506e-05,
"loss": 0.165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16840553283691406,
"step": 2580,
"valid_targets_mean": 2432.6,
"valid_targets_min": 899
},
{
"epoch": 4.149277688603531,
"grad_norm": 0.8370328803383551,
"learning_rate": 1.7048562757080658e-05,
"loss": 0.1517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15022283792495728,
"step": 2585,
"valid_targets_mean": 2054.2,
"valid_targets_min": 1080
},
{
"epoch": 4.157303370786517,
"grad_norm": 0.863183572527677,
"learning_rate": 1.6969402201874358e-05,
"loss": 0.1688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18424132466316223,
"step": 2590,
"valid_targets_mean": 1905.8,
"valid_targets_min": 672
},
{
"epoch": 4.165329052969502,
"grad_norm": 0.7325225003293633,
"learning_rate": 1.6890290210112268e-05,
"loss": 0.1648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16462567448616028,
"step": 2595,
"valid_targets_mean": 2701.8,
"valid_targets_min": 884
},
{
"epoch": 4.173354735152488,
"grad_norm": 0.8550527776626037,
"learning_rate": 1.6811228049514828e-05,
"loss": 0.1628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18417339026927948,
"step": 2600,
"valid_targets_mean": 2102.4,
"valid_targets_min": 801
},
{
"epoch": 4.181380417335474,
"grad_norm": 0.7738912822273089,
"learning_rate": 1.6732216987003972e-05,
"loss": 0.1657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14265528321266174,
"step": 2605,
"valid_targets_mean": 2429.2,
"valid_targets_min": 726
},
{
"epoch": 4.189406099518459,
"grad_norm": 0.846741833270454,
"learning_rate": 1.6653258288682815e-05,
"loss": 0.1591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.165584534406662,
"step": 2610,
"valid_targets_mean": 2022.3,
"valid_targets_min": 682
},
{
"epoch": 4.197431781701445,
"grad_norm": 0.7860604699119313,
"learning_rate": 1.6574353219815383e-05,
"loss": 0.1622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17301838099956512,
"step": 2615,
"valid_targets_mean": 2509.3,
"valid_targets_min": 864
},
{
"epoch": 4.20545746388443,
"grad_norm": 0.6042094358589516,
"learning_rate": 1.6495503044806305e-05,
"loss": 0.1597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1679677814245224,
"step": 2620,
"valid_targets_mean": 4193.2,
"valid_targets_min": 1385
},
{
"epoch": 4.213483146067416,
"grad_norm": 0.8435205892952795,
"learning_rate": 1.641670902718058e-05,
"loss": 0.1666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16670869290828705,
"step": 2625,
"valid_targets_mean": 1701.4,
"valid_targets_min": 750
},
{
"epoch": 4.221508828250402,
"grad_norm": 0.8069505344707392,
"learning_rate": 1.633797242956332e-05,
"loss": 0.168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17490074038505554,
"step": 2630,
"valid_targets_mean": 2187.9,
"valid_targets_min": 808
},
{
"epoch": 4.229534510433387,
"grad_norm": 0.7681332462758949,
"learning_rate": 1.625929451365951e-05,
"loss": 0.1565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.139631450176239,
"step": 2635,
"valid_targets_mean": 2152.5,
"valid_targets_min": 825
},
{
"epoch": 4.237560192616373,
"grad_norm": 0.7743079695057093,
"learning_rate": 1.618067654023381e-05,
"loss": 0.1593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15092188119888306,
"step": 2640,
"valid_targets_mean": 2007.7,
"valid_targets_min": 788
},
{
"epoch": 4.245585874799358,
"grad_norm": 0.8045522607448906,
"learning_rate": 1.6102119769090325e-05,
"loss": 0.159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15477828681468964,
"step": 2645,
"valid_targets_mean": 2015.0,
"valid_targets_min": 1041
},
{
"epoch": 4.253611556982343,
"grad_norm": 0.7842184804024716,
"learning_rate": 1.6023625459052442e-05,
"loss": 0.1623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14832571148872375,
"step": 2650,
"valid_targets_mean": 1659.8,
"valid_targets_min": 739
},
{
"epoch": 4.261637239165329,
"grad_norm": 0.8453627359844748,
"learning_rate": 1.594519486794264e-05,
"loss": 0.1634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17142939567565918,
"step": 2655,
"valid_targets_mean": 1726.5,
"valid_targets_min": 650
},
{
"epoch": 4.269662921348314,
"grad_norm": 0.68904498722134,
"learning_rate": 1.586682925256235e-05,
"loss": 0.1541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1561916470527649,
"step": 2660,
"valid_targets_mean": 2864.8,
"valid_targets_min": 946
},
{
"epoch": 4.2776886035313,
"grad_norm": 0.7432020014717042,
"learning_rate": 1.5788529868671792e-05,
"loss": 0.1553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16694585978984833,
"step": 2665,
"valid_targets_mean": 2652.6,
"valid_targets_min": 724
},
{
"epoch": 4.285714285714286,
"grad_norm": 0.8573411887216612,
"learning_rate": 1.5710297970969893e-05,
"loss": 0.1604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16618192195892334,
"step": 2670,
"valid_targets_mean": 1786.7,
"valid_targets_min": 591
},
{
"epoch": 4.293739967897271,
"grad_norm": 0.8616537427897845,
"learning_rate": 1.563213481307413e-05,
"loss": 0.1607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1844010055065155,
"step": 2675,
"valid_targets_mean": 2021.8,
"valid_targets_min": 859
},
{
"epoch": 4.301765650080257,
"grad_norm": 0.7980069825955369,
"learning_rate": 1.5554041647500485e-05,
"loss": 0.1652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18299910426139832,
"step": 2680,
"valid_targets_mean": 2434.2,
"valid_targets_min": 597
},
{
"epoch": 4.309791332263242,
"grad_norm": 0.7786630652444673,
"learning_rate": 1.5476019725643342e-05,
"loss": 0.1631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17932823300361633,
"step": 2685,
"valid_targets_mean": 2057.4,
"valid_targets_min": 652
},
{
"epoch": 4.317817014446228,
"grad_norm": 0.8119610141424436,
"learning_rate": 1.5398070297755465e-05,
"loss": 0.1652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1823132038116455,
"step": 2690,
"valid_targets_mean": 2320.1,
"valid_targets_min": 633
},
{
"epoch": 4.325842696629214,
"grad_norm": 0.8571455033898614,
"learning_rate": 1.5320194612927935e-05,
"loss": 0.1661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19664575159549713,
"step": 2695,
"valid_targets_mean": 2258.8,
"valid_targets_min": 826
},
{
"epoch": 4.333868378812199,
"grad_norm": 0.810464889478973,
"learning_rate": 1.5242393919070146e-05,
"loss": 0.1665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16627417504787445,
"step": 2700,
"valid_targets_mean": 1929.9,
"valid_targets_min": 821
},
{
"epoch": 4.341894060995185,
"grad_norm": 0.8148753400319572,
"learning_rate": 1.5164669462889825e-05,
"loss": 0.1637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14969250559806824,
"step": 2705,
"valid_targets_mean": 1406.3,
"valid_targets_min": 760
},
{
"epoch": 4.34991974317817,
"grad_norm": 0.7742908439387767,
"learning_rate": 1.5087022489873016e-05,
"loss": 0.1619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15673664212226868,
"step": 2710,
"valid_targets_mean": 2016.5,
"valid_targets_min": 776
},
{
"epoch": 4.357945425361156,
"grad_norm": 0.8241151599270962,
"learning_rate": 1.5009454244264156e-05,
"loss": 0.1627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16360478103160858,
"step": 2715,
"valid_targets_mean": 2072.0,
"valid_targets_min": 563
},
{
"epoch": 4.365971107544142,
"grad_norm": 0.7258922171050899,
"learning_rate": 1.4931965969046113e-05,
"loss": 0.1671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1603405475616455,
"step": 2720,
"valid_targets_mean": 2382.3,
"valid_targets_min": 1182
},
{
"epoch": 4.373996789727126,
"grad_norm": 0.746718193097595,
"learning_rate": 1.4854558905920303e-05,
"loss": 0.1578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1559460312128067,
"step": 2725,
"valid_targets_mean": 2081.0,
"valid_targets_min": 622
},
{
"epoch": 4.382022471910112,
"grad_norm": 0.8753737997888681,
"learning_rate": 1.4777234295286742e-05,
"loss": 0.162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15468575060367584,
"step": 2730,
"valid_targets_mean": 1593.1,
"valid_targets_min": 634
},
{
"epoch": 4.390048154093098,
"grad_norm": 0.8037530854979934,
"learning_rate": 1.469999337622421e-05,
"loss": 0.1671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16917386651039124,
"step": 2735,
"valid_targets_mean": 2151.1,
"valid_targets_min": 627
},
{
"epoch": 4.398073836276083,
"grad_norm": 0.8500743057064097,
"learning_rate": 1.4622837386470373e-05,
"loss": 0.16,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.166961207985878,
"step": 2740,
"valid_targets_mean": 1751.0,
"valid_targets_min": 740
},
{
"epoch": 4.406099518459069,
"grad_norm": 0.8311068179954831,
"learning_rate": 1.4545767562401973e-05,
"loss": 0.17,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15660396218299866,
"step": 2745,
"valid_targets_mean": 1665.8,
"valid_targets_min": 728
},
{
"epoch": 4.414125200642054,
"grad_norm": 0.7888439337676993,
"learning_rate": 1.4468785139014986e-05,
"loss": 0.1608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16615541279315948,
"step": 2750,
"valid_targets_mean": 2020.2,
"valid_targets_min": 883
},
{
"epoch": 4.42215088282504,
"grad_norm": 0.7271702792121916,
"learning_rate": 1.4391891349904859e-05,
"loss": 0.1507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1305883228778839,
"step": 2755,
"valid_targets_mean": 1820.6,
"valid_targets_min": 780
},
{
"epoch": 4.430176565008026,
"grad_norm": 0.8100289776181084,
"learning_rate": 1.4315087427246706e-05,
"loss": 0.1622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16775105893611908,
"step": 2760,
"valid_targets_mean": 2011.5,
"valid_targets_min": 772
},
{
"epoch": 4.438202247191011,
"grad_norm": 0.8341886619638011,
"learning_rate": 1.4238374601775617e-05,
"loss": 0.1667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.175085186958313,
"step": 2765,
"valid_targets_mean": 2030.1,
"valid_targets_min": 513
},
{
"epoch": 4.446227929373997,
"grad_norm": 0.7861876079484966,
"learning_rate": 1.4161754102766892e-05,
"loss": 0.1644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16237448155879974,
"step": 2770,
"valid_targets_mean": 2125.4,
"valid_targets_min": 639
},
{
"epoch": 4.454253611556982,
"grad_norm": 0.7974795438274449,
"learning_rate": 1.4085227158016355e-05,
"loss": 0.1604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1793215423822403,
"step": 2775,
"valid_targets_mean": 2240.8,
"valid_targets_min": 888
},
{
"epoch": 4.462279293739968,
"grad_norm": 0.7610583199711114,
"learning_rate": 1.4008794993820676e-05,
"loss": 0.1647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16052846610546112,
"step": 2780,
"valid_targets_mean": 2020.9,
"valid_targets_min": 1038
},
{
"epoch": 4.470304975922954,
"grad_norm": 0.763307262888446,
"learning_rate": 1.3932458834957745e-05,
"loss": 0.1744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16174271702766418,
"step": 2785,
"valid_targets_mean": 2038.5,
"valid_targets_min": 869
},
{
"epoch": 4.478330658105939,
"grad_norm": 0.7090993165393538,
"learning_rate": 1.3856219904667012e-05,
"loss": 0.1617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17628321051597595,
"step": 2790,
"valid_targets_mean": 2747.6,
"valid_targets_min": 1289
},
{
"epoch": 4.486356340288925,
"grad_norm": 0.7844335568292791,
"learning_rate": 1.3780079424629893e-05,
"loss": 0.1675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1669953465461731,
"step": 2795,
"valid_targets_mean": 2251.4,
"valid_targets_min": 792
},
{
"epoch": 4.49438202247191,
"grad_norm": 0.7237391782540498,
"learning_rate": 1.3704038614950221e-05,
"loss": 0.1634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1593700349330902,
"step": 2800,
"valid_targets_mean": 2246.4,
"valid_targets_min": 635
},
{
"epoch": 4.502407704654896,
"grad_norm": 0.6662862730256653,
"learning_rate": 1.362809869413466e-05,
"loss": 0.1625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15161554515361786,
"step": 2805,
"valid_targets_mean": 3524.4,
"valid_targets_min": 656
},
{
"epoch": 4.510433386837882,
"grad_norm": 0.7261025807643624,
"learning_rate": 1.355226087907319e-05,
"loss": 0.1699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16334782540798187,
"step": 2810,
"valid_targets_mean": 2492.2,
"valid_targets_min": 635
},
{
"epoch": 4.518459069020867,
"grad_norm": 0.6893457421297444,
"learning_rate": 1.3476526385019609e-05,
"loss": 0.1642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14589521288871765,
"step": 2815,
"valid_targets_mean": 2433.6,
"valid_targets_min": 996
},
{
"epoch": 4.526484751203852,
"grad_norm": 0.9075567951066162,
"learning_rate": 1.3400896425572078e-05,
"loss": 0.1622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18327827751636505,
"step": 2820,
"valid_targets_mean": 1756.2,
"valid_targets_min": 714
},
{
"epoch": 4.534510433386838,
"grad_norm": 0.7717323287249781,
"learning_rate": 1.3325372212653638e-05,
"loss": 0.1586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17693357169628143,
"step": 2825,
"valid_targets_mean": 2270.5,
"valid_targets_min": 1109
},
{
"epoch": 4.542536115569823,
"grad_norm": 0.7535197151026929,
"learning_rate": 1.324995495649281e-05,
"loss": 0.1584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1388244926929474,
"step": 2830,
"valid_targets_mean": 2134.2,
"valid_targets_min": 704
},
{
"epoch": 4.550561797752809,
"grad_norm": 0.7741815820615187,
"learning_rate": 1.3174645865604201e-05,
"loss": 0.1651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16817861795425415,
"step": 2835,
"valid_targets_mean": 2520.7,
"valid_targets_min": 826
},
{
"epoch": 4.558587479935794,
"grad_norm": 0.8231972416370127,
"learning_rate": 1.3099446146769146e-05,
"loss": 0.1629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17522352933883667,
"step": 2840,
"valid_targets_mean": 2127.5,
"valid_targets_min": 727
},
{
"epoch": 4.56661316211878,
"grad_norm": 0.797161483789656,
"learning_rate": 1.302435700501635e-05,
"loss": 0.1728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16017599403858185,
"step": 2845,
"valid_targets_mean": 2187.6,
"valid_targets_min": 618
},
{
"epoch": 4.574638844301766,
"grad_norm": 0.830389247613262,
"learning_rate": 1.294937964360259e-05,
"loss": 0.1592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17233622074127197,
"step": 2850,
"valid_targets_mean": 1991.4,
"valid_targets_min": 728
},
{
"epoch": 4.582664526484751,
"grad_norm": 0.8604436677037445,
"learning_rate": 1.2874515263993435e-05,
"loss": 0.1646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18079304695129395,
"step": 2855,
"valid_targets_mean": 1904.0,
"valid_targets_min": 738
},
{
"epoch": 4.590690208667737,
"grad_norm": 0.8182705272129311,
"learning_rate": 1.2799765065843994e-05,
"loss": 0.1664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16060321033000946,
"step": 2860,
"valid_targets_mean": 1708.9,
"valid_targets_min": 709
},
{
"epoch": 4.598715890850722,
"grad_norm": 0.7893789950794092,
"learning_rate": 1.2725130246979683e-05,
"loss": 0.1602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15286454558372498,
"step": 2865,
"valid_targets_mean": 1979.1,
"valid_targets_min": 909
},
{
"epoch": 4.606741573033708,
"grad_norm": 0.6505588257536744,
"learning_rate": 1.2650612003377036e-05,
"loss": 0.1597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14304134249687195,
"step": 2870,
"valid_targets_mean": 2717.9,
"valid_targets_min": 1156
},
{
"epoch": 4.614767255216694,
"grad_norm": 0.78593772720222,
"learning_rate": 1.2576211529144554e-05,
"loss": 0.16,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15942759811878204,
"step": 2875,
"valid_targets_mean": 2011.0,
"valid_targets_min": 873
},
{
"epoch": 4.622792937399679,
"grad_norm": 0.8273283308452407,
"learning_rate": 1.2501930016503541e-05,
"loss": 0.1671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17127399146556854,
"step": 2880,
"valid_targets_mean": 1755.8,
"valid_targets_min": 774
},
{
"epoch": 4.630818619582665,
"grad_norm": 0.7348995377336468,
"learning_rate": 1.2427768655769024e-05,
"loss": 0.1884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22157861292362213,
"step": 2885,
"valid_targets_mean": 2057.2,
"valid_targets_min": 675
},
{
"epoch": 4.63884430176565,
"grad_norm": 0.8505145389671085,
"learning_rate": 1.2353728635330667e-05,
"loss": 0.1636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16335329413414001,
"step": 2890,
"valid_targets_mean": 1816.2,
"valid_targets_min": 625
},
{
"epoch": 4.646869983948635,
"grad_norm": 1.37076025694794,
"learning_rate": 1.2279811141633735e-05,
"loss": 0.171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1675649881362915,
"step": 2895,
"valid_targets_mean": 2360.0,
"valid_targets_min": 636
},
{
"epoch": 4.654895666131621,
"grad_norm": 0.732275170804169,
"learning_rate": 1.2206017359160075e-05,
"loss": 0.1564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1485610008239746,
"step": 2900,
"valid_targets_mean": 1736.9,
"valid_targets_min": 700
},
{
"epoch": 4.662921348314606,
"grad_norm": 0.8216973272949605,
"learning_rate": 1.2132348470409143e-05,
"loss": 0.1689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18894213438034058,
"step": 2905,
"valid_targets_mean": 2240.9,
"valid_targets_min": 1017
},
{
"epoch": 4.670947030497592,
"grad_norm": 0.8075689232117615,
"learning_rate": 1.2058805655879038e-05,
"loss": 0.1607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16298025846481323,
"step": 2910,
"valid_targets_mean": 2005.5,
"valid_targets_min": 796
},
{
"epoch": 4.678972712680578,
"grad_norm": 0.8159417807899707,
"learning_rate": 1.198539009404762e-05,
"loss": 0.1637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16406571865081787,
"step": 2915,
"valid_targets_mean": 1778.8,
"valid_targets_min": 727
},
{
"epoch": 4.686998394863563,
"grad_norm": 0.8256426953405346,
"learning_rate": 1.1912102961353584e-05,
"loss": 0.1636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17584344744682312,
"step": 2920,
"valid_targets_mean": 1622.3,
"valid_targets_min": 936
},
{
"epoch": 4.695024077046549,
"grad_norm": 0.7691107031706801,
"learning_rate": 1.1838945432177635e-05,
"loss": 0.1699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18694257736206055,
"step": 2925,
"valid_targets_mean": 2771.9,
"valid_targets_min": 1366
},
{
"epoch": 4.703049759229534,
"grad_norm": 0.7516487224153081,
"learning_rate": 1.1765918678823662e-05,
"loss": 0.1643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15113398432731628,
"step": 2930,
"valid_targets_mean": 1985.2,
"valid_targets_min": 1092
},
{
"epoch": 4.71107544141252,
"grad_norm": 0.7618974789209155,
"learning_rate": 1.1693023871499957e-05,
"loss": 0.1659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.165465846657753,
"step": 2935,
"valid_targets_mean": 2225.2,
"valid_targets_min": 746
},
{
"epoch": 4.719101123595506,
"grad_norm": 0.8149074036818159,
"learning_rate": 1.1620262178300456e-05,
"loss": 0.1597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16010752320289612,
"step": 2940,
"valid_targets_mean": 1913.2,
"valid_targets_min": 715
},
{
"epoch": 4.727126805778491,
"grad_norm": 0.8197427071898096,
"learning_rate": 1.1547634765186016e-05,
"loss": 0.1691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17915387451648712,
"step": 2945,
"valid_targets_mean": 2063.6,
"valid_targets_min": 645
},
{
"epoch": 4.735152487961477,
"grad_norm": 0.7472007206086239,
"learning_rate": 1.1475142795965757e-05,
"loss": 0.1592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14832112193107605,
"step": 2950,
"valid_targets_mean": 2198.4,
"valid_targets_min": 703
},
{
"epoch": 4.743178170144462,
"grad_norm": 0.716859850891493,
"learning_rate": 1.140278743227837e-05,
"loss": 0.1763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1730707287788391,
"step": 2955,
"valid_targets_mean": 2579.7,
"valid_targets_min": 1013
},
{
"epoch": 4.751203852327448,
"grad_norm": 0.7593041479712695,
"learning_rate": 1.1330569833573551e-05,
"loss": 0.1582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16250699758529663,
"step": 2960,
"valid_targets_mean": 2219.4,
"valid_targets_min": 593
},
{
"epoch": 4.759229534510434,
"grad_norm": 0.7933693825582795,
"learning_rate": 1.1258491157093396e-05,
"loss": 0.1585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1603544056415558,
"step": 2965,
"valid_targets_mean": 2217.6,
"valid_targets_min": 954
},
{
"epoch": 4.767255216693419,
"grad_norm": 0.7743905745905229,
"learning_rate": 1.1186552557853825e-05,
"loss": 0.1579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1547103375196457,
"step": 2970,
"valid_targets_mean": 2139.5,
"valid_targets_min": 909
},
{
"epoch": 4.775280898876405,
"grad_norm": 0.820583631476114,
"learning_rate": 1.1114755188626168e-05,
"loss": 0.1587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1643066108226776,
"step": 2975,
"valid_targets_mean": 2056.4,
"valid_targets_min": 1132
},
{
"epoch": 4.78330658105939,
"grad_norm": 0.8466563247928943,
"learning_rate": 1.104310019991857e-05,
"loss": 0.1655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1671457588672638,
"step": 2980,
"valid_targets_mean": 1896.4,
"valid_targets_min": 888
},
{
"epoch": 4.791332263242376,
"grad_norm": 0.8354506195581702,
"learning_rate": 1.0971588739957656e-05,
"loss": 0.173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16162726283073425,
"step": 2985,
"valid_targets_mean": 2007.1,
"valid_targets_min": 591
},
{
"epoch": 4.799357945425362,
"grad_norm": 1.062465812109398,
"learning_rate": 1.0900221954670088e-05,
"loss": 0.1657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17890310287475586,
"step": 2990,
"valid_targets_mean": 1936.5,
"valid_targets_min": 638
},
{
"epoch": 4.807383627608346,
"grad_norm": 0.8028726047167257,
"learning_rate": 1.0829000987664182e-05,
"loss": 0.1608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16547292470932007,
"step": 2995,
"valid_targets_mean": 2699.4,
"valid_targets_min": 683
},
{
"epoch": 4.815409309791332,
"grad_norm": 0.8256326317127171,
"learning_rate": 1.0757926980211631e-05,
"loss": 0.1678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1672663390636444,
"step": 3000,
"valid_targets_mean": 1877.8,
"valid_targets_min": 518
},
{
"epoch": 4.823434991974318,
"grad_norm": 0.7478820911221347,
"learning_rate": 1.0687001071229193e-05,
"loss": 0.151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1408068835735321,
"step": 3005,
"valid_targets_mean": 1811.9,
"valid_targets_min": 959
},
{
"epoch": 4.831460674157303,
"grad_norm": 0.726272372822568,
"learning_rate": 1.0616224397260418e-05,
"loss": 0.1585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15432113409042358,
"step": 3010,
"valid_targets_mean": 2357.8,
"valid_targets_min": 893
},
{
"epoch": 4.839486356340289,
"grad_norm": 0.7902014084251503,
"learning_rate": 1.0545598092457486e-05,
"loss": 0.1717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18471723794937134,
"step": 3015,
"valid_targets_mean": 2332.9,
"valid_targets_min": 1070
},
{
"epoch": 4.847512038523274,
"grad_norm": 0.7605054462637847,
"learning_rate": 1.0475123288562973e-05,
"loss": 0.1638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17729586362838745,
"step": 3020,
"valid_targets_mean": 2387.9,
"valid_targets_min": 1055
},
{
"epoch": 4.85553772070626,
"grad_norm": 0.7484290704810759,
"learning_rate": 1.0404801114891778e-05,
"loss": 0.1601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16589263081550598,
"step": 3025,
"valid_targets_mean": 2440.9,
"valid_targets_min": 662
},
{
"epoch": 4.863563402889246,
"grad_norm": 0.856515566605694,
"learning_rate": 1.033463269831299e-05,
"loss": 0.1639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1638427972793579,
"step": 3030,
"valid_targets_mean": 1848.2,
"valid_targets_min": 818
},
{
"epoch": 4.871589085072231,
"grad_norm": 0.8236028327289647,
"learning_rate": 1.0264619163231806e-05,
"loss": 0.1703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14224272966384888,
"step": 3035,
"valid_targets_mean": 1927.8,
"valid_targets_min": 634
},
{
"epoch": 4.879614767255217,
"grad_norm": 0.8834260640383598,
"learning_rate": 1.0194761631571582e-05,
"loss": 0.1659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1616498827934265,
"step": 3040,
"valid_targets_mean": 1653.1,
"valid_targets_min": 724
},
{
"epoch": 4.887640449438202,
"grad_norm": 0.884548808230801,
"learning_rate": 1.0125061222755803e-05,
"loss": 0.1627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16663256287574768,
"step": 3045,
"valid_targets_mean": 1720.1,
"valid_targets_min": 734
},
{
"epoch": 4.895666131621188,
"grad_norm": 0.749412699231492,
"learning_rate": 1.0055519053690143e-05,
"loss": 0.1675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17901411652565002,
"step": 3050,
"valid_targets_mean": 2867.6,
"valid_targets_min": 957
},
{
"epoch": 4.903691813804174,
"grad_norm": 0.7064928300374316,
"learning_rate": 9.986136238744611e-06,
"loss": 0.1566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14298474788665771,
"step": 3055,
"valid_targets_mean": 2419.4,
"valid_targets_min": 720
},
{
"epoch": 4.911717495987159,
"grad_norm": 0.775858514439901,
"learning_rate": 9.916913889735631e-06,
"loss": 0.1604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1682652235031128,
"step": 3060,
"valid_targets_mean": 2224.8,
"valid_targets_min": 723
},
{
"epoch": 4.919743178170145,
"grad_norm": 0.7840845068588912,
"learning_rate": 9.847853115908287e-06,
"loss": 0.1651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16616985201835632,
"step": 3065,
"valid_targets_mean": 2093.0,
"valid_targets_min": 898
},
{
"epoch": 4.9277688603531296,
"grad_norm": 0.7358639310688878,
"learning_rate": 9.778955023918522e-06,
"loss": 0.1631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16126513481140137,
"step": 3070,
"valid_targets_mean": 2444.2,
"valid_targets_min": 781
},
{
"epoch": 4.935794542536115,
"grad_norm": 0.7019002418904744,
"learning_rate": 9.710220717815378e-06,
"loss": 0.1589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1442476511001587,
"step": 3075,
"valid_targets_mean": 2195.4,
"valid_targets_min": 858
},
{
"epoch": 4.943820224719101,
"grad_norm": 0.8891523546612572,
"learning_rate": 9.641651299023356e-06,
"loss": 0.1657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17019495368003845,
"step": 3080,
"valid_targets_mean": 1681.1,
"valid_targets_min": 613
},
{
"epoch": 4.951845906902086,
"grad_norm": 0.8057149797037921,
"learning_rate": 9.573247866324735e-06,
"loss": 0.158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14473962783813477,
"step": 3085,
"valid_targets_mean": 1626.6,
"valid_targets_min": 704
},
{
"epoch": 4.959871589085072,
"grad_norm": 0.9372704511945662,
"learning_rate": 9.505011515841955e-06,
"loss": 0.1738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16392774879932404,
"step": 3090,
"valid_targets_mean": 2301.2,
"valid_targets_min": 798
},
{
"epoch": 4.967897271268058,
"grad_norm": 0.8552067075934405,
"learning_rate": 9.436943341020086e-06,
"loss": 0.1555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1627275049686432,
"step": 3095,
"valid_targets_mean": 2126.2,
"valid_targets_min": 777
},
{
"epoch": 4.975922953451043,
"grad_norm": 0.7875758040462811,
"learning_rate": 9.369044432609286e-06,
"loss": 0.1644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15442267060279846,
"step": 3100,
"valid_targets_mean": 1900.0,
"valid_targets_min": 790
},
{
"epoch": 4.983948635634029,
"grad_norm": 0.7598316679466666,
"learning_rate": 9.301315878647303e-06,
"loss": 0.1578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1592252254486084,
"step": 3105,
"valid_targets_mean": 1947.6,
"valid_targets_min": 612
},
{
"epoch": 4.991974317817014,
"grad_norm": 0.8310232291090573,
"learning_rate": 9.233758764442093e-06,
"loss": 0.1654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15542343258857727,
"step": 3110,
"valid_targets_mean": 2550.7,
"valid_targets_min": 763
},
{
"epoch": 5.0,
"grad_norm": 0.812388817451886,
"learning_rate": 9.166374172554362e-06,
"loss": 0.1549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14916843175888062,
"step": 3115,
"valid_targets_mean": 1729.6,
"valid_targets_min": 663
},
{
"epoch": 5.008025682182986,
"grad_norm": 0.7607033094606126,
"learning_rate": 9.099163182780284e-06,
"loss": 0.1383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.135885089635849,
"step": 3120,
"valid_targets_mean": 1814.1,
"valid_targets_min": 1124
},
{
"epoch": 5.016051364365971,
"grad_norm": 0.8736465666549718,
"learning_rate": 9.032126872134158e-06,
"loss": 0.1433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13772378861904144,
"step": 3125,
"valid_targets_mean": 1659.3,
"valid_targets_min": 718
},
{
"epoch": 5.024077046548957,
"grad_norm": 0.7904249272604563,
"learning_rate": 8.965266314831137e-06,
"loss": 0.1398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13139450550079346,
"step": 3130,
"valid_targets_mean": 1946.4,
"valid_targets_min": 732
},
{
"epoch": 5.032102728731942,
"grad_norm": 0.7929407682892132,
"learning_rate": 8.898582582270068e-06,
"loss": 0.1411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14323486387729645,
"step": 3135,
"valid_targets_mean": 1973.4,
"valid_targets_min": 746
},
{
"epoch": 5.040128410914928,
"grad_norm": 0.866269311457836,
"learning_rate": 8.83207674301628e-06,
"loss": 0.1468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14333856105804443,
"step": 3140,
"valid_targets_mean": 1734.8,
"valid_targets_min": 563
},
{
"epoch": 5.048154093097914,
"grad_norm": 0.9162778441988956,
"learning_rate": 8.765749862784455e-06,
"loss": 0.1456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15251901745796204,
"step": 3145,
"valid_targets_mean": 1654.0,
"valid_targets_min": 591
},
{
"epoch": 5.056179775280899,
"grad_norm": 0.8407736851023895,
"learning_rate": 8.699603004421602e-06,
"loss": 0.1383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13436079025268555,
"step": 3150,
"valid_targets_mean": 2126.9,
"valid_targets_min": 677
},
{
"epoch": 5.064205457463885,
"grad_norm": 0.7832463394899054,
"learning_rate": 8.633637227889955e-06,
"loss": 0.14,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14068548381328583,
"step": 3155,
"valid_targets_mean": 1925.2,
"valid_targets_min": 923
},
{
"epoch": 5.07223113964687,
"grad_norm": 0.8639774265044126,
"learning_rate": 8.567853590250045e-06,
"loss": 0.1435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15971428155899048,
"step": 3160,
"valid_targets_mean": 1906.4,
"valid_targets_min": 802
},
{
"epoch": 5.080256821829855,
"grad_norm": 0.7906584083707138,
"learning_rate": 8.502253145643752e-06,
"loss": 0.1384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14278461039066315,
"step": 3165,
"valid_targets_mean": 2237.5,
"valid_targets_min": 823
},
{
"epoch": 5.088282504012841,
"grad_norm": 0.7628112750420695,
"learning_rate": 8.436836945277368e-06,
"loss": 0.1394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12936154007911682,
"step": 3170,
"valid_targets_mean": 2202.6,
"valid_targets_min": 704
},
{
"epoch": 5.096308186195826,
"grad_norm": 0.8267306131640556,
"learning_rate": 8.371606037404815e-06,
"loss": 0.1405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14580325782299042,
"step": 3175,
"valid_targets_mean": 2161.2,
"valid_targets_min": 771
},
{
"epoch": 5.104333868378812,
"grad_norm": 0.6460612310814934,
"learning_rate": 8.306561467310812e-06,
"loss": 0.1394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12587103247642517,
"step": 3180,
"valid_targets_mean": 3042.2,
"valid_targets_min": 1359
},
{
"epoch": 5.112359550561798,
"grad_norm": 0.8017584928015836,
"learning_rate": 8.241704277294111e-06,
"loss": 0.1429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1343742311000824,
"step": 3185,
"valid_targets_mean": 2129.9,
"valid_targets_min": 1002
},
{
"epoch": 5.120385232744783,
"grad_norm": 0.9038978661911155,
"learning_rate": 8.17703550665084e-06,
"loss": 0.1453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15416087210178375,
"step": 3190,
"valid_targets_mean": 1875.1,
"valid_targets_min": 734
},
{
"epoch": 5.128410914927769,
"grad_norm": 0.8573022613515127,
"learning_rate": 8.112556191657824e-06,
"loss": 0.1483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16371378302574158,
"step": 3195,
"valid_targets_mean": 2166.3,
"valid_targets_min": 768
},
{
"epoch": 5.136436597110754,
"grad_norm": 0.7790246108354407,
"learning_rate": 8.04826736555595e-06,
"loss": 0.1376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13910721242427826,
"step": 3200,
"valid_targets_mean": 1948.4,
"valid_targets_min": 891
},
{
"epoch": 5.14446227929374,
"grad_norm": 0.7766255832740316,
"learning_rate": 7.984170058533675e-06,
"loss": 0.1464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12751339375972748,
"step": 3205,
"valid_targets_mean": 2555.9,
"valid_targets_min": 638
},
{
"epoch": 5.152487961476726,
"grad_norm": 0.7917119654505816,
"learning_rate": 7.920265297710451e-06,
"loss": 0.1389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1495143473148346,
"step": 3210,
"valid_targets_mean": 2617.8,
"valid_targets_min": 801
},
{
"epoch": 5.160513643659711,
"grad_norm": 0.7844470449050925,
"learning_rate": 7.85655410712032e-06,
"loss": 0.1504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15069085359573364,
"step": 3215,
"valid_targets_mean": 2413.8,
"valid_targets_min": 691
},
{
"epoch": 5.168539325842697,
"grad_norm": 0.8339048928177408,
"learning_rate": 7.793037507695478e-06,
"loss": 0.1405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1523759961128235,
"step": 3220,
"valid_targets_mean": 1656.4,
"valid_targets_min": 818
},
{
"epoch": 5.176565008025682,
"grad_norm": 0.7967130499731122,
"learning_rate": 7.729716517249899e-06,
"loss": 0.1468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14771035313606262,
"step": 3225,
"valid_targets_mean": 2035.6,
"valid_targets_min": 722
},
{
"epoch": 5.184590690208668,
"grad_norm": 0.7684917293766128,
"learning_rate": 7.666592150463069e-06,
"loss": 0.1369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12404549866914749,
"step": 3230,
"valid_targets_mean": 2203.1,
"valid_targets_min": 713
},
{
"epoch": 5.192616372391654,
"grad_norm": 0.8176758283630357,
"learning_rate": 7.603665418863693e-06,
"loss": 0.1373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1301923543214798,
"step": 3235,
"valid_targets_mean": 1912.1,
"valid_targets_min": 992
},
{
"epoch": 5.200642054574639,
"grad_norm": 0.838834519570343,
"learning_rate": 7.540937330813487e-06,
"loss": 0.1493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1450478732585907,
"step": 3240,
"valid_targets_mean": 1830.1,
"valid_targets_min": 716
},
{
"epoch": 5.208667736757624,
"grad_norm": 0.85879810687639,
"learning_rate": 7.47840889149104e-06,
"loss": 0.1478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1518646478652954,
"step": 3245,
"valid_targets_mean": 2411.8,
"valid_targets_min": 979
},
{
"epoch": 5.21669341894061,
"grad_norm": 0.9231616255122982,
"learning_rate": 7.416081102875696e-06,
"loss": 0.1458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1643749177455902,
"step": 3250,
"valid_targets_mean": 2091.4,
"valid_targets_min": 776
},
{
"epoch": 5.224719101123595,
"grad_norm": 0.8492677793062714,
"learning_rate": 7.353954963731475e-06,
"loss": 0.1501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13949257135391235,
"step": 3255,
"valid_targets_mean": 1654.9,
"valid_targets_min": 1093
},
{
"epoch": 5.232744783306581,
"grad_norm": 0.7820953395694332,
"learning_rate": 7.292031469591121e-06,
"loss": 0.1453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1359032392501831,
"step": 3260,
"valid_targets_mean": 1941.2,
"valid_targets_min": 787
},
{
"epoch": 5.240770465489566,
"grad_norm": 0.7968901999980463,
"learning_rate": 7.230311612740086e-06,
"loss": 0.1358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14728347957134247,
"step": 3265,
"valid_targets_mean": 2289.1,
"valid_targets_min": 826
},
{
"epoch": 5.248796147672552,
"grad_norm": 0.8900568965689445,
"learning_rate": 7.168796382200682e-06,
"loss": 0.1411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14544740319252014,
"step": 3270,
"valid_targets_mean": 1736.2,
"valid_targets_min": 676
},
{
"epoch": 5.256821829855538,
"grad_norm": 0.8484989618392149,
"learning_rate": 7.1074867637162185e-06,
"loss": 0.138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13557720184326172,
"step": 3275,
"valid_targets_mean": 1689.6,
"valid_targets_min": 957
},
{
"epoch": 5.264847512038523,
"grad_norm": 0.7914982828194392,
"learning_rate": 7.046383739735166e-06,
"loss": 0.1504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15681229531764984,
"step": 3280,
"valid_targets_mean": 2608.4,
"valid_targets_min": 1052
},
{
"epoch": 5.272873194221509,
"grad_norm": 0.8523244039078887,
"learning_rate": 6.985488289395479e-06,
"loss": 0.1404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13885071873664856,
"step": 3285,
"valid_targets_mean": 1940.9,
"valid_targets_min": 876
},
{
"epoch": 5.280898876404494,
"grad_norm": 0.9243935198555188,
"learning_rate": 6.924801388508868e-06,
"loss": 0.1494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1328265368938446,
"step": 3290,
"valid_targets_mean": 1775.9,
"valid_targets_min": 641
},
{
"epoch": 5.28892455858748,
"grad_norm": 1.1133751117817525,
"learning_rate": 6.864324009545154e-06,
"loss": 0.1392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14222298562526703,
"step": 3295,
"valid_targets_mean": 1608.2,
"valid_targets_min": 911
},
{
"epoch": 5.296950240770466,
"grad_norm": 0.7767976367343669,
"learning_rate": 6.804057121616714e-06,
"loss": 0.1437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14329108595848083,
"step": 3300,
"valid_targets_mean": 2415.2,
"valid_targets_min": 756
},
{
"epoch": 5.304975922953451,
"grad_norm": 0.9041112781790765,
"learning_rate": 6.744001690462922e-06,
"loss": 0.1439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17742100358009338,
"step": 3305,
"valid_targets_mean": 2027.3,
"valid_targets_min": 658
},
{
"epoch": 5.313001605136437,
"grad_norm": 0.8736023871852377,
"learning_rate": 6.684158678434707e-06,
"loss": 0.1406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14842301607131958,
"step": 3310,
"valid_targets_mean": 2091.2,
"valid_targets_min": 777
},
{
"epoch": 5.321027287319422,
"grad_norm": 0.7618181166503121,
"learning_rate": 6.624529044479109e-06,
"loss": 0.1476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1443331241607666,
"step": 3315,
"valid_targets_mean": 2625.0,
"valid_targets_min": 657
},
{
"epoch": 5.329052969502408,
"grad_norm": 0.8555745405542319,
"learning_rate": 6.565113744123901e-06,
"loss": 0.1364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1390853226184845,
"step": 3320,
"valid_targets_mean": 2440.4,
"valid_targets_min": 679
},
{
"epoch": 5.337078651685394,
"grad_norm": 0.8485080262580758,
"learning_rate": 6.50591372946231e-06,
"loss": 0.1467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15979576110839844,
"step": 3325,
"valid_targets_mean": 2120.2,
"valid_targets_min": 741
},
{
"epoch": 5.345104333868379,
"grad_norm": 0.9223840058497179,
"learning_rate": 6.446929949137748e-06,
"loss": 0.1387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13735276460647583,
"step": 3330,
"valid_targets_mean": 1705.1,
"valid_targets_min": 890
},
{
"epoch": 5.353130016051364,
"grad_norm": 0.831007979180398,
"learning_rate": 6.388163348328582e-06,
"loss": 0.1461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13778018951416016,
"step": 3335,
"valid_targets_mean": 1862.8,
"valid_targets_min": 848
},
{
"epoch": 5.36115569823435,
"grad_norm": 0.8576931373884364,
"learning_rate": 6.329614868733038e-06,
"loss": 0.1345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12894180417060852,
"step": 3340,
"valid_targets_mean": 1832.2,
"valid_targets_min": 504
},
{
"epoch": 5.369181380417335,
"grad_norm": 0.9081132027537362,
"learning_rate": 6.271285448554072e-06,
"loss": 0.148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1540372371673584,
"step": 3345,
"valid_targets_mean": 2121.2,
"valid_targets_min": 827
},
{
"epoch": 5.377207062600321,
"grad_norm": 0.7729268997973129,
"learning_rate": 6.213176022484353e-06,
"loss": 0.1397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13177214562892914,
"step": 3350,
"valid_targets_mean": 2114.1,
"valid_targets_min": 953
},
{
"epoch": 5.385232744783306,
"grad_norm": 0.9645437263591448,
"learning_rate": 6.1552875216912866e-06,
"loss": 0.1399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14385467767715454,
"step": 3355,
"valid_targets_mean": 1654.4,
"valid_targets_min": 742
},
{
"epoch": 5.393258426966292,
"grad_norm": 0.8829811829270534,
"learning_rate": 6.097620873802068e-06,
"loss": 0.1424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14625263214111328,
"step": 3360,
"valid_targets_mean": 2065.6,
"valid_targets_min": 612
},
{
"epoch": 5.401284109149278,
"grad_norm": 0.8201170172984508,
"learning_rate": 6.0401770028888675e-06,
"loss": 0.1441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13578824698925018,
"step": 3365,
"valid_targets_mean": 1911.6,
"valid_targets_min": 776
},
{
"epoch": 5.409309791332263,
"grad_norm": 0.7807754561817747,
"learning_rate": 5.982956829453965e-06,
"loss": 0.1364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14298827946186066,
"step": 3370,
"valid_targets_mean": 2299.7,
"valid_targets_min": 826
},
{
"epoch": 5.417335473515249,
"grad_norm": 0.8242125235152692,
"learning_rate": 5.925961270415042e-06,
"loss": 0.145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14364124834537506,
"step": 3375,
"valid_targets_mean": 1832.5,
"valid_targets_min": 734
},
{
"epoch": 5.425361155698234,
"grad_norm": 0.8447270823261972,
"learning_rate": 5.8691912390904815e-06,
"loss": 0.1437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15039601922035217,
"step": 3380,
"valid_targets_mean": 2066.4,
"valid_targets_min": 730
},
{
"epoch": 5.43338683788122,
"grad_norm": 0.9092987692988171,
"learning_rate": 5.812647645184704e-06,
"loss": 0.1417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15466216206550598,
"step": 3385,
"valid_targets_mean": 1961.2,
"valid_targets_min": 933
},
{
"epoch": 5.441412520064206,
"grad_norm": 0.8683991460939533,
"learning_rate": 5.756331394773624e-06,
"loss": 0.1462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15245194733142853,
"step": 3390,
"valid_targets_mean": 1784.2,
"valid_targets_min": 655
},
{
"epoch": 5.449438202247191,
"grad_norm": 0.892968643755484,
"learning_rate": 5.7002433902901276e-06,
"loss": 0.1488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15332868695259094,
"step": 3395,
"valid_targets_mean": 1742.7,
"valid_targets_min": 816
},
{
"epoch": 5.457463884430177,
"grad_norm": 0.7642059744988553,
"learning_rate": 5.644384530509574e-06,
"loss": 0.1413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14609497785568237,
"step": 3400,
"valid_targets_mean": 2508.6,
"valid_targets_min": 1018
},
{
"epoch": 5.465489566613162,
"grad_norm": 0.8768706215913115,
"learning_rate": 5.588755710535452e-06,
"loss": 0.1432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14894311130046844,
"step": 3405,
"valid_targets_mean": 1854.5,
"valid_targets_min": 621
},
{
"epoch": 5.473515248796148,
"grad_norm": 0.7918482061402888,
"learning_rate": 5.533357821784991e-06,
"loss": 0.1558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20110508799552917,
"step": 3410,
"valid_targets_mean": 2252.2,
"valid_targets_min": 591
},
{
"epoch": 5.481540930979134,
"grad_norm": 0.6880735681435827,
"learning_rate": 5.47819175197488e-06,
"loss": 0.1483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14852222800254822,
"step": 3415,
"valid_targets_mean": 3205.2,
"valid_targets_min": 708
},
{
"epoch": 5.489566613162118,
"grad_norm": 0.6767067170795432,
"learning_rate": 5.42325838510708e-06,
"loss": 0.1366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11822806298732758,
"step": 3420,
"valid_targets_mean": 2824.0,
"valid_targets_min": 802
},
{
"epoch": 5.497592295345104,
"grad_norm": 0.8718548056137807,
"learning_rate": 5.3685586014546075e-06,
"loss": 0.1433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1538342833518982,
"step": 3425,
"valid_targets_mean": 1895.7,
"valid_targets_min": 658
},
{
"epoch": 5.50561797752809,
"grad_norm": 0.8040243257756551,
"learning_rate": 5.314093277547465e-06,
"loss": 0.1411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13354749977588654,
"step": 3430,
"valid_targets_mean": 2219.4,
"valid_targets_min": 776
},
{
"epoch": 5.513643659711075,
"grad_norm": 0.8548517241885055,
"learning_rate": 5.259863286158591e-06,
"loss": 0.1438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13882416486740112,
"step": 3435,
"valid_targets_mean": 2167.7,
"valid_targets_min": 887
},
{
"epoch": 5.521669341894061,
"grad_norm": 0.8964297825625066,
"learning_rate": 5.205869496289846e-06,
"loss": 0.1504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1575285792350769,
"step": 3440,
"valid_targets_mean": 1769.5,
"valid_targets_min": 720
},
{
"epoch": 5.529695024077046,
"grad_norm": 0.7937327005355985,
"learning_rate": 5.152112773158125e-06,
"loss": 0.1341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14235813915729523,
"step": 3445,
"valid_targets_mean": 2031.9,
"valid_targets_min": 851
},
{
"epoch": 5.537720706260032,
"grad_norm": 0.8719446158769936,
"learning_rate": 5.0985939781814765e-06,
"loss": 0.1442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1630193591117859,
"step": 3450,
"valid_targets_mean": 1731.4,
"valid_targets_min": 629
},
{
"epoch": 5.545746388443018,
"grad_norm": 0.8295730035601938,
"learning_rate": 5.045313968965282e-06,
"loss": 0.1346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14717170596122742,
"step": 3455,
"valid_targets_mean": 1955.8,
"valid_targets_min": 950
},
{
"epoch": 5.553772070626003,
"grad_norm": 0.8964496498020716,
"learning_rate": 4.992273599288546e-06,
"loss": 0.1451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14559556543827057,
"step": 3460,
"valid_targets_mean": 1855.2,
"valid_targets_min": 737
},
{
"epoch": 5.561797752808989,
"grad_norm": 0.8774241059648222,
"learning_rate": 4.9394737190902e-06,
"loss": 0.1486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16202348470687866,
"step": 3465,
"valid_targets_mean": 2333.4,
"valid_targets_min": 727
},
{
"epoch": 5.569823434991974,
"grad_norm": 0.7667078264832548,
"learning_rate": 4.88691517445546e-06,
"loss": 0.1352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1312371790409088,
"step": 3470,
"valid_targets_mean": 1970.1,
"valid_targets_min": 1011
},
{
"epoch": 5.57784911717496,
"grad_norm": 0.8467942832579569,
"learning_rate": 4.834598807602317e-06,
"loss": 0.1495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13902528584003448,
"step": 3475,
"valid_targets_mean": 1953.3,
"valid_targets_min": 728
},
{
"epoch": 5.585874799357946,
"grad_norm": 1.1418994519461927,
"learning_rate": 4.78252545686799e-06,
"loss": 0.143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13345175981521606,
"step": 3480,
"valid_targets_mean": 1804.4,
"valid_targets_min": 782
},
{
"epoch": 5.593900481540931,
"grad_norm": 0.829765999744519,
"learning_rate": 4.730695956695532e-06,
"loss": 0.1474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14543312788009644,
"step": 3485,
"valid_targets_mean": 1963.8,
"valid_targets_min": 1141
},
{
"epoch": 5.601926163723917,
"grad_norm": 0.8564170677263149,
"learning_rate": 4.679111137620442e-06,
"loss": 0.1498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14116448163986206,
"step": 3490,
"valid_targets_mean": 1803.9,
"valid_targets_min": 837
},
{
"epoch": 5.609951845906902,
"grad_norm": 0.9258578493411536,
"learning_rate": 4.627771826257341e-06,
"loss": 0.1444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15053588151931763,
"step": 3495,
"valid_targets_mean": 1818.8,
"valid_targets_min": 920
},
{
"epoch": 5.617977528089888,
"grad_norm": 0.7635041251336951,
"learning_rate": 4.576678845286757e-06,
"loss": 0.1391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13723108172416687,
"step": 3500,
"valid_targets_mean": 2557.6,
"valid_targets_min": 679
},
{
"epoch": 5.626003210272874,
"grad_norm": 0.720755360308493,
"learning_rate": 4.525833013441931e-06,
"loss": 0.1348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1270107477903366,
"step": 3505,
"valid_targets_mean": 2256.1,
"valid_targets_min": 716
},
{
"epoch": 5.634028892455858,
"grad_norm": 0.8869362920498091,
"learning_rate": 4.475235145495669e-06,
"loss": 0.1374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1467820107936859,
"step": 3510,
"valid_targets_mean": 1817.4,
"valid_targets_min": 522
},
{
"epoch": 5.642054574638844,
"grad_norm": 0.8025610722259726,
"learning_rate": 4.424886052247339e-06,
"loss": 0.1397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13881070911884308,
"step": 3515,
"valid_targets_mean": 1964.7,
"valid_targets_min": 721
},
{
"epoch": 5.65008025682183,
"grad_norm": 0.7037787309221992,
"learning_rate": 4.374786540509821e-06,
"loss": 0.1404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13750547170639038,
"step": 3520,
"valid_targets_mean": 2488.4,
"valid_targets_min": 1306
},
{
"epoch": 5.658105939004815,
"grad_norm": 0.8339701185276572,
"learning_rate": 4.324937413096628e-06,
"loss": 0.1471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14046938717365265,
"step": 3525,
"valid_targets_mean": 1705.5,
"valid_targets_min": 657
},
{
"epoch": 5.666131621187801,
"grad_norm": 0.7586982214483773,
"learning_rate": 4.275339468809019e-06,
"loss": 0.138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13911622762680054,
"step": 3530,
"valid_targets_mean": 2551.6,
"valid_targets_min": 1126
},
{
"epoch": 5.674157303370786,
"grad_norm": 0.9119810062418106,
"learning_rate": 4.225993502423182e-06,
"loss": 0.1477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1517258733510971,
"step": 3535,
"valid_targets_mean": 1962.5,
"valid_targets_min": 675
},
{
"epoch": 5.682182985553772,
"grad_norm": 0.8619483579361343,
"learning_rate": 4.1769003046775315e-06,
"loss": 0.1513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1552795171737671,
"step": 3540,
"valid_targets_mean": 1997.1,
"valid_targets_min": 950
},
{
"epoch": 5.690208667736758,
"grad_norm": 0.865824081520984,
"learning_rate": 4.128060662260025e-06,
"loss": 0.1426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13369613885879517,
"step": 3545,
"valid_targets_mean": 1609.4,
"valid_targets_min": 665
},
{
"epoch": 5.698234349919743,
"grad_norm": 0.7527647909300139,
"learning_rate": 4.079475357795535e-06,
"loss": 0.1319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12556613981723785,
"step": 3550,
"valid_targets_mean": 2171.1,
"valid_targets_min": 960
},
{
"epoch": 5.706260032102729,
"grad_norm": 1.1716775797352907,
"learning_rate": 4.031145169833342e-06,
"loss": 0.1429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11673303693532944,
"step": 3555,
"valid_targets_mean": 2320.8,
"valid_targets_min": 677
},
{
"epoch": 5.714285714285714,
"grad_norm": 0.9267941895909233,
"learning_rate": 3.9830708728346445e-06,
"loss": 0.1409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15212789177894592,
"step": 3560,
"valid_targets_mean": 1611.5,
"valid_targets_min": 800
},
{
"epoch": 5.7223113964687,
"grad_norm": 1.0419238252836576,
"learning_rate": 3.935253237160132e-06,
"loss": 0.1418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13419196009635925,
"step": 3565,
"valid_targets_mean": 1984.1,
"valid_targets_min": 794
},
{
"epoch": 5.730337078651686,
"grad_norm": 0.8798559697698835,
"learning_rate": 3.887693029057675e-06,
"loss": 0.1396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1552184522151947,
"step": 3570,
"valid_targets_mean": 1911.6,
"valid_targets_min": 777
},
{
"epoch": 5.738362760834671,
"grad_norm": 0.8518956486042853,
"learning_rate": 3.8403910106500104e-06,
"loss": 0.144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14175641536712646,
"step": 3575,
"valid_targets_mean": 1880.1,
"valid_targets_min": 744
},
{
"epoch": 5.746388443017657,
"grad_norm": 0.9148318859217006,
"learning_rate": 3.7933479399225604e-06,
"loss": 0.1481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1558597981929779,
"step": 3580,
"valid_targets_mean": 1775.1,
"valid_targets_min": 924
},
{
"epoch": 5.754414125200642,
"grad_norm": 0.8566250351217594,
"learning_rate": 3.746564570711266e-06,
"loss": 0.1481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13671304285526276,
"step": 3585,
"valid_targets_mean": 1997.3,
"valid_targets_min": 662
},
{
"epoch": 5.762439807383627,
"grad_norm": 0.8092341832129542,
"learning_rate": 3.7000416526905026e-06,
"loss": 0.1433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1414514183998108,
"step": 3590,
"valid_targets_mean": 1647.3,
"valid_targets_min": 727
},
{
"epoch": 5.770465489566613,
"grad_norm": 0.8530070873913949,
"learning_rate": 3.6537799313610946e-06,
"loss": 0.1427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13695083558559418,
"step": 3595,
"valid_targets_mean": 1496.6,
"valid_targets_min": 611
},
{
"epoch": 5.778491171749598,
"grad_norm": 0.8542613937155389,
"learning_rate": 3.607780148038347e-06,
"loss": 0.1569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14914162456989288,
"step": 3600,
"valid_targets_mean": 2354.6,
"valid_targets_min": 933
},
{
"epoch": 5.786516853932584,
"grad_norm": 0.837623744528209,
"learning_rate": 3.5620430398401596e-06,
"loss": 0.1437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13059459626674652,
"step": 3605,
"valid_targets_mean": 2035.4,
"valid_targets_min": 687
},
{
"epoch": 5.79454253611557,
"grad_norm": 0.8111804173729541,
"learning_rate": 3.5165693396752443e-06,
"loss": 0.1361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1243569403886795,
"step": 3610,
"valid_targets_mean": 2214.9,
"valid_targets_min": 1101
},
{
"epoch": 5.802568218298555,
"grad_norm": 0.8833303698013306,
"learning_rate": 3.471359776231347e-06,
"loss": 0.1459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16278022527694702,
"step": 3615,
"valid_targets_mean": 1972.5,
"valid_targets_min": 882
},
{
"epoch": 5.810593900481541,
"grad_norm": 0.8415725209000036,
"learning_rate": 3.426415073963594e-06,
"loss": 0.1447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1425856500864029,
"step": 3620,
"valid_targets_mean": 1869.6,
"valid_targets_min": 704
},
{
"epoch": 5.818619582664526,
"grad_norm": 0.9466397913974439,
"learning_rate": 3.3817359530828873e-06,
"loss": 0.1463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1392950862646103,
"step": 3625,
"valid_targets_mean": 1488.4,
"valid_targets_min": 670
},
{
"epoch": 5.826645264847512,
"grad_norm": 0.8152618375051688,
"learning_rate": 3.3373231295443277e-06,
"loss": 0.1451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1470872461795807,
"step": 3630,
"valid_targets_mean": 2061.8,
"valid_targets_min": 874
},
{
"epoch": 5.834670947030498,
"grad_norm": 0.8554361536678649,
"learning_rate": 3.2931773150357893e-06,
"loss": 0.1382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1473013013601303,
"step": 3635,
"valid_targets_mean": 1860.9,
"valid_targets_min": 770
},
{
"epoch": 5.842696629213483,
"grad_norm": 0.8497228090683818,
"learning_rate": 3.2492992169664837e-06,
"loss": 0.144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14080603420734406,
"step": 3640,
"valid_targets_mean": 1779.9,
"valid_targets_min": 1141
},
{
"epoch": 5.850722311396469,
"grad_norm": 0.8236171503439341,
"learning_rate": 3.2056895384556275e-06,
"loss": 0.1393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14260318875312805,
"step": 3645,
"valid_targets_mean": 1947.2,
"valid_targets_min": 1110
},
{
"epoch": 5.858747993579454,
"grad_norm": 0.8212400811046316,
"learning_rate": 3.1623489783211904e-06,
"loss": 0.1443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14351606369018555,
"step": 3650,
"valid_targets_mean": 1747.2,
"valid_targets_min": 945
},
{
"epoch": 5.86677367576244,
"grad_norm": 0.77766697126824,
"learning_rate": 3.1192782310686874e-06,
"loss": 0.1418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1273421049118042,
"step": 3655,
"valid_targets_mean": 2407.2,
"valid_targets_min": 1050
},
{
"epoch": 5.874799357945426,
"grad_norm": 0.8663557165534255,
"learning_rate": 3.0764779868800398e-06,
"loss": 0.1489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17279453575611115,
"step": 3660,
"valid_targets_mean": 2015.9,
"valid_targets_min": 533
},
{
"epoch": 5.882825040128411,
"grad_norm": 0.8558801380283106,
"learning_rate": 3.0339489316025394e-06,
"loss": 0.1388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14702408015727997,
"step": 3665,
"valid_targets_mean": 2130.3,
"valid_targets_min": 824
},
{
"epoch": 5.890850722311397,
"grad_norm": 0.7505646399517081,
"learning_rate": 2.991691746737828e-06,
"loss": 0.1499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13228633999824524,
"step": 3670,
"valid_targets_mean": 2391.9,
"valid_targets_min": 684
},
{
"epoch": 5.898876404494382,
"grad_norm": 0.8199757285730112,
"learning_rate": 2.949707109431006e-06,
"loss": 0.141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14933696389198303,
"step": 3675,
"valid_targets_mean": 1866.2,
"valid_targets_min": 545
},
{
"epoch": 5.906902086677368,
"grad_norm": 0.8965249228046941,
"learning_rate": 2.907995692459773e-06,
"loss": 0.136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15130048990249634,
"step": 3680,
"valid_targets_mean": 2021.9,
"valid_targets_min": 618
},
{
"epoch": 5.914927768860353,
"grad_norm": 0.8777238241939872,
"learning_rate": 2.8665581642236227e-06,
"loss": 0.1419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1442902833223343,
"step": 3685,
"valid_targets_mean": 1744.5,
"valid_targets_min": 677
},
{
"epoch": 5.922953451043338,
"grad_norm": 0.8252807172148935,
"learning_rate": 2.825395188733169e-06,
"loss": 0.1393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1298397034406662,
"step": 3690,
"valid_targets_mean": 1682.1,
"valid_targets_min": 818
},
{
"epoch": 5.930979133226324,
"grad_norm": 0.7888917751614268,
"learning_rate": 2.784507425599492e-06,
"loss": 0.1382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1363508403301239,
"step": 3695,
"valid_targets_mean": 1906.1,
"valid_targets_min": 741
},
{
"epoch": 5.93900481540931,
"grad_norm": 0.9105325822568995,
"learning_rate": 2.743895530023544e-06,
"loss": 0.1386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13701778650283813,
"step": 3700,
"valid_targets_mean": 1610.4,
"valid_targets_min": 729
},
{
"epoch": 5.947030497592295,
"grad_norm": 0.8647716265607804,
"learning_rate": 2.7035601527856914e-06,
"loss": 0.1338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12563112378120422,
"step": 3705,
"valid_targets_mean": 1931.8,
"valid_targets_min": 638
},
{
"epoch": 5.955056179775281,
"grad_norm": 0.9083802247250276,
"learning_rate": 2.6635019402352645e-06,
"loss": 0.1429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14448779821395874,
"step": 3710,
"valid_targets_mean": 1673.9,
"valid_targets_min": 849
},
{
"epoch": 5.963081861958266,
"grad_norm": 0.6538474603186538,
"learning_rate": 2.6237215342801857e-06,
"loss": 0.1411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1227862536907196,
"step": 3715,
"valid_targets_mean": 3093.8,
"valid_targets_min": 973
},
{
"epoch": 5.971107544141252,
"grad_norm": 0.8126909161583662,
"learning_rate": 2.5842195723767205e-06,
"loss": 0.1391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14033716917037964,
"step": 3720,
"valid_targets_mean": 2245.1,
"valid_targets_min": 892
},
{
"epoch": 5.979133226324238,
"grad_norm": 0.8847974712352168,
"learning_rate": 2.544996687519219e-06,
"loss": 0.1451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.147241473197937,
"step": 3725,
"valid_targets_mean": 1698.0,
"valid_targets_min": 1055
},
{
"epoch": 5.987158908507223,
"grad_norm": 0.823026519904926,
"learning_rate": 2.5060535082300266e-06,
"loss": 0.1451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15312634408473969,
"step": 3730,
"valid_targets_mean": 2188.0,
"valid_targets_min": 639
},
{
"epoch": 5.995184590690209,
"grad_norm": 0.8213365844788153,
"learning_rate": 2.467390658549349e-06,
"loss": 0.141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13517561554908752,
"step": 3735,
"valid_targets_mean": 2128.8,
"valid_targets_min": 797
},
{
"epoch": 6.003210272873194,
"grad_norm": 0.8196675867105674,
"learning_rate": 2.429008758025302e-06,
"loss": 0.1359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13686616718769073,
"step": 3740,
"valid_targets_mean": 1792.6,
"valid_targets_min": 788
},
{
"epoch": 6.01123595505618,
"grad_norm": 0.7101099418791215,
"learning_rate": 2.3909084217039634e-06,
"loss": 0.1278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12406958639621735,
"step": 3745,
"valid_targets_mean": 2482.2,
"valid_targets_min": 1025
},
{
"epoch": 6.019261637239166,
"grad_norm": 0.8233493110334807,
"learning_rate": 2.353090260119515e-06,
"loss": 0.1353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13340730965137482,
"step": 3750,
"valid_targets_mean": 1969.3,
"valid_targets_min": 820
},
{
"epoch": 6.027287319422151,
"grad_norm": 0.9151878902447068,
"learning_rate": 2.3155548792844674e-06,
"loss": 0.1265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11424959450960159,
"step": 3755,
"valid_targets_mean": 1564.1,
"valid_targets_min": 725
},
{
"epoch": 6.035313001605137,
"grad_norm": 0.8326440606539028,
"learning_rate": 2.27830288067995e-06,
"loss": 0.1323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13482320308685303,
"step": 3760,
"valid_targets_mean": 1919.4,
"valid_targets_min": 1078
},
{
"epoch": 6.043338683788122,
"grad_norm": 0.8742588018506022,
"learning_rate": 2.241334861246058e-06,
"loss": 0.1261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1303100883960724,
"step": 3765,
"valid_targets_mean": 1689.5,
"valid_targets_min": 697
},
{
"epoch": 6.051364365971107,
"grad_norm": 0.8283773699034884,
"learning_rate": 2.2046514133723075e-06,
"loss": 0.126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11725350469350815,
"step": 3770,
"valid_targets_mean": 1564.1,
"valid_targets_min": 592
},
{
"epoch": 6.059390048154093,
"grad_norm": 0.9066721433616125,
"learning_rate": 2.1682531248881266e-06,
"loss": 0.1336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13146190345287323,
"step": 3775,
"valid_targets_mean": 1457.2,
"valid_targets_min": 597
},
{
"epoch": 6.067415730337078,
"grad_norm": 0.7917186831995832,
"learning_rate": 2.1321405790534412e-06,
"loss": 0.1238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14324235916137695,
"step": 3780,
"valid_targets_mean": 2544.8,
"valid_targets_min": 792
},
{
"epoch": 6.075441412520064,
"grad_norm": 0.7995015410713523,
"learning_rate": 2.096314354549334e-06,
"loss": 0.1352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12818962335586548,
"step": 3785,
"valid_targets_mean": 1735.4,
"valid_targets_min": 682
},
{
"epoch": 6.08346709470305,
"grad_norm": 0.8043412796343894,
"learning_rate": 2.0607750254687554e-06,
"loss": 0.1289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12518352270126343,
"step": 3790,
"valid_targets_mean": 2304.7,
"valid_targets_min": 625
},
{
"epoch": 6.091492776886035,
"grad_norm": 0.8688221477476388,
"learning_rate": 2.025523161307348e-06,
"loss": 0.1364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1296396106481552,
"step": 3795,
"valid_targets_mean": 1634.8,
"valid_targets_min": 667
},
{
"epoch": 6.099518459069021,
"grad_norm": 0.9117796677606809,
"learning_rate": 1.990559326954307e-06,
"loss": 0.1355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13730370998382568,
"step": 3800,
"valid_targets_mean": 1711.1,
"valid_targets_min": 700
},
{
"epoch": 6.107544141252006,
"grad_norm": 0.721550972186035,
"learning_rate": 1.955884082683317e-06,
"loss": 0.13,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1108551174402237,
"step": 3805,
"valid_targets_mean": 2403.3,
"valid_targets_min": 892
},
{
"epoch": 6.115569823434992,
"grad_norm": 0.8248557024007874,
"learning_rate": 1.9214979841435967e-06,
"loss": 0.1322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13973233103752136,
"step": 3810,
"valid_targets_mean": 2137.4,
"valid_targets_min": 669
},
{
"epoch": 6.123595505617978,
"grad_norm": 0.8121793695204608,
"learning_rate": 1.8874015823509873e-06,
"loss": 0.1245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12547042965888977,
"step": 3815,
"valid_targets_mean": 2604.6,
"valid_targets_min": 797
},
{
"epoch": 6.131621187800963,
"grad_norm": 0.7351257868663279,
"learning_rate": 1.8535954236791044e-06,
"loss": 0.1326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12898236513137817,
"step": 3820,
"valid_targets_mean": 2703.9,
"valid_targets_min": 765
},
{
"epoch": 6.139646869983949,
"grad_norm": 0.8858783243545603,
"learning_rate": 1.8200800498506166e-06,
"loss": 0.1352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15943001210689545,
"step": 3825,
"valid_targets_mean": 1791.6,
"valid_targets_min": 891
},
{
"epoch": 6.147672552166934,
"grad_norm": 0.8144635580836179,
"learning_rate": 1.7868559979285293e-06,
"loss": 0.1263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12163649499416351,
"step": 3830,
"valid_targets_mean": 1813.3,
"valid_targets_min": 796
},
{
"epoch": 6.15569823434992,
"grad_norm": 0.8011893230062246,
"learning_rate": 1.7539238003076087e-06,
"loss": 0.1291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13179343938827515,
"step": 3835,
"valid_targets_mean": 2422.9,
"valid_targets_min": 1109
},
{
"epoch": 6.163723916532906,
"grad_norm": 0.9556250644794508,
"learning_rate": 1.721283984705835e-06,
"loss": 0.1318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14184167981147766,
"step": 3840,
"valid_targets_mean": 1440.4,
"valid_targets_min": 728
},
{
"epoch": 6.171749598715891,
"grad_norm": 0.7764479036008669,
"learning_rate": 1.6889370741559407e-06,
"loss": 0.1274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1197129637002945,
"step": 3845,
"valid_targets_mean": 2076.1,
"valid_targets_min": 672
},
{
"epoch": 6.179775280898877,
"grad_norm": 0.7481548950692756,
"learning_rate": 1.6568835869970445e-06,
"loss": 0.1306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13337062299251556,
"step": 3850,
"valid_targets_mean": 2484.6,
"valid_targets_min": 789
},
{
"epoch": 6.187800963081862,
"grad_norm": 0.821740266972904,
"learning_rate": 1.625124036866339e-06,
"loss": 0.1337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14121049642562866,
"step": 3855,
"valid_targets_mean": 2158.6,
"valid_targets_min": 830
},
{
"epoch": 6.195826645264847,
"grad_norm": 0.8251617106369992,
"learning_rate": 1.5936589326908513e-06,
"loss": 0.141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1286158710718155,
"step": 3860,
"valid_targets_mean": 1933.1,
"valid_targets_min": 798
},
{
"epoch": 6.203852327447833,
"grad_norm": 0.9413267314341657,
"learning_rate": 1.5624887786793008e-06,
"loss": 0.1339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13531285524368286,
"step": 3865,
"valid_targets_mean": 1385.5,
"valid_targets_min": 655
},
{
"epoch": 6.211878009630818,
"grad_norm": 0.8800324368070407,
"learning_rate": 1.531614074314014e-06,
"loss": 0.1365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13416577875614166,
"step": 3870,
"valid_targets_mean": 2019.1,
"valid_targets_min": 729
},
{
"epoch": 6.219903691813804,
"grad_norm": 0.9054587413802373,
"learning_rate": 1.501035314342918e-06,
"loss": 0.1327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13169649243354797,
"step": 3875,
"valid_targets_mean": 1469.8,
"valid_targets_min": 715
},
{
"epoch": 6.22792937399679,
"grad_norm": 0.8324924083699635,
"learning_rate": 1.4707529887716177e-06,
"loss": 0.1258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1314225196838379,
"step": 3880,
"valid_targets_mean": 1870.7,
"valid_targets_min": 691
},
{
"epoch": 6.235955056179775,
"grad_norm": 0.757807099087046,
"learning_rate": 1.4407675828555378e-06,
"loss": 0.1295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13538961112499237,
"step": 3885,
"valid_targets_mean": 2662.4,
"valid_targets_min": 549
},
{
"epoch": 6.243980738362761,
"grad_norm": 0.9112108378646868,
"learning_rate": 1.4110795770921536e-06,
"loss": 0.1317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14746998250484467,
"step": 3890,
"valid_targets_mean": 1878.4,
"valid_targets_min": 629
},
{
"epoch": 6.252006420545746,
"grad_norm": 0.8130635027374573,
"learning_rate": 1.3816894472132903e-06,
"loss": 0.1308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1274118721485138,
"step": 3895,
"valid_targets_mean": 2159.9,
"valid_targets_min": 868
},
{
"epoch": 6.260032102728732,
"grad_norm": 0.8766350494372456,
"learning_rate": 1.3525976641774862e-06,
"loss": 0.1268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12585480511188507,
"step": 3900,
"valid_targets_mean": 1828.7,
"valid_targets_min": 684
},
{
"epoch": 6.268057784911718,
"grad_norm": 0.8414903174334402,
"learning_rate": 1.3238046941624694e-06,
"loss": 0.1343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1348039209842682,
"step": 3905,
"valid_targets_mean": 2230.7,
"valid_targets_min": 762
},
{
"epoch": 6.276083467094703,
"grad_norm": 0.8692836229326116,
"learning_rate": 1.295310998557673e-06,
"loss": 0.1334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13138556480407715,
"step": 3910,
"valid_targets_mean": 1685.2,
"valid_targets_min": 693
},
{
"epoch": 6.284109149277689,
"grad_norm": 0.9927992924551751,
"learning_rate": 1.2671170339568372e-06,
"loss": 0.1303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12924659252166748,
"step": 3915,
"valid_targets_mean": 1712.9,
"valid_targets_min": 768
},
{
"epoch": 6.292134831460674,
"grad_norm": 0.8708385582623096,
"learning_rate": 1.239223252150703e-06,
"loss": 0.1375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1407126933336258,
"step": 3920,
"valid_targets_mean": 1895.5,
"valid_targets_min": 825
},
{
"epoch": 6.30016051364366,
"grad_norm": 0.9462826534291934,
"learning_rate": 1.211630100119776e-06,
"loss": 0.1364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15399542450904846,
"step": 3925,
"valid_targets_mean": 1808.5,
"valid_targets_min": 701
},
{
"epoch": 6.308186195826646,
"grad_norm": 0.8338027195464212,
"learning_rate": 1.1843380200271426e-06,
"loss": 0.1328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11450174450874329,
"step": 3930,
"valid_targets_mean": 1831.6,
"valid_targets_min": 557
},
{
"epoch": 6.31621187800963,
"grad_norm": 0.7844532891368925,
"learning_rate": 1.1573474492114122e-06,
"loss": 0.1269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11957096308469772,
"step": 3935,
"valid_targets_mean": 2298.2,
"valid_targets_min": 760
},
{
"epoch": 6.324237560192616,
"grad_norm": 0.7148468016806782,
"learning_rate": 1.1306588201796863e-06,
"loss": 0.1237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10497011244297028,
"step": 3940,
"valid_targets_mean": 2023.3,
"valid_targets_min": 567
},
{
"epoch": 6.332263242375602,
"grad_norm": 0.8075062564380106,
"learning_rate": 1.1042725606006388e-06,
"loss": 0.144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15959270298480988,
"step": 3945,
"valid_targets_mean": 2724.1,
"valid_targets_min": 1269
},
{
"epoch": 6.340288924558587,
"grad_norm": 0.8319131176662817,
"learning_rate": 1.078189093297668e-06,
"loss": 0.1339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13696303963661194,
"step": 3950,
"valid_targets_mean": 2162.0,
"valid_targets_min": 735
},
{
"epoch": 6.348314606741573,
"grad_norm": 0.777206520799545,
"learning_rate": 1.0524088362421048e-06,
"loss": 0.1237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12403260171413422,
"step": 3955,
"valid_targets_mean": 2233.1,
"valid_targets_min": 613
},
{
"epoch": 6.356340288924558,
"grad_norm": 0.7451807347978312,
"learning_rate": 1.0269322025465334e-06,
"loss": 0.1308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13250204920768738,
"step": 3960,
"valid_targets_mean": 2690.4,
"valid_targets_min": 626
},
{
"epoch": 6.364365971107544,
"grad_norm": 0.8253339601537156,
"learning_rate": 1.0017596004581564e-06,
"loss": 0.1295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1278865784406662,
"step": 3965,
"valid_targets_mean": 1848.6,
"valid_targets_min": 800
},
{
"epoch": 6.37239165329053,
"grad_norm": 0.8584721668386178,
"learning_rate": 9.768914333522584e-07,
"loss": 0.1289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13879048824310303,
"step": 3970,
"valid_targets_mean": 1834.6,
"valid_targets_min": 926
},
{
"epoch": 6.380417335473515,
"grad_norm": 0.8283576544061164,
"learning_rate": 9.5232809972575e-07,
"loss": 0.1309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13557694852352142,
"step": 3975,
"valid_targets_mean": 1815.6,
"valid_targets_min": 998
},
{
"epoch": 6.388443017656501,
"grad_norm": 0.8748562146778729,
"learning_rate": 9.280699931907633e-07,
"loss": 0.1415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15249726176261902,
"step": 3980,
"valid_targets_mean": 2136.6,
"valid_targets_min": 657
},
{
"epoch": 6.396468699839486,
"grad_norm": 0.777927436115682,
"learning_rate": 9.04117502468369e-07,
"loss": 0.1327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14238354563713074,
"step": 3985,
"valid_targets_mean": 2248.8,
"valid_targets_min": 689
},
{
"epoch": 6.404494382022472,
"grad_norm": 0.8043827719833165,
"learning_rate": 8.804710113823311e-07,
"loss": 0.126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12348157912492752,
"step": 3990,
"valid_targets_mean": 1787.2,
"valid_targets_min": 734
},
{
"epoch": 6.412520064205458,
"grad_norm": 0.9862275060605692,
"learning_rate": 8.571308988529492e-07,
"loss": 0.1288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13508912920951843,
"step": 3995,
"valid_targets_mean": 1392.4,
"valid_targets_min": 696
},
{
"epoch": 6.420545746388443,
"grad_norm": 0.8431627989023698,
"learning_rate": 8.3409753889101e-07,
"loss": 0.1318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13289272785186768,
"step": 4000,
"valid_targets_mean": 1806.3,
"valid_targets_min": 709
},
{
"epoch": 6.428571428571429,
"grad_norm": 0.8239565380374946,
"learning_rate": 8.11371300591779e-07,
"loss": 0.1286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13981223106384277,
"step": 4005,
"valid_targets_mean": 2153.0,
"valid_targets_min": 1102
},
{
"epoch": 6.436597110754414,
"grad_norm": 0.9432509501592777,
"learning_rate": 7.889525481290805e-07,
"loss": 0.1366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1455557495355606,
"step": 4010,
"valid_targets_mean": 1852.8,
"valid_targets_min": 819
},
{
"epoch": 6.4446227929374,
"grad_norm": 0.9014367927531765,
"learning_rate": 7.668416407494761e-07,
"loss": 0.1351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13227035105228424,
"step": 4015,
"valid_targets_mean": 1789.1,
"valid_targets_min": 793
},
{
"epoch": 6.452648475120386,
"grad_norm": 0.8171835228507035,
"learning_rate": 7.450389327665042e-07,
"loss": 0.1291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13154827058315277,
"step": 4020,
"valid_targets_mean": 2095.6,
"valid_targets_min": 752
},
{
"epoch": 6.460674157303371,
"grad_norm": 0.7683854828646659,
"learning_rate": 7.235447735549895e-07,
"loss": 0.132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13109341263771057,
"step": 4025,
"valid_targets_mean": 2461.7,
"valid_targets_min": 788
},
{
"epoch": 6.468699839486356,
"grad_norm": 0.9022184794419694,
"learning_rate": 7.02359507545467e-07,
"loss": 0.1365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13602422177791595,
"step": 4030,
"valid_targets_mean": 1908.5,
"valid_targets_min": 809
},
{
"epoch": 6.476725521669342,
"grad_norm": 0.8680280298928634,
"learning_rate": 6.814834742186361e-07,
"loss": 0.1288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13595837354660034,
"step": 4035,
"valid_targets_mean": 1791.1,
"valid_targets_min": 708
},
{
"epoch": 6.484751203852327,
"grad_norm": 0.8624861818881404,
"learning_rate": 6.60917008099946e-07,
"loss": 0.1384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13239216804504395,
"step": 4040,
"valid_targets_mean": 1472.7,
"valid_targets_min": 909
},
{
"epoch": 6.492776886035313,
"grad_norm": 0.8372254606922392,
"learning_rate": 6.406604387542259e-07,
"loss": 0.1348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12756837904453278,
"step": 4045,
"valid_targets_mean": 1802.8,
"valid_targets_min": 638
},
{
"epoch": 6.500802568218298,
"grad_norm": 0.8845183639085258,
"learning_rate": 6.207140907803877e-07,
"loss": 0.1341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11851681768894196,
"step": 4050,
"valid_targets_mean": 1879.1,
"valid_targets_min": 687
},
{
"epoch": 6.508828250401284,
"grad_norm": 0.9939476432578076,
"learning_rate": 6.010782838062534e-07,
"loss": 0.1363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16492959856987,
"step": 4055,
"valid_targets_mean": 1637.2,
"valid_targets_min": 680
},
{
"epoch": 6.51685393258427,
"grad_norm": 0.7876122251990382,
"learning_rate": 5.817533324834146e-07,
"loss": 0.1364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1363506019115448,
"step": 4060,
"valid_targets_mean": 1869.1,
"valid_targets_min": 648
},
{
"epoch": 6.524879614767255,
"grad_norm": 0.8344114489032715,
"learning_rate": 5.627395464821894e-07,
"loss": 0.1343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.140853613615036,
"step": 4065,
"valid_targets_mean": 2610.0,
"valid_targets_min": 1355
},
{
"epoch": 6.532905296950241,
"grad_norm": 0.6902659152306734,
"learning_rate": 5.440372304866692e-07,
"loss": 0.1336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13164812326431274,
"step": 4070,
"valid_targets_mean": 3041.7,
"valid_targets_min": 883
},
{
"epoch": 6.540930979133226,
"grad_norm": 0.7503481708658517,
"learning_rate": 5.256466841898334e-07,
"loss": 0.1332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13292858004570007,
"step": 4075,
"valid_targets_mean": 2455.9,
"valid_targets_min": 1030
},
{
"epoch": 6.548956661316212,
"grad_norm": 0.7994462646941594,
"learning_rate": 5.075682022887441e-07,
"loss": 0.1444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1420678347349167,
"step": 4080,
"valid_targets_mean": 2302.2,
"valid_targets_min": 823
},
{
"epoch": 6.556982343499198,
"grad_norm": 0.8804572670066306,
"learning_rate": 4.898020744798282e-07,
"loss": 0.1324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14195245504379272,
"step": 4085,
"valid_targets_mean": 2165.8,
"valid_targets_min": 1104
},
{
"epoch": 6.565008025682183,
"grad_norm": 0.7713249621956143,
"learning_rate": 4.7234858545422536e-07,
"loss": 0.1336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12661638855934143,
"step": 4090,
"valid_targets_mean": 2549.3,
"valid_targets_min": 1000
},
{
"epoch": 6.573033707865169,
"grad_norm": 0.8013666556551141,
"learning_rate": 4.552080148932425e-07,
"loss": 0.1351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1386134922504425,
"step": 4095,
"valid_targets_mean": 2510.6,
"valid_targets_min": 882
},
{
"epoch": 6.581059390048154,
"grad_norm": 0.9379662069494056,
"learning_rate": 4.383806374638555e-07,
"loss": 0.1278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1294247806072235,
"step": 4100,
"valid_targets_mean": 1812.6,
"valid_targets_min": 715
},
{
"epoch": 6.589085072231139,
"grad_norm": 0.8157148561089532,
"learning_rate": 4.2186672281432363e-07,
"loss": 0.1343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12697714567184448,
"step": 4105,
"valid_targets_mean": 2067.0,
"valid_targets_min": 686
},
{
"epoch": 6.597110754414125,
"grad_norm": 0.8532772772866162,
"learning_rate": 4.056665355698508e-07,
"loss": 0.1403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15566185116767883,
"step": 4110,
"valid_targets_mean": 1932.4,
"valid_targets_min": 765
},
{
"epoch": 6.60513643659711,
"grad_norm": 0.7347366895405252,
"learning_rate": 3.89780335328358e-07,
"loss": 0.1256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1240445151925087,
"step": 4115,
"valid_targets_mean": 2558.4,
"valid_targets_min": 698
},
{
"epoch": 6.613162118780096,
"grad_norm": 0.7844171389786991,
"learning_rate": 3.7420837665632205e-07,
"loss": 0.1321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1311158537864685,
"step": 4120,
"valid_targets_mean": 2435.1,
"valid_targets_min": 993
},
{
"epoch": 6.621187800963082,
"grad_norm": 1.016494260012105,
"learning_rate": 3.5895090908469433e-07,
"loss": 0.1365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13737598061561584,
"step": 4125,
"valid_targets_mean": 2182.8,
"valid_targets_min": 1001
},
{
"epoch": 6.629213483146067,
"grad_norm": 0.7662698129244558,
"learning_rate": 3.4400817710489754e-07,
"loss": 0.1314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13481801748275757,
"step": 4130,
"valid_targets_mean": 2539.6,
"valid_targets_min": 650
},
{
"epoch": 6.637239165329053,
"grad_norm": 0.8804946515187855,
"learning_rate": 3.293804201649131e-07,
"loss": 0.1363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14753307402133942,
"step": 4135,
"valid_targets_mean": 1763.6,
"valid_targets_min": 779
},
{
"epoch": 6.645264847512038,
"grad_norm": 0.8509011624485113,
"learning_rate": 3.1506787266545104e-07,
"loss": 0.1369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13469921052455902,
"step": 4140,
"valid_targets_mean": 1757.4,
"valid_targets_min": 809
},
{
"epoch": 6.653290529695024,
"grad_norm": 0.7972105200462379,
"learning_rate": 3.010707639561727e-07,
"loss": 0.1276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11612634360790253,
"step": 4145,
"valid_targets_mean": 2148.2,
"valid_targets_min": 612
},
{
"epoch": 6.66131621187801,
"grad_norm": 0.8607825669685812,
"learning_rate": 2.873893183320431e-07,
"loss": 0.1368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1409863531589508,
"step": 4150,
"valid_targets_mean": 1988.0,
"valid_targets_min": 621
},
{
"epoch": 6.669341894060995,
"grad_norm": 0.8114169187350514,
"learning_rate": 2.740237550297131e-07,
"loss": 0.1414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1218997910618782,
"step": 4155,
"valid_targets_mean": 2225.8,
"valid_targets_min": 522
},
{
"epoch": 6.677367576243981,
"grad_norm": 0.8553063985701393,
"learning_rate": 2.609742882240207e-07,
"loss": 0.1457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1512482464313507,
"step": 4160,
"valid_targets_mean": 2193.6,
"valid_targets_min": 705
},
{
"epoch": 6.685393258426966,
"grad_norm": 0.7842315608676794,
"learning_rate": 2.482411270245533e-07,
"loss": 0.1316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12290303409099579,
"step": 4165,
"valid_targets_mean": 2215.3,
"valid_targets_min": 820
},
{
"epoch": 6.693418940609952,
"grad_norm": 0.8288014529828364,
"learning_rate": 2.358244754722927e-07,
"loss": 0.1354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13061775267124176,
"step": 4170,
"valid_targets_mean": 1987.8,
"valid_targets_min": 695
},
{
"epoch": 6.701444622792938,
"grad_norm": 0.7471758228205548,
"learning_rate": 2.2372453253635796e-07,
"loss": 0.1373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12854477763175964,
"step": 4175,
"valid_targets_mean": 2526.5,
"valid_targets_min": 782
},
{
"epoch": 6.709470304975923,
"grad_norm": 0.9506746700643623,
"learning_rate": 2.1194149211080982e-07,
"loss": 0.1355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15296323597431183,
"step": 4180,
"valid_targets_mean": 1742.1,
"valid_targets_min": 765
},
{
"epoch": 6.717495987158909,
"grad_norm": 0.8755571800580249,
"learning_rate": 2.004755430115335e-07,
"loss": 0.1353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14241819083690643,
"step": 4185,
"valid_targets_mean": 1680.2,
"valid_targets_min": 656
},
{
"epoch": 6.725521669341894,
"grad_norm": 0.8620961091565507,
"learning_rate": 1.8932686897323417e-07,
"loss": 0.1301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12413826584815979,
"step": 4190,
"valid_targets_mean": 1665.9,
"valid_targets_min": 802
},
{
"epoch": 6.73354735152488,
"grad_norm": 0.8368572454303962,
"learning_rate": 1.7849564864647506e-07,
"loss": 0.1425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1286819726228714,
"step": 4195,
"valid_targets_mean": 2069.0,
"valid_targets_min": 1155
},
{
"epoch": 6.741573033707866,
"grad_norm": 0.8146985305426502,
"learning_rate": 1.679820555948264e-07,
"loss": 0.1376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11927329003810883,
"step": 4200,
"valid_targets_mean": 1932.9,
"valid_targets_min": 661
},
{
"epoch": 6.74959871589085,
"grad_norm": 0.8866600690370785,
"learning_rate": 1.5778625829207196e-07,
"loss": 0.1342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13215553760528564,
"step": 4205,
"valid_targets_mean": 1920.4,
"valid_targets_min": 635
},
{
"epoch": 6.757624398073836,
"grad_norm": 0.701924183183066,
"learning_rate": 1.4790842011952023e-07,
"loss": 0.1314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11789841204881668,
"step": 4210,
"valid_targets_mean": 2835.7,
"valid_targets_min": 823
},
{
"epoch": 6.765650080256822,
"grad_norm": 0.9501322619954992,
"learning_rate": 1.3834869936338424e-07,
"loss": 0.1312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1307641565799713,
"step": 4215,
"valid_targets_mean": 2221.1,
"valid_targets_min": 746
},
{
"epoch": 6.773675762439807,
"grad_norm": 0.8812623724815387,
"learning_rate": 1.2910724921224139e-07,
"loss": 0.1349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1285921037197113,
"step": 4220,
"valid_targets_mean": 1583.2,
"valid_targets_min": 788
},
{
"epoch": 6.781701444622793,
"grad_norm": 0.8385562110933432,
"learning_rate": 1.2018421775457978e-07,
"loss": 0.1297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14212295413017273,
"step": 4225,
"valid_targets_mean": 1936.7,
"valid_targets_min": 661
},
{
"epoch": 6.789727126805778,
"grad_norm": 0.7834916138029038,
"learning_rate": 1.115797479764269e-07,
"loss": 0.1295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12338066846132278,
"step": 4230,
"valid_targets_mean": 2082.6,
"valid_targets_min": 867
},
{
"epoch": 6.797752808988764,
"grad_norm": 0.8288684199479489,
"learning_rate": 1.0329397775905802e-07,
"loss": 0.1385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14609648287296295,
"step": 4235,
"valid_targets_mean": 2241.5,
"valid_targets_min": 611
},
{
"epoch": 6.80577849117175,
"grad_norm": 0.8404101812550286,
"learning_rate": 9.532703987678692e-08,
"loss": 0.1322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15395131707191467,
"step": 4240,
"valid_targets_mean": 2035.6,
"valid_targets_min": 1106
},
{
"epoch": 6.813804173354735,
"grad_norm": 0.8562736483627456,
"learning_rate": 8.767906199483422e-08,
"loss": 0.132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1289074420928955,
"step": 4245,
"valid_targets_mean": 1866.0,
"valid_targets_min": 734
},
{
"epoch": 6.821829855537721,
"grad_norm": 0.8444371886099169,
"learning_rate": 8.0350166667289e-08,
"loss": 0.1295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12709850072860718,
"step": 4250,
"valid_targets_mean": 1635.1,
"valid_targets_min": 789
},
{
"epoch": 6.829855537720706,
"grad_norm": 0.7699603449450781,
"learning_rate": 7.33404713351371e-08,
"loss": 0.1318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12732994556427002,
"step": 4255,
"valid_targets_mean": 2395.6,
"valid_targets_min": 1057
},
{
"epoch": 6.837881219903692,
"grad_norm": 0.8872853267014166,
"learning_rate": 6.665008832438923e-08,
"loss": 0.1317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13180556893348694,
"step": 4260,
"valid_targets_mean": 2180.7,
"valid_targets_min": 551
},
{
"epoch": 6.845906902086678,
"grad_norm": 0.7725443532887755,
"learning_rate": 6.027912484426468e-08,
"loss": 0.1385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11179924011230469,
"step": 4265,
"valid_targets_mean": 1924.9,
"valid_targets_min": 746
},
{
"epoch": 6.853932584269663,
"grad_norm": 0.8216166028267735,
"learning_rate": 5.4227682985494854e-08,
"loss": 0.1257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11613370478153229,
"step": 4270,
"valid_targets_mean": 2039.6,
"valid_targets_min": 605
},
{
"epoch": 6.861958266452649,
"grad_norm": 0.716010306215438,
"learning_rate": 4.849585971866688e-08,
"loss": 0.141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13099314272403717,
"step": 4275,
"valid_targets_mean": 2827.7,
"valid_targets_min": 1177
},
{
"epoch": 6.8699839486356336,
"grad_norm": 1.008634190990714,
"learning_rate": 4.3083746892684796e-08,
"loss": 0.1366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13648265600204468,
"step": 4280,
"valid_targets_mean": 2092.2,
"valid_targets_min": 750
},
{
"epoch": 6.878009630818619,
"grad_norm": 0.8050911139139982,
"learning_rate": 3.7991431233288525e-08,
"loss": 0.1281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12041358649730682,
"step": 4285,
"valid_targets_mean": 2016.8,
"valid_targets_min": 694
},
{
"epoch": 6.886035313001605,
"grad_norm": 0.7538681689851715,
"learning_rate": 3.321899434166831e-08,
"loss": 0.1315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12728962302207947,
"step": 4290,
"valid_targets_mean": 2348.8,
"valid_targets_min": 739
},
{
"epoch": 6.89406099518459,
"grad_norm": 0.9078340983454675,
"learning_rate": 2.876651269315689e-08,
"loss": 0.13,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13924184441566467,
"step": 4295,
"valid_targets_mean": 1564.9,
"valid_targets_min": 973
},
{
"epoch": 6.902086677367576,
"grad_norm": 0.8322797461761388,
"learning_rate": 2.4634057636001573e-08,
"loss": 0.1326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13911721110343933,
"step": 4300,
"valid_targets_mean": 1888.2,
"valid_targets_min": 841
},
{
"epoch": 6.910112359550562,
"grad_norm": 0.8873358332613721,
"learning_rate": 2.082169539022294e-08,
"loss": 0.1383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1478015035390854,
"step": 4305,
"valid_targets_mean": 1802.1,
"valid_targets_min": 692
},
{
"epoch": 6.918138041733547,
"grad_norm": 0.8910795462193187,
"learning_rate": 1.7329487046555683e-08,
"loss": 0.1275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13803160190582275,
"step": 4310,
"valid_targets_mean": 1852.9,
"valid_targets_min": 888
},
{
"epoch": 6.926163723916533,
"grad_norm": 0.7929871067815147,
"learning_rate": 1.4157488565464949e-08,
"loss": 0.136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12524215877056122,
"step": 4315,
"valid_targets_mean": 2124.4,
"valid_targets_min": 652
},
{
"epoch": 6.934189406099518,
"grad_norm": 0.8321158322797556,
"learning_rate": 1.1305750776253733e-08,
"loss": 0.1295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12520332634449005,
"step": 4320,
"valid_targets_mean": 2153.6,
"valid_targets_min": 692
},
{
"epoch": 6.942215088282504,
"grad_norm": 0.8721383068519388,
"learning_rate": 8.774319376245733e-09,
"loss": 0.1336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13430440425872803,
"step": 4325,
"valid_targets_mean": 1598.9,
"valid_targets_min": 737
},
{
"epoch": 6.95024077046549,
"grad_norm": 0.7481357903290494,
"learning_rate": 6.56323493005262e-09,
"loss": 0.1284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11327686160802841,
"step": 4330,
"valid_targets_mean": 2174.6,
"valid_targets_min": 909
},
{
"epoch": 6.958266452648475,
"grad_norm": 0.8510993038307517,
"learning_rate": 4.672532868927882e-09,
"loss": 0.1268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1371006816625595,
"step": 4335,
"valid_targets_mean": 1838.2,
"valid_targets_min": 769
},
{
"epoch": 6.966292134831461,
"grad_norm": 0.8256184023206394,
"learning_rate": 3.102243490196166e-09,
"loss": 0.1355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12108443677425385,
"step": 4340,
"valid_targets_mean": 1822.3,
"valid_targets_min": 711
},
{
"epoch": 6.974317817014446,
"grad_norm": 0.6715633485519991,
"learning_rate": 1.8523919567692283e-09,
"loss": 0.1289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11774402111768723,
"step": 4345,
"valid_targets_mean": 2833.9,
"valid_targets_min": 978
},
{
"epoch": 6.982343499197432,
"grad_norm": 0.7122923788742873,
"learning_rate": 9.229982967373652e-10,
"loss": 0.127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13086260855197906,
"step": 4350,
"valid_targets_mean": 3114.6,
"valid_targets_min": 1397
},
{
"epoch": 6.990369181380418,
"grad_norm": 0.7497754087372094,
"learning_rate": 3.1407740305633425e-10,
"loss": 0.1304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12377274036407471,
"step": 4355,
"valid_targets_mean": 2433.6,
"valid_targets_min": 855
},
{
"epoch": 6.998394863563403,
"grad_norm": 0.9056604423294736,
"learning_rate": 2.563903330532469e-11,
"loss": 0.1313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12367966026067734,
"step": 4360,
"valid_targets_mean": 2186.9,
"valid_targets_min": 714
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12605062127113342,
"step": 4361,
"total_flos": 649913807929344.0,
"train_loss": 0.21077685282949843,
"train_runtime": 19161.6847,
"train_samples_per_second": 3.639,
"train_steps_per_second": 0.228,
"valid_targets_mean": 2205.3,
"valid_targets_min": 939
}
],
"logging_steps": 5,
"max_steps": 4361,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 200,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 649913807929344.0,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}