a1-taskmaster2 / trainer_state.json
EtashGuha's picture
Upload folder using huggingface_hub
2d7a441 verified
{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 3913,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.008944543828264758,
"grad_norm": 21.606822638718377,
"learning_rate": 4.0816326530612243e-07,
"loss": 0.9157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.9071354866027832,
"step": 5,
"valid_targets_mean": 4165.1,
"valid_targets_min": 1481
},
{
"epoch": 0.017889087656529516,
"grad_norm": 19.04995792657104,
"learning_rate": 9.183673469387756e-07,
"loss": 0.9249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.8876984119415283,
"step": 10,
"valid_targets_mean": 3925.7,
"valid_targets_min": 1499
},
{
"epoch": 0.026833631484794274,
"grad_norm": 19.84564044371412,
"learning_rate": 1.4285714285714286e-06,
"loss": 0.8728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.8913623690605164,
"step": 15,
"valid_targets_mean": 4151.1,
"valid_targets_min": 2060
},
{
"epoch": 0.03577817531305903,
"grad_norm": 12.750163023484031,
"learning_rate": 1.938775510204082e-06,
"loss": 0.8513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.8227970600128174,
"step": 20,
"valid_targets_mean": 3907.8,
"valid_targets_min": 1805
},
{
"epoch": 0.044722719141323794,
"grad_norm": 7.2429705482367055,
"learning_rate": 2.4489795918367347e-06,
"loss": 0.7962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7579451203346252,
"step": 25,
"valid_targets_mean": 4374.8,
"valid_targets_min": 538
},
{
"epoch": 0.05366726296958855,
"grad_norm": 4.437835296542112,
"learning_rate": 2.959183673469388e-06,
"loss": 0.7424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7099573612213135,
"step": 30,
"valid_targets_mean": 3956.7,
"valid_targets_min": 954
},
{
"epoch": 0.0626118067978533,
"grad_norm": 2.7488646562577306,
"learning_rate": 3.469387755102041e-06,
"loss": 0.6793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6850540041923523,
"step": 35,
"valid_targets_mean": 4000.8,
"valid_targets_min": 579
},
{
"epoch": 0.07155635062611806,
"grad_norm": 2.1085770347953767,
"learning_rate": 3.979591836734694e-06,
"loss": 0.6197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6641137003898621,
"step": 40,
"valid_targets_mean": 3597.0,
"valid_targets_min": 1574
},
{
"epoch": 0.08050089445438283,
"grad_norm": 1.6255237321311984,
"learning_rate": 4.489795918367348e-06,
"loss": 0.6116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6154483556747437,
"step": 45,
"valid_targets_mean": 3623.8,
"valid_targets_min": 850
},
{
"epoch": 0.08944543828264759,
"grad_norm": 1.2082356599373048,
"learning_rate": 5e-06,
"loss": 0.6101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5458171367645264,
"step": 50,
"valid_targets_mean": 3971.1,
"valid_targets_min": 627
},
{
"epoch": 0.09838998211091235,
"grad_norm": 1.0504686350094798,
"learning_rate": 5.510204081632653e-06,
"loss": 0.5949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.573982834815979,
"step": 55,
"valid_targets_mean": 4307.6,
"valid_targets_min": 1734
},
{
"epoch": 0.1073345259391771,
"grad_norm": 0.9226116061847508,
"learning_rate": 6.020408163265307e-06,
"loss": 0.5738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.559834361076355,
"step": 60,
"valid_targets_mean": 4199.9,
"valid_targets_min": 1122
},
{
"epoch": 0.11627906976744186,
"grad_norm": 0.8020567416774592,
"learning_rate": 6.530612244897959e-06,
"loss": 0.5668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5514993071556091,
"step": 65,
"valid_targets_mean": 4092.1,
"valid_targets_min": 1833
},
{
"epoch": 0.1252236135957066,
"grad_norm": 0.7566279895205129,
"learning_rate": 7.0408163265306125e-06,
"loss": 0.5578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5654456615447998,
"step": 70,
"valid_targets_mean": 4476.8,
"valid_targets_min": 1837
},
{
"epoch": 0.13416815742397137,
"grad_norm": 0.8277372126838092,
"learning_rate": 7.551020408163265e-06,
"loss": 0.5356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4986897110939026,
"step": 75,
"valid_targets_mean": 3277.0,
"valid_targets_min": 1319
},
{
"epoch": 0.14311270125223613,
"grad_norm": 0.7706280252042736,
"learning_rate": 8.06122448979592e-06,
"loss": 0.5068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5114747285842896,
"step": 80,
"valid_targets_mean": 3939.2,
"valid_targets_min": 1961
},
{
"epoch": 0.1520572450805009,
"grad_norm": 0.7370945804564825,
"learning_rate": 8.571428571428571e-06,
"loss": 0.5039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.521478533744812,
"step": 85,
"valid_targets_mean": 3797.7,
"valid_targets_min": 864
},
{
"epoch": 0.16100178890876565,
"grad_norm": 0.6156667263403908,
"learning_rate": 9.081632653061225e-06,
"loss": 0.4835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4676780104637146,
"step": 90,
"valid_targets_mean": 4991.2,
"valid_targets_min": 1062
},
{
"epoch": 0.16994633273703041,
"grad_norm": 0.6654121843319102,
"learning_rate": 9.591836734693878e-06,
"loss": 0.4785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48915815353393555,
"step": 95,
"valid_targets_mean": 3783.8,
"valid_targets_min": 705
},
{
"epoch": 0.17889087656529518,
"grad_norm": 0.5656478848830337,
"learning_rate": 1.0102040816326531e-05,
"loss": 0.4789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4592038094997406,
"step": 100,
"valid_targets_mean": 4946.6,
"valid_targets_min": 743
},
{
"epoch": 0.18783542039355994,
"grad_norm": 0.5753964943707206,
"learning_rate": 1.0612244897959186e-05,
"loss": 0.4481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4560643434524536,
"step": 105,
"valid_targets_mean": 4798.2,
"valid_targets_min": 1049
},
{
"epoch": 0.1967799642218247,
"grad_norm": 0.6637720894363032,
"learning_rate": 1.1122448979591838e-05,
"loss": 0.4584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47521623969078064,
"step": 110,
"valid_targets_mean": 3852.6,
"valid_targets_min": 1835
},
{
"epoch": 0.20572450805008943,
"grad_norm": 0.6937897615661168,
"learning_rate": 1.1632653061224491e-05,
"loss": 0.4686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45546483993530273,
"step": 115,
"valid_targets_mean": 4407.1,
"valid_targets_min": 2317
},
{
"epoch": 0.2146690518783542,
"grad_norm": 0.6387384496375781,
"learning_rate": 1.2142857142857142e-05,
"loss": 0.4378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.438065767288208,
"step": 120,
"valid_targets_mean": 4181.9,
"valid_targets_min": 1324
},
{
"epoch": 0.22361359570661896,
"grad_norm": 0.6327727639217386,
"learning_rate": 1.2653061224489798e-05,
"loss": 0.4679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47834330797195435,
"step": 125,
"valid_targets_mean": 4268.0,
"valid_targets_min": 1629
},
{
"epoch": 0.23255813953488372,
"grad_norm": 0.6622093710086933,
"learning_rate": 1.316326530612245e-05,
"loss": 0.427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4127560257911682,
"step": 130,
"valid_targets_mean": 3824.6,
"valid_targets_min": 1371
},
{
"epoch": 0.24150268336314848,
"grad_norm": 0.6285981733100382,
"learning_rate": 1.3673469387755102e-05,
"loss": 0.4394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4288730323314667,
"step": 135,
"valid_targets_mean": 3877.5,
"valid_targets_min": 1614
},
{
"epoch": 0.2504472271914132,
"grad_norm": 0.7388339921347419,
"learning_rate": 1.4183673469387755e-05,
"loss": 0.4429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.420998752117157,
"step": 140,
"valid_targets_mean": 3424.4,
"valid_targets_min": 780
},
{
"epoch": 0.259391771019678,
"grad_norm": 0.7101396979725441,
"learning_rate": 1.469387755102041e-05,
"loss": 0.4389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4431981146335602,
"step": 145,
"valid_targets_mean": 3347.7,
"valid_targets_min": 1109
},
{
"epoch": 0.26833631484794274,
"grad_norm": 0.6957496254556903,
"learning_rate": 1.5204081632653063e-05,
"loss": 0.4362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4714646339416504,
"step": 150,
"valid_targets_mean": 4095.1,
"valid_targets_min": 787
},
{
"epoch": 0.2772808586762075,
"grad_norm": 0.6624013827511412,
"learning_rate": 1.5714285714285715e-05,
"loss": 0.4158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4100586771965027,
"step": 155,
"valid_targets_mean": 3521.4,
"valid_targets_min": 1542
},
{
"epoch": 0.28622540250447226,
"grad_norm": 1.0921780130652612,
"learning_rate": 1.6224489795918368e-05,
"loss": 0.4217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44413700699806213,
"step": 160,
"valid_targets_mean": 3212.3,
"valid_targets_min": 945
},
{
"epoch": 0.295169946332737,
"grad_norm": 0.6555406982106572,
"learning_rate": 1.673469387755102e-05,
"loss": 0.411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43597084283828735,
"step": 165,
"valid_targets_mean": 4127.6,
"valid_targets_min": 732
},
{
"epoch": 0.3041144901610018,
"grad_norm": 0.7156947764144866,
"learning_rate": 1.7244897959183674e-05,
"loss": 0.4142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45090579986572266,
"step": 170,
"valid_targets_mean": 4241.0,
"valid_targets_min": 945
},
{
"epoch": 0.31305903398926654,
"grad_norm": 0.7843406742359783,
"learning_rate": 1.7755102040816327e-05,
"loss": 0.4088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.409368097782135,
"step": 175,
"valid_targets_mean": 3534.1,
"valid_targets_min": 607
},
{
"epoch": 0.3220035778175313,
"grad_norm": 0.6832085964985579,
"learning_rate": 1.826530612244898e-05,
"loss": 0.4323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4517691731452942,
"step": 180,
"valid_targets_mean": 4510.8,
"valid_targets_min": 1674
},
{
"epoch": 0.33094812164579607,
"grad_norm": 0.6430408307738346,
"learning_rate": 1.8775510204081636e-05,
"loss": 0.406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4193289875984192,
"step": 185,
"valid_targets_mean": 4455.5,
"valid_targets_min": 1476
},
{
"epoch": 0.33989266547406083,
"grad_norm": 0.6803856005045361,
"learning_rate": 1.928571428571429e-05,
"loss": 0.3807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.376784086227417,
"step": 190,
"valid_targets_mean": 3769.6,
"valid_targets_min": 715
},
{
"epoch": 0.3488372093023256,
"grad_norm": 0.7962416214555187,
"learning_rate": 1.979591836734694e-05,
"loss": 0.4095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40137556195259094,
"step": 195,
"valid_targets_mean": 3348.6,
"valid_targets_min": 831
},
{
"epoch": 0.35778175313059035,
"grad_norm": 0.6163018468674557,
"learning_rate": 2.0306122448979594e-05,
"loss": 0.4097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4052973985671997,
"step": 200,
"valid_targets_mean": 4064.9,
"valid_targets_min": 928
},
{
"epoch": 0.3667262969588551,
"grad_norm": 0.5825225301762951,
"learning_rate": 2.0816326530612247e-05,
"loss": 0.3895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.379678338766098,
"step": 205,
"valid_targets_mean": 4561.4,
"valid_targets_min": 1682
},
{
"epoch": 0.3756708407871199,
"grad_norm": 0.7186506278507635,
"learning_rate": 2.13265306122449e-05,
"loss": 0.3987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3955579996109009,
"step": 210,
"valid_targets_mean": 3334.4,
"valid_targets_min": 877
},
{
"epoch": 0.38461538461538464,
"grad_norm": 0.7102346399517735,
"learning_rate": 2.1836734693877552e-05,
"loss": 0.3996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3910446763038635,
"step": 215,
"valid_targets_mean": 3237.5,
"valid_targets_min": 1604
},
{
"epoch": 0.3935599284436494,
"grad_norm": 0.6261071087270799,
"learning_rate": 2.2346938775510205e-05,
"loss": 0.3979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.371921181678772,
"step": 220,
"valid_targets_mean": 4290.6,
"valid_targets_min": 1637
},
{
"epoch": 0.40250447227191416,
"grad_norm": 0.6481717381436756,
"learning_rate": 2.2857142857142858e-05,
"loss": 0.3915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3760562539100647,
"step": 225,
"valid_targets_mean": 3945.3,
"valid_targets_min": 1767
},
{
"epoch": 0.41144901610017887,
"grad_norm": 0.6201712385655748,
"learning_rate": 2.336734693877551e-05,
"loss": 0.3929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4008695185184479,
"step": 230,
"valid_targets_mean": 4555.8,
"valid_targets_min": 1312
},
{
"epoch": 0.4203935599284436,
"grad_norm": 0.6203763910651068,
"learning_rate": 2.3877551020408167e-05,
"loss": 0.3889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41413581371307373,
"step": 235,
"valid_targets_mean": 4777.6,
"valid_targets_min": 2200
},
{
"epoch": 0.4293381037567084,
"grad_norm": 0.65351087223048,
"learning_rate": 2.438775510204082e-05,
"loss": 0.3809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3872208297252655,
"step": 240,
"valid_targets_mean": 3722.7,
"valid_targets_min": 1608
},
{
"epoch": 0.43828264758497315,
"grad_norm": 0.6802074572655615,
"learning_rate": 2.4897959183673473e-05,
"loss": 0.3602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36208364367485046,
"step": 245,
"valid_targets_mean": 4687.7,
"valid_targets_min": 1944
},
{
"epoch": 0.4472271914132379,
"grad_norm": 0.8869715993980485,
"learning_rate": 2.5408163265306125e-05,
"loss": 0.3921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4071674942970276,
"step": 250,
"valid_targets_mean": 4066.7,
"valid_targets_min": 1633
},
{
"epoch": 0.4561717352415027,
"grad_norm": 0.7031570375051375,
"learning_rate": 2.5918367346938778e-05,
"loss": 0.3945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38449206948280334,
"step": 255,
"valid_targets_mean": 3275.8,
"valid_targets_min": 807
},
{
"epoch": 0.46511627906976744,
"grad_norm": 0.6401965700906631,
"learning_rate": 2.642857142857143e-05,
"loss": 0.3799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4059576094150543,
"step": 260,
"valid_targets_mean": 4899.2,
"valid_targets_min": 1869
},
{
"epoch": 0.4740608228980322,
"grad_norm": 0.68848774995671,
"learning_rate": 2.6938775510204084e-05,
"loss": 0.3899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42488914728164673,
"step": 265,
"valid_targets_mean": 4040.0,
"valid_targets_min": 1784
},
{
"epoch": 0.48300536672629696,
"grad_norm": 0.6555186879962056,
"learning_rate": 2.7448979591836737e-05,
"loss": 0.3747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37860578298568726,
"step": 270,
"valid_targets_mean": 3953.7,
"valid_targets_min": 1120
},
{
"epoch": 0.4919499105545617,
"grad_norm": 0.6958637124427978,
"learning_rate": 2.7959183673469393e-05,
"loss": 0.3657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.353659987449646,
"step": 275,
"valid_targets_mean": 4198.6,
"valid_targets_min": 867
},
{
"epoch": 0.5008944543828264,
"grad_norm": 0.7270956530331304,
"learning_rate": 2.8469387755102046e-05,
"loss": 0.3695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3616817593574524,
"step": 280,
"valid_targets_mean": 3319.2,
"valid_targets_min": 1008
},
{
"epoch": 0.5098389982110912,
"grad_norm": 0.6584523988533558,
"learning_rate": 2.89795918367347e-05,
"loss": 0.3639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3544594645500183,
"step": 285,
"valid_targets_mean": 3901.2,
"valid_targets_min": 1630
},
{
"epoch": 0.518783542039356,
"grad_norm": 0.6603276785502654,
"learning_rate": 2.948979591836735e-05,
"loss": 0.3765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3783223032951355,
"step": 290,
"valid_targets_mean": 4002.2,
"valid_targets_min": 1031
},
{
"epoch": 0.5277280858676208,
"grad_norm": 0.6256302987866349,
"learning_rate": 3.0000000000000004e-05,
"loss": 0.3801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3801421523094177,
"step": 295,
"valid_targets_mean": 4247.8,
"valid_targets_min": 825
},
{
"epoch": 0.5366726296958855,
"grad_norm": 0.641725168293166,
"learning_rate": 3.0510204081632654e-05,
"loss": 0.3661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3630704879760742,
"step": 300,
"valid_targets_mean": 3875.1,
"valid_targets_min": 1685
},
{
"epoch": 0.5456171735241503,
"grad_norm": 0.811210240684181,
"learning_rate": 3.102040816326531e-05,
"loss": 0.3741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36272579431533813,
"step": 305,
"valid_targets_mean": 3257.9,
"valid_targets_min": 1264
},
{
"epoch": 0.554561717352415,
"grad_norm": 0.667191922839525,
"learning_rate": 3.153061224489796e-05,
"loss": 0.3667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3673118054866791,
"step": 310,
"valid_targets_mean": 4112.9,
"valid_targets_min": 923
},
{
"epoch": 0.5635062611806798,
"grad_norm": 0.6483488033218554,
"learning_rate": 3.2040816326530615e-05,
"loss": 0.3695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3770442008972168,
"step": 315,
"valid_targets_mean": 4392.9,
"valid_targets_min": 2212
},
{
"epoch": 0.5724508050089445,
"grad_norm": 0.6594195347781112,
"learning_rate": 3.255102040816327e-05,
"loss": 0.3851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3894268274307251,
"step": 320,
"valid_targets_mean": 4147.8,
"valid_targets_min": 1795
},
{
"epoch": 0.5813953488372093,
"grad_norm": 0.5800198159071142,
"learning_rate": 3.306122448979592e-05,
"loss": 0.3612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3446458876132965,
"step": 325,
"valid_targets_mean": 4526.3,
"valid_targets_min": 1608
},
{
"epoch": 0.590339892665474,
"grad_norm": 0.6476011130202899,
"learning_rate": 3.357142857142858e-05,
"loss": 0.3631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36270543932914734,
"step": 330,
"valid_targets_mean": 4024.4,
"valid_targets_min": 1450
},
{
"epoch": 0.5992844364937389,
"grad_norm": 0.6522027257372564,
"learning_rate": 3.408163265306123e-05,
"loss": 0.3654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3855012357234955,
"step": 335,
"valid_targets_mean": 4163.4,
"valid_targets_min": 1675
},
{
"epoch": 0.6082289803220036,
"grad_norm": 0.6243810739429985,
"learning_rate": 3.459183673469388e-05,
"loss": 0.3671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3456933796405792,
"step": 340,
"valid_targets_mean": 3930.6,
"valid_targets_min": 1588
},
{
"epoch": 0.6171735241502684,
"grad_norm": 0.6158815913365016,
"learning_rate": 3.510204081632653e-05,
"loss": 0.3655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35427260398864746,
"step": 345,
"valid_targets_mean": 4795.0,
"valid_targets_min": 1934
},
{
"epoch": 0.6261180679785331,
"grad_norm": 0.7068523423045154,
"learning_rate": 3.561224489795918e-05,
"loss": 0.3687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4106198847293854,
"step": 350,
"valid_targets_mean": 4016.4,
"valid_targets_min": 648
},
{
"epoch": 0.6350626118067979,
"grad_norm": 0.7843744948487554,
"learning_rate": 3.612244897959184e-05,
"loss": 0.3634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36276382207870483,
"step": 355,
"valid_targets_mean": 3936.0,
"valid_targets_min": 1615
},
{
"epoch": 0.6440071556350626,
"grad_norm": 0.6872061405347063,
"learning_rate": 3.6632653061224494e-05,
"loss": 0.3486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33801645040512085,
"step": 360,
"valid_targets_mean": 3690.8,
"valid_targets_min": 1805
},
{
"epoch": 0.6529516994633273,
"grad_norm": 0.626374760633224,
"learning_rate": 3.714285714285715e-05,
"loss": 0.3685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3595544695854187,
"step": 365,
"valid_targets_mean": 4637.8,
"valid_targets_min": 621
},
{
"epoch": 0.6618962432915921,
"grad_norm": 0.6319521644936286,
"learning_rate": 3.76530612244898e-05,
"loss": 0.3652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37265145778656006,
"step": 370,
"valid_targets_mean": 4238.1,
"valid_targets_min": 1087
},
{
"epoch": 0.6708407871198568,
"grad_norm": 0.6238512565906754,
"learning_rate": 3.816326530612245e-05,
"loss": 0.3527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36174702644348145,
"step": 375,
"valid_targets_mean": 4511.5,
"valid_targets_min": 1518
},
{
"epoch": 0.6797853309481217,
"grad_norm": 0.569965173329661,
"learning_rate": 3.8673469387755105e-05,
"loss": 0.3637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34279459714889526,
"step": 380,
"valid_targets_mean": 4155.4,
"valid_targets_min": 1851
},
{
"epoch": 0.6887298747763864,
"grad_norm": 0.6707477926009685,
"learning_rate": 3.9183673469387755e-05,
"loss": 0.3725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3640945553779602,
"step": 385,
"valid_targets_mean": 4214.8,
"valid_targets_min": 767
},
{
"epoch": 0.6976744186046512,
"grad_norm": 0.5367271020119635,
"learning_rate": 3.969387755102041e-05,
"loss": 0.3422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3215610384941101,
"step": 390,
"valid_targets_mean": 4804.4,
"valid_targets_min": 1580
},
{
"epoch": 0.7066189624329159,
"grad_norm": 0.6919691468354696,
"learning_rate": 3.9999968156003224e-05,
"loss": 0.3659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3643749952316284,
"step": 395,
"valid_targets_mean": 3619.4,
"valid_targets_min": 993
},
{
"epoch": 0.7155635062611807,
"grad_norm": 0.6288859512995435,
"learning_rate": 3.999960991220401e-05,
"loss": 0.3524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3619106709957123,
"step": 400,
"valid_targets_mean": 4227.4,
"valid_targets_min": 2088
},
{
"epoch": 0.7245080500894454,
"grad_norm": 0.6317063641588481,
"learning_rate": 3.9998853626763316e-05,
"loss": 0.3548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3588660657405853,
"step": 405,
"valid_targets_mean": 4536.9,
"valid_targets_min": 1735
},
{
"epoch": 0.7334525939177102,
"grad_norm": 0.6057461041737375,
"learning_rate": 3.999769931473309e-05,
"loss": 0.3654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3536277711391449,
"step": 410,
"valid_targets_mean": 3928.1,
"valid_targets_min": 1408
},
{
"epoch": 0.7423971377459749,
"grad_norm": 0.5865439635131978,
"learning_rate": 3.999614699908698e-05,
"loss": 0.3447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3287227153778076,
"step": 415,
"valid_targets_mean": 4680.5,
"valid_targets_min": 1738
},
{
"epoch": 0.7513416815742398,
"grad_norm": 0.6236369468759124,
"learning_rate": 3.999419671071993e-05,
"loss": 0.36,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3473414182662964,
"step": 420,
"valid_targets_mean": 4636.2,
"valid_targets_min": 1483
},
{
"epoch": 0.7602862254025045,
"grad_norm": 0.6239705685634717,
"learning_rate": 3.999184848844746e-05,
"loss": 0.3558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31550854444503784,
"step": 425,
"valid_targets_mean": 3627.9,
"valid_targets_min": 1473
},
{
"epoch": 0.7692307692307693,
"grad_norm": 0.7215363445685998,
"learning_rate": 3.9989102379005026e-05,
"loss": 0.3531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3723289370536804,
"step": 430,
"valid_targets_mean": 3313.8,
"valid_targets_min": 777
},
{
"epoch": 0.778175313059034,
"grad_norm": 0.6314029660945639,
"learning_rate": 3.9985958437046976e-05,
"loss": 0.346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3319028913974762,
"step": 435,
"valid_targets_mean": 4074.1,
"valid_targets_min": 1150
},
{
"epoch": 0.7871198568872988,
"grad_norm": 0.671810871870371,
"learning_rate": 3.998241672514551e-05,
"loss": 0.3593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3606319725513458,
"step": 440,
"valid_targets_mean": 3716.7,
"valid_targets_min": 1462
},
{
"epoch": 0.7960644007155635,
"grad_norm": 0.6534639604048026,
"learning_rate": 3.997847731378946e-05,
"loss": 0.3545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3522427976131439,
"step": 445,
"valid_targets_mean": 3853.1,
"valid_targets_min": 1761
},
{
"epoch": 0.8050089445438283,
"grad_norm": 0.6256271897448633,
"learning_rate": 3.9974140281382844e-05,
"loss": 0.3523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3305948078632355,
"step": 450,
"valid_targets_mean": 4348.7,
"valid_targets_min": 2006
},
{
"epoch": 0.813953488372093,
"grad_norm": 0.665427663210199,
"learning_rate": 3.996940571424331e-05,
"loss": 0.3417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3263488709926605,
"step": 455,
"valid_targets_mean": 3719.2,
"valid_targets_min": 2056
},
{
"epoch": 0.8228980322003577,
"grad_norm": 0.6525668365849738,
"learning_rate": 3.996427370660045e-05,
"loss": 0.3491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.357142835855484,
"step": 460,
"valid_targets_mean": 4044.6,
"valid_targets_min": 681
},
{
"epoch": 0.8318425760286225,
"grad_norm": 0.5874893016038123,
"learning_rate": 3.995874436059389e-05,
"loss": 0.3463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34184402227401733,
"step": 465,
"valid_targets_mean": 4344.1,
"valid_targets_min": 1744
},
{
"epoch": 0.8407871198568873,
"grad_norm": 0.6543028013713276,
"learning_rate": 3.9952817786271264e-05,
"loss": 0.3456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3407524824142456,
"step": 470,
"valid_targets_mean": 4510.4,
"valid_targets_min": 2428
},
{
"epoch": 0.8497316636851521,
"grad_norm": 0.6482522573193757,
"learning_rate": 3.994649410158605e-05,
"loss": 0.3445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.336134672164917,
"step": 475,
"valid_targets_mean": 3787.4,
"valid_targets_min": 545
},
{
"epoch": 0.8586762075134168,
"grad_norm": 0.6618318888035204,
"learning_rate": 3.99397734323952e-05,
"loss": 0.3559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39081141352653503,
"step": 480,
"valid_targets_mean": 4617.5,
"valid_targets_min": 778
},
{
"epoch": 0.8676207513416816,
"grad_norm": 0.6461883560383084,
"learning_rate": 3.993265591245662e-05,
"loss": 0.3481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3543085753917694,
"step": 485,
"valid_targets_mean": 4650.8,
"valid_targets_min": 1304
},
{
"epoch": 0.8765652951699463,
"grad_norm": 0.7166558381651617,
"learning_rate": 3.992514168342655e-05,
"loss": 0.355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3686150312423706,
"step": 490,
"valid_targets_mean": 3723.8,
"valid_targets_min": 927
},
{
"epoch": 0.8855098389982111,
"grad_norm": 0.6815294274219248,
"learning_rate": 3.9917230894856705e-05,
"loss": 0.3437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3497094511985779,
"step": 495,
"valid_targets_mean": 3219.9,
"valid_targets_min": 669
},
{
"epoch": 0.8944543828264758,
"grad_norm": 0.78386232455594,
"learning_rate": 3.990892370419132e-05,
"loss": 0.3493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35013243556022644,
"step": 500,
"valid_targets_mean": 3843.9,
"valid_targets_min": 1370
},
{
"epoch": 0.9033989266547406,
"grad_norm": 0.6199422182618969,
"learning_rate": 3.9900220276764013e-05,
"loss": 0.3418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35459715127944946,
"step": 505,
"valid_targets_mean": 4905.9,
"valid_targets_min": 2222
},
{
"epoch": 0.9123434704830053,
"grad_norm": 0.6761601566190695,
"learning_rate": 3.989112078579449e-05,
"loss": 0.3363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34386712312698364,
"step": 510,
"valid_targets_mean": 3200.0,
"valid_targets_min": 1484
},
{
"epoch": 0.9212880143112702,
"grad_norm": 0.5809388892974982,
"learning_rate": 3.988162541238509e-05,
"loss": 0.3556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3644087314605713,
"step": 515,
"valid_targets_mean": 4901.0,
"valid_targets_min": 720
},
{
"epoch": 0.9302325581395349,
"grad_norm": 0.6670957667841473,
"learning_rate": 3.98717343455172e-05,
"loss": 0.3468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3259006440639496,
"step": 520,
"valid_targets_mean": 3929.0,
"valid_targets_min": 819
},
{
"epoch": 0.9391771019677997,
"grad_norm": 0.6133306725020052,
"learning_rate": 3.9861447782047495e-05,
"loss": 0.3521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3232124149799347,
"step": 525,
"valid_targets_mean": 4338.9,
"valid_targets_min": 1621
},
{
"epoch": 0.9481216457960644,
"grad_norm": 0.5945215828915712,
"learning_rate": 3.9850765926704e-05,
"loss": 0.3457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3464571535587311,
"step": 530,
"valid_targets_mean": 4751.4,
"valid_targets_min": 1880
},
{
"epoch": 0.9570661896243292,
"grad_norm": 0.616855899500005,
"learning_rate": 3.9839688992082004e-05,
"loss": 0.3406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33732545375823975,
"step": 535,
"valid_targets_mean": 3987.8,
"valid_targets_min": 1435
},
{
"epoch": 0.9660107334525939,
"grad_norm": 0.5714623187800117,
"learning_rate": 3.9828217198639884e-05,
"loss": 0.345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3435646891593933,
"step": 540,
"valid_targets_mean": 4915.8,
"valid_targets_min": 1400
},
{
"epoch": 0.9749552772808586,
"grad_norm": 0.6324746280014568,
"learning_rate": 3.981635077469468e-05,
"loss": 0.3394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3339131474494934,
"step": 545,
"valid_targets_mean": 3912.2,
"valid_targets_min": 1666
},
{
"epoch": 0.9838998211091234,
"grad_norm": 0.626118262073981,
"learning_rate": 3.980408995641751e-05,
"loss": 0.3219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33410966396331787,
"step": 550,
"valid_targets_mean": 4326.9,
"valid_targets_min": 1565
},
{
"epoch": 0.9928443649373881,
"grad_norm": 0.5559330654712583,
"learning_rate": 3.979143498782898e-05,
"loss": 0.3523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3249479830265045,
"step": 555,
"valid_targets_mean": 4442.0,
"valid_targets_min": 1579
},
{
"epoch": 1.0017889087656529,
"grad_norm": 0.5744899255811827,
"learning_rate": 3.977838612079419e-05,
"loss": 0.3482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34298670291900635,
"step": 560,
"valid_targets_mean": 4366.9,
"valid_targets_min": 1630
},
{
"epoch": 1.0107334525939178,
"grad_norm": 0.540064997986571,
"learning_rate": 3.976494361501786e-05,
"loss": 0.3255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29019173979759216,
"step": 565,
"valid_targets_mean": 4183.6,
"valid_targets_min": 1293
},
{
"epoch": 1.0196779964221825,
"grad_norm": 0.6708126937194594,
"learning_rate": 3.975110773803904e-05,
"loss": 0.3291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3077584505081177,
"step": 570,
"valid_targets_mean": 3365.9,
"valid_targets_min": 1599
},
{
"epoch": 1.0286225402504472,
"grad_norm": 0.5975546705521818,
"learning_rate": 3.973687876522587e-05,
"loss": 0.3099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3131313920021057,
"step": 575,
"valid_targets_mean": 3975.9,
"valid_targets_min": 1659
},
{
"epoch": 1.037567084078712,
"grad_norm": 0.5802313523133982,
"learning_rate": 3.9722256979770054e-05,
"loss": 0.3228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3223347067832947,
"step": 580,
"valid_targets_mean": 3876.8,
"valid_targets_min": 1256
},
{
"epoch": 1.0465116279069768,
"grad_norm": 0.5940502139996998,
"learning_rate": 3.970724267268125e-05,
"loss": 0.3316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3173867166042328,
"step": 585,
"valid_targets_mean": 3916.0,
"valid_targets_min": 1519
},
{
"epoch": 1.0554561717352415,
"grad_norm": 0.5526882078589692,
"learning_rate": 3.969183614278125e-05,
"loss": 0.3205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3090658187866211,
"step": 590,
"valid_targets_mean": 3783.8,
"valid_targets_min": 1558
},
{
"epoch": 1.0644007155635062,
"grad_norm": 0.5756072638500698,
"learning_rate": 3.9676037696698056e-05,
"loss": 0.3451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33000075817108154,
"step": 595,
"valid_targets_mean": 4377.0,
"valid_targets_min": 1580
},
{
"epoch": 1.073345259391771,
"grad_norm": 0.6209850679632152,
"learning_rate": 3.9659847648859775e-05,
"loss": 0.3358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3666132092475891,
"step": 600,
"valid_targets_mean": 3891.3,
"valid_targets_min": 766
},
{
"epoch": 1.0822898032200359,
"grad_norm": 0.574730620347152,
"learning_rate": 3.9643266321488354e-05,
"loss": 0.3297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31989532709121704,
"step": 605,
"valid_targets_mean": 4488.6,
"valid_targets_min": 1565
},
{
"epoch": 1.0912343470483006,
"grad_norm": 0.7137118300894771,
"learning_rate": 3.962629404459317e-05,
"loss": 0.3272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3319159746170044,
"step": 610,
"valid_targets_mean": 2972.9,
"valid_targets_min": 625
},
{
"epoch": 1.1001788908765653,
"grad_norm": 0.5664071308134078,
"learning_rate": 3.960893115596445e-05,
"loss": 0.3098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2983168065547943,
"step": 615,
"valid_targets_mean": 4385.4,
"valid_targets_min": 1484
},
{
"epoch": 1.10912343470483,
"grad_norm": 0.617788180227712,
"learning_rate": 3.959117800116658e-05,
"loss": 0.3321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3224518299102783,
"step": 620,
"valid_targets_mean": 3728.5,
"valid_targets_min": 988
},
{
"epoch": 1.118067978533095,
"grad_norm": 0.6068172667148498,
"learning_rate": 3.9573034933531195e-05,
"loss": 0.3308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3229108154773712,
"step": 625,
"valid_targets_mean": 4483.8,
"valid_targets_min": 1824
},
{
"epoch": 1.1270125223613596,
"grad_norm": 0.6113158435705944,
"learning_rate": 3.955450231415014e-05,
"loss": 0.3405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3196060061454773,
"step": 630,
"valid_targets_mean": 4137.5,
"valid_targets_min": 1364
},
{
"epoch": 1.1359570661896243,
"grad_norm": 0.6173710617052496,
"learning_rate": 3.953558051186834e-05,
"loss": 0.3333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34940510988235474,
"step": 635,
"valid_targets_mean": 4084.4,
"valid_targets_min": 1886
},
{
"epoch": 1.144901610017889,
"grad_norm": 0.6846373488774041,
"learning_rate": 3.95162699032764e-05,
"loss": 0.3244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3563871383666992,
"step": 640,
"valid_targets_mean": 4735.4,
"valid_targets_min": 1188
},
{
"epoch": 1.1538461538461537,
"grad_norm": 0.6569856707625712,
"learning_rate": 3.949657087270313e-05,
"loss": 0.3199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32631808519363403,
"step": 645,
"valid_targets_mean": 4182.3,
"valid_targets_min": 850
},
{
"epoch": 1.1627906976744187,
"grad_norm": 0.5672879733062905,
"learning_rate": 3.947648381220789e-05,
"loss": 0.3152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31764596700668335,
"step": 650,
"valid_targets_mean": 3908.7,
"valid_targets_min": 646
},
{
"epoch": 1.1717352415026834,
"grad_norm": 0.6801671519180097,
"learning_rate": 3.9456009121572824e-05,
"loss": 0.3233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31651636958122253,
"step": 655,
"valid_targets_mean": 3767.4,
"valid_targets_min": 1485
},
{
"epoch": 1.180679785330948,
"grad_norm": 0.5776768005096825,
"learning_rate": 3.943514720829485e-05,
"loss": 0.3302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3585665225982666,
"step": 660,
"valid_targets_mean": 4321.3,
"valid_targets_min": 1595
},
{
"epoch": 1.1896243291592128,
"grad_norm": 0.6632996529951345,
"learning_rate": 3.941389848757756e-05,
"loss": 0.3293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34740591049194336,
"step": 665,
"valid_targets_mean": 3854.9,
"valid_targets_min": 1643
},
{
"epoch": 1.1985688729874777,
"grad_norm": 0.6568776669609784,
"learning_rate": 3.9392263382323e-05,
"loss": 0.3271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3057899475097656,
"step": 670,
"valid_targets_mean": 3277.4,
"valid_targets_min": 1615
},
{
"epoch": 1.2075134168157424,
"grad_norm": 0.6270834310864767,
"learning_rate": 3.93702423231232e-05,
"loss": 0.3227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32783782482147217,
"step": 675,
"valid_targets_mean": 3216.5,
"valid_targets_min": 1055
},
{
"epoch": 1.2164579606440071,
"grad_norm": 0.6305095200057445,
"learning_rate": 3.9347835748251645e-05,
"loss": 0.332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3536560535430908,
"step": 680,
"valid_targets_mean": 3572.4,
"valid_targets_min": 552
},
{
"epoch": 1.2254025044722718,
"grad_norm": 0.5736045805917658,
"learning_rate": 3.9325044103654526e-05,
"loss": 0.3348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3276847004890442,
"step": 685,
"valid_targets_mean": 3811.6,
"valid_targets_min": 1374
},
{
"epoch": 1.2343470483005368,
"grad_norm": 0.5244473851418727,
"learning_rate": 3.9301867842941867e-05,
"loss": 0.3302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3139815926551819,
"step": 690,
"valid_targets_mean": 4468.8,
"valid_targets_min": 1504
},
{
"epoch": 1.2432915921288015,
"grad_norm": 0.5751467981153631,
"learning_rate": 3.9278307427378495e-05,
"loss": 0.335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.320250928401947,
"step": 695,
"valid_targets_mean": 4114.9,
"valid_targets_min": 2051
},
{
"epoch": 1.2522361359570662,
"grad_norm": 0.57724364766724,
"learning_rate": 3.92543633258749e-05,
"loss": 0.3328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3237752914428711,
"step": 700,
"valid_targets_mean": 4272.7,
"valid_targets_min": 1724
},
{
"epoch": 1.2611806797853309,
"grad_norm": 0.6222962371838422,
"learning_rate": 3.923003601497785e-05,
"loss": 0.3096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2992010712623596,
"step": 705,
"valid_targets_mean": 3838.6,
"valid_targets_min": 1073
},
{
"epoch": 1.2701252236135958,
"grad_norm": 0.5745002540877785,
"learning_rate": 3.920532597886091e-05,
"loss": 0.3273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33431553840637207,
"step": 710,
"valid_targets_mean": 4709.8,
"valid_targets_min": 1660
},
{
"epoch": 1.2790697674418605,
"grad_norm": 0.8250895929655195,
"learning_rate": 3.918023370931485e-05,
"loss": 0.3325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34380948543548584,
"step": 715,
"valid_targets_mean": 3260.9,
"valid_targets_min": 1452
},
{
"epoch": 1.2880143112701252,
"grad_norm": 0.5891395257155815,
"learning_rate": 3.915475970573782e-05,
"loss": 0.3116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31047481298446655,
"step": 720,
"valid_targets_mean": 3394.5,
"valid_targets_min": 728
},
{
"epoch": 1.29695885509839,
"grad_norm": 0.5492069212467995,
"learning_rate": 3.9128904475125414e-05,
"loss": 0.3236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3350293040275574,
"step": 725,
"valid_targets_mean": 4490.6,
"valid_targets_min": 1470
},
{
"epoch": 1.3059033989266546,
"grad_norm": 0.606471839392876,
"learning_rate": 3.910266853206058e-05,
"loss": 0.3227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3107641935348511,
"step": 730,
"valid_targets_mean": 3896.6,
"valid_targets_min": 545
},
{
"epoch": 1.3148479427549196,
"grad_norm": 0.6158261916551597,
"learning_rate": 3.907605239870342e-05,
"loss": 0.3187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31847408413887024,
"step": 735,
"valid_targets_mean": 3804.2,
"valid_targets_min": 741
},
{
"epoch": 1.3237924865831843,
"grad_norm": 0.6321605305603367,
"learning_rate": 3.904905660478072e-05,
"loss": 0.3249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3120426833629608,
"step": 740,
"valid_targets_mean": 3962.6,
"valid_targets_min": 1180
},
{
"epoch": 1.332737030411449,
"grad_norm": 0.5592948617131595,
"learning_rate": 3.9021681687575465e-05,
"loss": 0.3179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.323030024766922,
"step": 745,
"valid_targets_mean": 4431.0,
"valid_targets_min": 1535
},
{
"epoch": 1.341681574239714,
"grad_norm": 0.5325276240664678,
"learning_rate": 3.8993928191916134e-05,
"loss": 0.3142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30110353231430054,
"step": 750,
"valid_targets_mean": 4319.6,
"valid_targets_min": 1804
},
{
"epoch": 1.3506261180679786,
"grad_norm": 0.5538507843730288,
"learning_rate": 3.8965796670165856e-05,
"loss": 0.3166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31126099824905396,
"step": 755,
"valid_targets_mean": 4311.1,
"valid_targets_min": 1641
},
{
"epoch": 1.3595706618962433,
"grad_norm": 0.5678960091362133,
"learning_rate": 3.893728768221139e-05,
"loss": 0.3244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.305950790643692,
"step": 760,
"valid_targets_mean": 3987.8,
"valid_targets_min": 2194
},
{
"epoch": 1.368515205724508,
"grad_norm": 0.5888212617780767,
"learning_rate": 3.8908401795452033e-05,
"loss": 0.3307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3165014684200287,
"step": 765,
"valid_targets_mean": 4065.1,
"valid_targets_min": 1441
},
{
"epoch": 1.3774597495527727,
"grad_norm": 0.6376960259257772,
"learning_rate": 3.8879139584788286e-05,
"loss": 0.3235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3417049050331116,
"step": 770,
"valid_targets_mean": 3551.9,
"valid_targets_min": 1828
},
{
"epoch": 1.3864042933810374,
"grad_norm": 0.5627522323734243,
"learning_rate": 3.884950163261042e-05,
"loss": 0.3218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32489728927612305,
"step": 775,
"valid_targets_mean": 3681.4,
"valid_targets_min": 1565
},
{
"epoch": 1.3953488372093024,
"grad_norm": 0.643663426567113,
"learning_rate": 3.8819488528786904e-05,
"loss": 0.3162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29307177662849426,
"step": 780,
"valid_targets_mean": 3725.8,
"valid_targets_min": 778
},
{
"epoch": 1.404293381037567,
"grad_norm": 0.5860397601189946,
"learning_rate": 3.878910087065264e-05,
"loss": 0.3255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31179744005203247,
"step": 785,
"valid_targets_mean": 3490.3,
"valid_targets_min": 997
},
{
"epoch": 1.4132379248658318,
"grad_norm": 0.6006178361895881,
"learning_rate": 3.8758339262997094e-05,
"loss": 0.3207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3223787546157837,
"step": 790,
"valid_targets_mean": 3681.4,
"valid_targets_min": 1614
},
{
"epoch": 1.4221824686940967,
"grad_norm": 0.5703573435024017,
"learning_rate": 3.872720431805224e-05,
"loss": 0.3108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31823939085006714,
"step": 795,
"valid_targets_mean": 3783.3,
"valid_targets_min": 474
},
{
"epoch": 1.4311270125223614,
"grad_norm": 0.5583054675958945,
"learning_rate": 3.86956966554804e-05,
"loss": 0.3226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3209839463233948,
"step": 800,
"valid_targets_mean": 4748.8,
"valid_targets_min": 1829
},
{
"epoch": 1.4400715563506261,
"grad_norm": 0.5734451464718057,
"learning_rate": 3.8663816902361896e-05,
"loss": 0.3223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3395638167858124,
"step": 805,
"valid_targets_mean": 4469.4,
"valid_targets_min": 954
},
{
"epoch": 1.4490161001788908,
"grad_norm": 0.6240967521849574,
"learning_rate": 3.863156569318256e-05,
"loss": 0.3185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.342720627784729,
"step": 810,
"valid_targets_mean": 3274.9,
"valid_targets_min": 873
},
{
"epoch": 1.4579606440071555,
"grad_norm": 0.5839916094456372,
"learning_rate": 3.8598943669821124e-05,
"loss": 0.3352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34921061992645264,
"step": 815,
"valid_targets_mean": 4149.1,
"valid_targets_min": 1776
},
{
"epoch": 1.4669051878354205,
"grad_norm": 0.5327258875676051,
"learning_rate": 3.856595148153643e-05,
"loss": 0.332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29739612340927124,
"step": 820,
"valid_targets_mean": 4420.4,
"valid_targets_min": 1722
},
{
"epoch": 1.4758497316636852,
"grad_norm": 0.5726474256279158,
"learning_rate": 3.853258978495454e-05,
"loss": 0.3283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3427349925041199,
"step": 825,
"valid_targets_mean": 4086.2,
"valid_targets_min": 754
},
{
"epoch": 1.4847942754919499,
"grad_norm": 0.5586681064868766,
"learning_rate": 3.8498859244055616e-05,
"loss": 0.3201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30017322301864624,
"step": 830,
"valid_targets_mean": 4213.1,
"valid_targets_min": 1521
},
{
"epoch": 1.4937388193202148,
"grad_norm": 0.5545114860278723,
"learning_rate": 3.8464760530160756e-05,
"loss": 0.3041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3249306082725525,
"step": 835,
"valid_targets_mean": 4479.8,
"valid_targets_min": 1882
},
{
"epoch": 1.5026833631484795,
"grad_norm": 0.5851321941617261,
"learning_rate": 3.843029432191858e-05,
"loss": 0.32,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3026468753814697,
"step": 840,
"valid_targets_mean": 3582.4,
"valid_targets_min": 1779
},
{
"epoch": 1.5116279069767442,
"grad_norm": 0.6559733463498192,
"learning_rate": 3.839546130529179e-05,
"loss": 0.3174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33914104104042053,
"step": 845,
"valid_targets_mean": 4173.3,
"valid_targets_min": 1823
},
{
"epoch": 1.520572450805009,
"grad_norm": 0.6371050604836407,
"learning_rate": 3.8360262173543467e-05,
"loss": 0.3255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32565081119537354,
"step": 850,
"valid_targets_mean": 3549.8,
"valid_targets_min": 822
},
{
"epoch": 1.5295169946332736,
"grad_norm": 0.5768187274321938,
"learning_rate": 3.8324697627223263e-05,
"loss": 0.317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3176955282688141,
"step": 855,
"valid_targets_mean": 3880.8,
"valid_targets_min": 671
},
{
"epoch": 1.5384615384615383,
"grad_norm": 0.5482702475809518,
"learning_rate": 3.828876837415352e-05,
"loss": 0.3107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2995319962501526,
"step": 860,
"valid_targets_mean": 4659.9,
"valid_targets_min": 1931
},
{
"epoch": 1.5474060822898033,
"grad_norm": 0.6038821934595454,
"learning_rate": 3.8252475129415127e-05,
"loss": 0.3161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32784345746040344,
"step": 865,
"valid_targets_mean": 3603.8,
"valid_targets_min": 747
},
{
"epoch": 1.556350626118068,
"grad_norm": 0.5283881224885371,
"learning_rate": 3.82158186153333e-05,
"loss": 0.3159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30888307094573975,
"step": 870,
"valid_targets_mean": 4141.3,
"valid_targets_min": 1381
},
{
"epoch": 1.5652951699463329,
"grad_norm": 0.5983795772826802,
"learning_rate": 3.817879956146323e-05,
"loss": 0.3294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34233012795448303,
"step": 875,
"valid_targets_mean": 4115.4,
"valid_targets_min": 1008
},
{
"epoch": 1.5742397137745976,
"grad_norm": 0.6611039790326494,
"learning_rate": 3.814141870457553e-05,
"loss": 0.3115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3333245813846588,
"step": 880,
"valid_targets_mean": 3703.6,
"valid_targets_min": 848
},
{
"epoch": 1.5831842576028623,
"grad_norm": 0.5991870251745893,
"learning_rate": 3.810367678864159e-05,
"loss": 0.3237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30103540420532227,
"step": 885,
"valid_targets_mean": 3587.0,
"valid_targets_min": 1491
},
{
"epoch": 1.592128801431127,
"grad_norm": 0.5618095876534,
"learning_rate": 3.806557456481878e-05,
"loss": 0.3343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31948399543762207,
"step": 890,
"valid_targets_mean": 3862.9,
"valid_targets_min": 715
},
{
"epoch": 1.6010733452593917,
"grad_norm": 0.6334383283680136,
"learning_rate": 3.8027112791435466e-05,
"loss": 0.3288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31764253973960876,
"step": 895,
"valid_targets_mean": 3225.9,
"valid_targets_min": 607
},
{
"epoch": 1.6100178890876564,
"grad_norm": 0.582112973475375,
"learning_rate": 3.7988292233975947e-05,
"loss": 0.3329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33960235118865967,
"step": 900,
"valid_targets_mean": 4268.9,
"valid_targets_min": 1483
},
{
"epoch": 1.6189624329159211,
"grad_norm": 0.5815635189350303,
"learning_rate": 3.7949113665065226e-05,
"loss": 0.3234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3374456763267517,
"step": 905,
"valid_targets_mean": 4174.2,
"valid_targets_min": 687
},
{
"epoch": 1.627906976744186,
"grad_norm": 1.0497579746341565,
"learning_rate": 3.7909577864453593e-05,
"loss": 0.325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3294409513473511,
"step": 910,
"valid_targets_mean": 4344.9,
"valid_targets_min": 827
},
{
"epoch": 1.6368515205724508,
"grad_norm": 0.567491242330487,
"learning_rate": 3.786968561900116e-05,
"loss": 0.3105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2935563325881958,
"step": 915,
"valid_targets_mean": 3874.4,
"valid_targets_min": 1672
},
{
"epoch": 1.6457960644007157,
"grad_norm": 0.6318743528248707,
"learning_rate": 3.782943772266213e-05,
"loss": 0.3191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3036611080169678,
"step": 920,
"valid_targets_mean": 3250.3,
"valid_targets_min": 911
},
{
"epoch": 1.6547406082289804,
"grad_norm": 0.6392903008216162,
"learning_rate": 3.7788834976469095e-05,
"loss": 0.3083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3205622434616089,
"step": 925,
"valid_targets_mean": 3400.8,
"valid_targets_min": 978
},
{
"epoch": 1.663685152057245,
"grad_norm": 0.5491612081779448,
"learning_rate": 3.7747878188516965e-05,
"loss": 0.3137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3106827437877655,
"step": 930,
"valid_targets_mean": 4198.3,
"valid_targets_min": 1757
},
{
"epoch": 1.6726296958855098,
"grad_norm": 0.5396436465197288,
"learning_rate": 3.770656817394703e-05,
"loss": 0.3168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30610522627830505,
"step": 935,
"valid_targets_mean": 4018.6,
"valid_targets_min": 1540
},
{
"epoch": 1.6815742397137745,
"grad_norm": 0.4890047892792955,
"learning_rate": 3.7664905754930616e-05,
"loss": 0.3155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31638064980506897,
"step": 940,
"valid_targets_mean": 4828.7,
"valid_targets_min": 1454
},
{
"epoch": 1.6905187835420392,
"grad_norm": 0.5488512250424282,
"learning_rate": 3.762289176065276e-05,
"loss": 0.3167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3114585280418396,
"step": 945,
"valid_targets_mean": 4037.7,
"valid_targets_min": 600
},
{
"epoch": 1.6994633273703041,
"grad_norm": 0.643517620390725,
"learning_rate": 3.758052702729576e-05,
"loss": 0.3127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.305495023727417,
"step": 950,
"valid_targets_mean": 4262.5,
"valid_targets_min": 1184
},
{
"epoch": 1.7084078711985689,
"grad_norm": 0.5457086631910586,
"learning_rate": 3.753781239802245e-05,
"loss": 0.3132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2907237410545349,
"step": 955,
"valid_targets_mean": 3675.6,
"valid_targets_min": 1495
},
{
"epoch": 1.7173524150268338,
"grad_norm": 0.5241171467893824,
"learning_rate": 3.749474872295946e-05,
"loss": 0.3125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2793015241622925,
"step": 960,
"valid_targets_mean": 3477.6,
"valid_targets_min": 1785
},
{
"epoch": 1.7262969588550985,
"grad_norm": 0.5513650345883626,
"learning_rate": 3.745133685918032e-05,
"loss": 0.321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3557593822479248,
"step": 965,
"valid_targets_mean": 4640.1,
"valid_targets_min": 2109
},
{
"epoch": 1.7352415026833632,
"grad_norm": 0.526841550249395,
"learning_rate": 3.740757767068834e-05,
"loss": 0.3022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2938116788864136,
"step": 970,
"valid_targets_mean": 4656.8,
"valid_targets_min": 1424
},
{
"epoch": 1.744186046511628,
"grad_norm": 0.6055246993537275,
"learning_rate": 3.7363472028399476e-05,
"loss": 0.3248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3154802918434143,
"step": 975,
"valid_targets_mean": 3483.9,
"valid_targets_min": 1692
},
{
"epoch": 1.7531305903398926,
"grad_norm": 0.603322342815491,
"learning_rate": 3.7319020810124965e-05,
"loss": 0.3021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3003346920013428,
"step": 980,
"valid_targets_mean": 3828.6,
"valid_targets_min": 621
},
{
"epoch": 1.7620751341681573,
"grad_norm": 0.5626166447337553,
"learning_rate": 3.727422490055386e-05,
"loss": 0.3148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3034425973892212,
"step": 985,
"valid_targets_mean": 4099.6,
"valid_targets_min": 836
},
{
"epoch": 1.7710196779964222,
"grad_norm": 0.4590848854306322,
"learning_rate": 3.72290851912354e-05,
"loss": 0.314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3024485111236572,
"step": 990,
"valid_targets_mean": 5403.2,
"valid_targets_min": 2338
},
{
"epoch": 1.779964221824687,
"grad_norm": 0.5634666645265822,
"learning_rate": 3.718360258056133e-05,
"loss": 0.3173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30547595024108887,
"step": 995,
"valid_targets_mean": 3841.9,
"valid_targets_min": 1685
},
{
"epoch": 1.7889087656529516,
"grad_norm": 0.5618746894535553,
"learning_rate": 3.713777797374794e-05,
"loss": 0.322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33232662081718445,
"step": 1000,
"valid_targets_mean": 3674.4,
"valid_targets_min": 663
},
{
"epoch": 1.7978533094812166,
"grad_norm": 0.6550093924031264,
"learning_rate": 3.709161228281811e-05,
"loss": 0.3142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30034154653549194,
"step": 1005,
"valid_targets_mean": 3396.8,
"valid_targets_min": 1109
},
{
"epoch": 1.8067978533094813,
"grad_norm": 0.6073692572388313,
"learning_rate": 3.704510642658314e-05,
"loss": 0.3203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3542916178703308,
"step": 1010,
"valid_targets_mean": 3448.8,
"valid_targets_min": 795
},
{
"epoch": 1.815742397137746,
"grad_norm": 0.6171396796866804,
"learning_rate": 3.699826133062443e-05,
"loss": 0.3118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3225131630897522,
"step": 1015,
"valid_targets_mean": 3759.8,
"valid_targets_min": 1114
},
{
"epoch": 1.8246869409660107,
"grad_norm": 0.6099863228762299,
"learning_rate": 3.6951077927275126e-05,
"loss": 0.332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3298446834087372,
"step": 1020,
"valid_targets_mean": 3864.5,
"valid_targets_min": 1052
},
{
"epoch": 1.8336314847942754,
"grad_norm": 0.5524141402638945,
"learning_rate": 3.6903557155601503e-05,
"loss": 0.3117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.291124165058136,
"step": 1025,
"valid_targets_mean": 3606.2,
"valid_targets_min": 1973
},
{
"epoch": 1.84257602862254,
"grad_norm": 0.5169690200399784,
"learning_rate": 3.685569996138431e-05,
"loss": 0.3065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3137836456298828,
"step": 1030,
"valid_targets_mean": 4619.6,
"valid_targets_min": 1219
},
{
"epoch": 1.851520572450805,
"grad_norm": 0.5316610746415315,
"learning_rate": 3.680750729709993e-05,
"loss": 0.3173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33356547355651855,
"step": 1035,
"valid_targets_mean": 4652.9,
"valid_targets_min": 981
},
{
"epoch": 1.8604651162790697,
"grad_norm": 0.5559235856424838,
"learning_rate": 3.675898012190143e-05,
"loss": 0.3105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31008175015449524,
"step": 1040,
"valid_targets_mean": 3755.5,
"valid_targets_min": 1368
},
{
"epoch": 1.8694096601073347,
"grad_norm": 0.6298206469639374,
"learning_rate": 3.6710119401599474e-05,
"loss": 0.3252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33441591262817383,
"step": 1045,
"valid_targets_mean": 3854.9,
"valid_targets_min": 1316
},
{
"epoch": 1.8783542039355994,
"grad_norm": 0.5389022768825737,
"learning_rate": 3.6660926108643086e-05,
"loss": 0.3179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3052956461906433,
"step": 1050,
"valid_targets_mean": 3938.4,
"valid_targets_min": 680
},
{
"epoch": 1.887298747763864,
"grad_norm": 0.5801147385776886,
"learning_rate": 3.661140122210032e-05,
"loss": 0.309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32204878330230713,
"step": 1055,
"valid_targets_mean": 3663.2,
"valid_targets_min": 839
},
{
"epoch": 1.8962432915921288,
"grad_norm": 0.5606779533763502,
"learning_rate": 3.656154572763877e-05,
"loss": 0.3211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3348532021045685,
"step": 1060,
"valid_targets_mean": 3548.2,
"valid_targets_min": 622
},
{
"epoch": 1.9051878354203935,
"grad_norm": 0.5573332010454619,
"learning_rate": 3.651136061750592e-05,
"loss": 0.3252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3448393940925598,
"step": 1065,
"valid_targets_mean": 3946.6,
"valid_targets_min": 748
},
{
"epoch": 1.9141323792486582,
"grad_norm": 0.5490778045530725,
"learning_rate": 3.646084689050942e-05,
"loss": 0.3189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3161720633506775,
"step": 1070,
"valid_targets_mean": 3859.4,
"valid_targets_min": 751
},
{
"epoch": 1.9230769230769231,
"grad_norm": 0.5894163589977383,
"learning_rate": 3.641000555199725e-05,
"loss": 0.3105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3114989697933197,
"step": 1075,
"valid_targets_mean": 3375.2,
"valid_targets_min": 710
},
{
"epoch": 1.9320214669051878,
"grad_norm": 0.5349889235476035,
"learning_rate": 3.6358837613837604e-05,
"loss": 0.315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30235400795936584,
"step": 1080,
"valid_targets_mean": 3989.0,
"valid_targets_min": 1691
},
{
"epoch": 1.9409660107334525,
"grad_norm": 0.6736523490222415,
"learning_rate": 3.630734409439887e-05,
"loss": 0.3227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3229427635669708,
"step": 1085,
"valid_targets_mean": 3905.6,
"valid_targets_min": 950
},
{
"epoch": 1.9499105545617175,
"grad_norm": 0.5727534078817972,
"learning_rate": 3.625552601852928e-05,
"loss": 0.3119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31192246079444885,
"step": 1090,
"valid_targets_mean": 3771.9,
"valid_targets_min": 658
},
{
"epoch": 1.9588550983899822,
"grad_norm": 0.6120985202643506,
"learning_rate": 3.6203384417536566e-05,
"loss": 0.31,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3371928036212921,
"step": 1095,
"valid_targets_mean": 3940.8,
"valid_targets_min": 1372
},
{
"epoch": 1.9677996422182469,
"grad_norm": 0.5549601857245118,
"learning_rate": 3.615092032916736e-05,
"loss": 0.3106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3066266179084778,
"step": 1100,
"valid_targets_mean": 3876.9,
"valid_targets_min": 1122
},
{
"epoch": 1.9767441860465116,
"grad_norm": 0.5131380359563835,
"learning_rate": 3.6098134797586646e-05,
"loss": 0.3019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2861686646938324,
"step": 1105,
"valid_targets_mean": 4285.8,
"valid_targets_min": 1706
},
{
"epoch": 1.9856887298747763,
"grad_norm": 0.527229318850269,
"learning_rate": 3.604502887335688e-05,
"loss": 0.3178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.317037433385849,
"step": 1110,
"valid_targets_mean": 4532.9,
"valid_targets_min": 1358
},
{
"epoch": 1.994633273703041,
"grad_norm": 0.6132587433714716,
"learning_rate": 3.599160361341715e-05,
"loss": 0.3246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35272109508514404,
"step": 1115,
"valid_targets_mean": 4244.4,
"valid_targets_min": 1862
},
{
"epoch": 2.0035778175313057,
"grad_norm": 0.5593406465085026,
"learning_rate": 3.59378600810621e-05,
"loss": 0.3091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30550044775009155,
"step": 1120,
"valid_targets_mean": 3629.8,
"valid_targets_min": 1287
},
{
"epoch": 2.012522361359571,
"grad_norm": 0.5559035299742234,
"learning_rate": 3.588379934592078e-05,
"loss": 0.3007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2961064577102661,
"step": 1125,
"valid_targets_mean": 4219.7,
"valid_targets_min": 2082
},
{
"epoch": 2.0214669051878356,
"grad_norm": 0.5222588666049305,
"learning_rate": 3.5829422483935374e-05,
"loss": 0.2991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2910686135292053,
"step": 1130,
"valid_targets_mean": 4635.5,
"valid_targets_min": 720
},
{
"epoch": 2.0304114490161003,
"grad_norm": 0.5492856936529431,
"learning_rate": 3.577473057733975e-05,
"loss": 0.2912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2696704864501953,
"step": 1135,
"valid_targets_mean": 3424.2,
"valid_targets_min": 1441
},
{
"epoch": 2.039355992844365,
"grad_norm": 0.5805919255184491,
"learning_rate": 3.571972471463795e-05,
"loss": 0.2914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2642717957496643,
"step": 1140,
"valid_targets_mean": 3726.3,
"valid_targets_min": 1936
},
{
"epoch": 2.0483005366726297,
"grad_norm": 0.5654677847464393,
"learning_rate": 3.566440599058253e-05,
"loss": 0.2984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31323423981666565,
"step": 1145,
"valid_targets_mean": 4155.1,
"valid_targets_min": 1574
},
{
"epoch": 2.0572450805008944,
"grad_norm": 0.6258943561807471,
"learning_rate": 3.560877550615275e-05,
"loss": 0.2852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2951895594596863,
"step": 1150,
"valid_targets_mean": 3085.2,
"valid_targets_min": 732
},
{
"epoch": 2.066189624329159,
"grad_norm": 0.48185508119836556,
"learning_rate": 3.555283436853267e-05,
"loss": 0.292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.277047336101532,
"step": 1155,
"valid_targets_mean": 4333.4,
"valid_targets_min": 1674
},
{
"epoch": 2.075134168157424,
"grad_norm": 0.5337477447807386,
"learning_rate": 3.549658369108911e-05,
"loss": 0.2844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.290058970451355,
"step": 1160,
"valid_targets_mean": 4003.7,
"valid_targets_min": 667
},
{
"epoch": 2.084078711985689,
"grad_norm": 0.573076273715761,
"learning_rate": 3.544002459334952e-05,
"loss": 0.2941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2986866235733032,
"step": 1165,
"valid_targets_mean": 3509.6,
"valid_targets_min": 827
},
{
"epoch": 2.0930232558139537,
"grad_norm": 0.6434121744773865,
"learning_rate": 3.5383158200979636e-05,
"loss": 0.3013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29687678813934326,
"step": 1170,
"valid_targets_mean": 2894.1,
"valid_targets_min": 1532
},
{
"epoch": 2.1019677996422184,
"grad_norm": 1.0345078244238066,
"learning_rate": 3.532598564576117e-05,
"loss": 0.2923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27670419216156006,
"step": 1175,
"valid_targets_mean": 3932.2,
"valid_targets_min": 798
},
{
"epoch": 2.110912343470483,
"grad_norm": 0.5405380881490202,
"learning_rate": 3.526850806556919e-05,
"loss": 0.302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2855556011199951,
"step": 1180,
"valid_targets_mean": 3778.3,
"valid_targets_min": 696
},
{
"epoch": 2.1198568872987478,
"grad_norm": 0.5976648828621719,
"learning_rate": 3.521072660434952e-05,
"loss": 0.2899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28265494108200073,
"step": 1185,
"valid_targets_mean": 3455.8,
"valid_targets_min": 866
},
{
"epoch": 2.1288014311270125,
"grad_norm": 0.518386120621355,
"learning_rate": 3.5152642412095984e-05,
"loss": 0.2869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2857966721057892,
"step": 1190,
"valid_targets_mean": 4677.8,
"valid_targets_min": 2305
},
{
"epoch": 2.137745974955277,
"grad_norm": 0.5447094720161839,
"learning_rate": 3.5094256644827474e-05,
"loss": 0.3016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3032097816467285,
"step": 1195,
"valid_targets_mean": 4234.6,
"valid_targets_min": 1055
},
{
"epoch": 2.146690518783542,
"grad_norm": 0.5406564490251188,
"learning_rate": 3.503557046456501e-05,
"loss": 0.2806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2764890193939209,
"step": 1200,
"valid_targets_mean": 4025.9,
"valid_targets_min": 1610
},
{
"epoch": 2.1556350626118066,
"grad_norm": 0.5167292603339387,
"learning_rate": 3.4976585039308535e-05,
"loss": 0.3053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2947821617126465,
"step": 1205,
"valid_targets_mean": 4129.1,
"valid_targets_min": 1605
},
{
"epoch": 2.1645796064400717,
"grad_norm": 0.7469544699185315,
"learning_rate": 3.491730154301372e-05,
"loss": 0.3068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3116210401058197,
"step": 1210,
"valid_targets_mean": 3251.5,
"valid_targets_min": 1606
},
{
"epoch": 2.1735241502683365,
"grad_norm": 0.5769662832718492,
"learning_rate": 3.485772115556859e-05,
"loss": 0.2967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2989100217819214,
"step": 1215,
"valid_targets_mean": 3717.8,
"valid_targets_min": 1327
},
{
"epoch": 2.182468694096601,
"grad_norm": 0.5888498917346773,
"learning_rate": 3.4797845062770045e-05,
"loss": 0.2985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2971697747707367,
"step": 1220,
"valid_targets_mean": 3346.9,
"valid_targets_min": 1827
},
{
"epoch": 2.191413237924866,
"grad_norm": 0.5385601523875473,
"learning_rate": 3.473767445630022e-05,
"loss": 0.2938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2714182436466217,
"step": 1225,
"valid_targets_mean": 3834.8,
"valid_targets_min": 1393
},
{
"epoch": 2.2003577817531306,
"grad_norm": 0.5095146941186255,
"learning_rate": 3.467721053370284e-05,
"loss": 0.2914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3141205608844757,
"step": 1230,
"valid_targets_mean": 4676.5,
"valid_targets_min": 1372
},
{
"epoch": 2.2093023255813953,
"grad_norm": 0.6020826429693371,
"learning_rate": 3.4616454498359306e-05,
"loss": 0.3047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29343247413635254,
"step": 1235,
"valid_targets_mean": 3196.5,
"valid_targets_min": 1524
},
{
"epoch": 2.21824686940966,
"grad_norm": 0.5403496852716332,
"learning_rate": 3.4555407559464825e-05,
"loss": 0.3081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3097769618034363,
"step": 1240,
"valid_targets_mean": 4774.0,
"valid_targets_min": 1541
},
{
"epoch": 2.2271914132379247,
"grad_norm": 0.5120840671547888,
"learning_rate": 3.4494070932004274e-05,
"loss": 0.3015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.284509539604187,
"step": 1245,
"valid_targets_mean": 4208.5,
"valid_targets_min": 1295
},
{
"epoch": 2.23613595706619,
"grad_norm": 0.5914343254506964,
"learning_rate": 3.4432445836728055e-05,
"loss": 0.2834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2789539694786072,
"step": 1250,
"valid_targets_mean": 4127.3,
"valid_targets_min": 872
},
{
"epoch": 2.2450805008944545,
"grad_norm": 0.5645415624490583,
"learning_rate": 3.4370533500127794e-05,
"loss": 0.3038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30053240060806274,
"step": 1255,
"valid_targets_mean": 3852.9,
"valid_targets_min": 1580
},
{
"epoch": 2.2540250447227193,
"grad_norm": 0.5806828746585898,
"learning_rate": 3.430833515441193e-05,
"loss": 0.3006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31069332361221313,
"step": 1260,
"valid_targets_mean": 3907.2,
"valid_targets_min": 1436
},
{
"epoch": 2.262969588550984,
"grad_norm": 0.5626831319283796,
"learning_rate": 3.424585203748119e-05,
"loss": 0.3021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3043138086795807,
"step": 1265,
"valid_targets_mean": 4106.3,
"valid_targets_min": 1718
},
{
"epoch": 2.2719141323792487,
"grad_norm": 0.5419828214534085,
"learning_rate": 3.4183085392903965e-05,
"loss": 0.285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28403908014297485,
"step": 1270,
"valid_targets_mean": 3841.6,
"valid_targets_min": 1794
},
{
"epoch": 2.2808586762075134,
"grad_norm": 0.5881372643406569,
"learning_rate": 3.41200364698915e-05,
"loss": 0.2899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30241650342941284,
"step": 1275,
"valid_targets_mean": 3480.4,
"valid_targets_min": 1784
},
{
"epoch": 2.289803220035778,
"grad_norm": 0.5027336153791081,
"learning_rate": 3.405670652327313e-05,
"loss": 0.3028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28809165954589844,
"step": 1280,
"valid_targets_mean": 4556.8,
"valid_targets_min": 2196
},
{
"epoch": 2.298747763864043,
"grad_norm": 0.5959906299682153,
"learning_rate": 3.399309681347123e-05,
"loss": 0.2956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.305059552192688,
"step": 1285,
"valid_targets_mean": 4217.6,
"valid_targets_min": 1517
},
{
"epoch": 2.3076923076923075,
"grad_norm": 0.47359707150452485,
"learning_rate": 3.392920860647617e-05,
"loss": 0.2975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3012004792690277,
"step": 1290,
"valid_targets_mean": 4578.0,
"valid_targets_min": 1297
},
{
"epoch": 2.3166368515205726,
"grad_norm": 0.5369785466687547,
"learning_rate": 3.3865043173821074e-05,
"loss": 0.2854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2727619409561157,
"step": 1295,
"valid_targets_mean": 3760.1,
"valid_targets_min": 1539
},
{
"epoch": 2.3255813953488373,
"grad_norm": 0.57676869627547,
"learning_rate": 3.380060179255656e-05,
"loss": 0.3036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31669068336486816,
"step": 1300,
"valid_targets_mean": 3117.1,
"valid_targets_min": 1662
},
{
"epoch": 2.334525939177102,
"grad_norm": 0.5283474540373422,
"learning_rate": 3.37358857452253e-05,
"loss": 0.3005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.303724467754364,
"step": 1305,
"valid_targets_mean": 4069.7,
"valid_targets_min": 1847
},
{
"epoch": 2.3434704830053668,
"grad_norm": 0.48205035846371097,
"learning_rate": 3.367089631983651e-05,
"loss": 0.3018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27161988615989685,
"step": 1310,
"valid_targets_mean": 4610.1,
"valid_targets_min": 625
},
{
"epoch": 2.3524150268336315,
"grad_norm": 0.5018852845147292,
"learning_rate": 3.360563480984029e-05,
"loss": 0.2908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2748308479785919,
"step": 1315,
"valid_targets_mean": 4035.2,
"valid_targets_min": 1483
},
{
"epoch": 2.361359570661896,
"grad_norm": 0.6082741514089518,
"learning_rate": 3.3540102514101904e-05,
"loss": 0.3009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2947337031364441,
"step": 1320,
"valid_targets_mean": 3258.3,
"valid_targets_min": 863
},
{
"epoch": 2.370304114490161,
"grad_norm": 0.5119247145544926,
"learning_rate": 3.347430073687592e-05,
"loss": 0.3057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3057720363140106,
"step": 1325,
"valid_targets_mean": 5325.2,
"valid_targets_min": 2447
},
{
"epoch": 2.3792486583184256,
"grad_norm": 0.5545132272446245,
"learning_rate": 3.340823078778024e-05,
"loss": 0.2904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.329643577337265,
"step": 1330,
"valid_targets_mean": 4703.9,
"valid_targets_min": 822
},
{
"epoch": 2.3881932021466907,
"grad_norm": 0.5611524701506613,
"learning_rate": 3.3341893981770086e-05,
"loss": 0.2999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28520113229751587,
"step": 1335,
"valid_targets_mean": 3347.0,
"valid_targets_min": 1432
},
{
"epoch": 2.3971377459749554,
"grad_norm": 0.5360100187741607,
"learning_rate": 3.327529163911174e-05,
"loss": 0.29,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27396950125694275,
"step": 1340,
"valid_targets_mean": 4146.1,
"valid_targets_min": 1777
},
{
"epoch": 2.40608228980322,
"grad_norm": 0.5232182650009217,
"learning_rate": 3.320842508535636e-05,
"loss": 0.3023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.294733464717865,
"step": 1345,
"valid_targets_mean": 3978.9,
"valid_targets_min": 1969
},
{
"epoch": 2.415026833631485,
"grad_norm": 0.6341635562060696,
"learning_rate": 3.314129565131355e-05,
"loss": 0.3001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2832929491996765,
"step": 1350,
"valid_targets_mean": 3560.1,
"valid_targets_min": 1561
},
{
"epoch": 2.4239713774597496,
"grad_norm": 0.5512350224651154,
"learning_rate": 3.3073904673024854e-05,
"loss": 0.3018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2930479943752289,
"step": 1355,
"valid_targets_mean": 4085.1,
"valid_targets_min": 1762
},
{
"epoch": 2.4329159212880143,
"grad_norm": 0.5089586101245678,
"learning_rate": 3.300625349173723e-05,
"loss": 0.2983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.304643452167511,
"step": 1360,
"valid_targets_mean": 4801.9,
"valid_targets_min": 1725
},
{
"epoch": 2.441860465116279,
"grad_norm": 0.5712139371917907,
"learning_rate": 3.29383434538763e-05,
"loss": 0.2893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.290343314409256,
"step": 1365,
"valid_targets_mean": 4540.5,
"valid_targets_min": 1504
},
{
"epoch": 2.4508050089445437,
"grad_norm": 0.6223435319453212,
"learning_rate": 3.287017591101957e-05,
"loss": 0.3061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3304898738861084,
"step": 1370,
"valid_targets_mean": 3340.2,
"valid_targets_min": 1231
},
{
"epoch": 2.4597495527728084,
"grad_norm": 0.548835445285655,
"learning_rate": 3.2801752219869536e-05,
"loss": 0.2962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29954493045806885,
"step": 1375,
"valid_targets_mean": 3768.6,
"valid_targets_min": 1507
},
{
"epoch": 2.4686940966010735,
"grad_norm": 0.5273857106581554,
"learning_rate": 3.273307374222667e-05,
"loss": 0.2956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29336017370224,
"step": 1380,
"valid_targets_mean": 3922.8,
"valid_targets_min": 527
},
{
"epoch": 2.4776386404293382,
"grad_norm": 0.461716385493086,
"learning_rate": 3.266414184496233e-05,
"loss": 0.2867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29551392793655396,
"step": 1385,
"valid_targets_mean": 4960.4,
"valid_targets_min": 1853
},
{
"epoch": 2.486583184257603,
"grad_norm": 0.5233231328137401,
"learning_rate": 3.2594957899991566e-05,
"loss": 0.3022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30951058864593506,
"step": 1390,
"valid_targets_mean": 4894.6,
"valid_targets_min": 1705
},
{
"epoch": 2.4955277280858676,
"grad_norm": 0.5483474982667876,
"learning_rate": 3.2525523284245766e-05,
"loss": 0.2837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2956357002258301,
"step": 1395,
"valid_targets_mean": 4093.8,
"valid_targets_min": 1158
},
{
"epoch": 2.5044722719141324,
"grad_norm": 0.5470117760522922,
"learning_rate": 3.245583937964532e-05,
"loss": 0.2757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29229462146759033,
"step": 1400,
"valid_targets_mean": 4277.4,
"valid_targets_min": 1526
},
{
"epoch": 2.513416815742397,
"grad_norm": 0.5692210997559785,
"learning_rate": 3.238590757307206e-05,
"loss": 0.2907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28669655323028564,
"step": 1405,
"valid_targets_mean": 4107.9,
"valid_targets_min": 2476
},
{
"epoch": 2.5223613595706618,
"grad_norm": 0.5999394928447368,
"learning_rate": 3.2315729256341686e-05,
"loss": 0.3037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3192169666290283,
"step": 1410,
"valid_targets_mean": 3115.0,
"valid_targets_min": 482
},
{
"epoch": 2.531305903398927,
"grad_norm": 0.5067438226356301,
"learning_rate": 3.2245305826176063e-05,
"loss": 0.2978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30782514810562134,
"step": 1415,
"valid_targets_mean": 4176.4,
"valid_targets_min": 1489
},
{
"epoch": 2.5402504472271916,
"grad_norm": 0.5670153939929208,
"learning_rate": 3.217463868417541e-05,
"loss": 0.2904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2898740768432617,
"step": 1420,
"valid_targets_mean": 4424.1,
"valid_targets_min": 877
},
{
"epoch": 2.5491949910554563,
"grad_norm": 0.5320142185017729,
"learning_rate": 3.2103729236790434e-05,
"loss": 0.292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3135606646537781,
"step": 1425,
"valid_targets_mean": 4807.0,
"valid_targets_min": 1759
},
{
"epoch": 2.558139534883721,
"grad_norm": 0.5377685633015429,
"learning_rate": 3.203257889529428e-05,
"loss": 0.3005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3080807626247406,
"step": 1430,
"valid_targets_mean": 4145.8,
"valid_targets_min": 1470
},
{
"epoch": 2.5670840787119857,
"grad_norm": 0.9791809632288329,
"learning_rate": 3.196118907575452e-05,
"loss": 0.3046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32376378774642944,
"step": 1435,
"valid_targets_mean": 2997.5,
"valid_targets_min": 1849
},
{
"epoch": 2.5760286225402504,
"grad_norm": 0.5199580890989173,
"learning_rate": 3.188956119900491e-05,
"loss": 0.2942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27378737926483154,
"step": 1440,
"valid_targets_mean": 3816.5,
"valid_targets_min": 835
},
{
"epoch": 2.584973166368515,
"grad_norm": 0.5360826743649624,
"learning_rate": 3.181769669061713e-05,
"loss": 0.2917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3072686791419983,
"step": 1445,
"valid_targets_mean": 3774.3,
"valid_targets_min": 529
},
{
"epoch": 2.59391771019678,
"grad_norm": 0.5009124650640604,
"learning_rate": 3.174559698087244e-05,
"loss": 0.3046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2810012698173523,
"step": 1450,
"valid_targets_mean": 3802.2,
"valid_targets_min": 1494
},
{
"epoch": 2.6028622540250446,
"grad_norm": 0.5463511449260107,
"learning_rate": 3.1673263504733136e-05,
"loss": 0.2966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28489333391189575,
"step": 1455,
"valid_targets_mean": 3726.8,
"valid_targets_min": 737
},
{
"epoch": 2.6118067978533093,
"grad_norm": 0.6037481930684999,
"learning_rate": 3.160069770181411e-05,
"loss": 0.2875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3057287335395813,
"step": 1460,
"valid_targets_mean": 3358.2,
"valid_targets_min": 1491
},
{
"epoch": 2.620751341681574,
"grad_norm": 0.504749731879137,
"learning_rate": 3.152790101635408e-05,
"loss": 0.2903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2742614150047302,
"step": 1465,
"valid_targets_mean": 4562.9,
"valid_targets_min": 710
},
{
"epoch": 2.629695885509839,
"grad_norm": 0.5501576116598611,
"learning_rate": 3.145487489718692e-05,
"loss": 0.3005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29383790493011475,
"step": 1470,
"valid_targets_mean": 4014.8,
"valid_targets_min": 1590
},
{
"epoch": 2.638640429338104,
"grad_norm": 0.6055643551418105,
"learning_rate": 3.138162079771278e-05,
"loss": 0.2971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30859410762786865,
"step": 1475,
"valid_targets_mean": 3838.2,
"valid_targets_min": 1093
},
{
"epoch": 2.6475849731663685,
"grad_norm": 0.6069047010077838,
"learning_rate": 3.1308140175869216e-05,
"loss": 0.2978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29912006855010986,
"step": 1480,
"valid_targets_mean": 3958.1,
"valid_targets_min": 1677
},
{
"epoch": 2.6565295169946332,
"grad_norm": 0.5738673372037972,
"learning_rate": 3.123443449410211e-05,
"loss": 0.291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29722023010253906,
"step": 1485,
"valid_targets_mean": 3427.4,
"valid_targets_min": 527
},
{
"epoch": 2.665474060822898,
"grad_norm": 0.5133193729173582,
"learning_rate": 3.1160505219336594e-05,
"loss": 0.3037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26430267095565796,
"step": 1490,
"valid_targets_mean": 4530.4,
"valid_targets_min": 1263
},
{
"epoch": 2.6744186046511627,
"grad_norm": 0.5734809599747189,
"learning_rate": 3.108635382294787e-05,
"loss": 0.2919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2972019910812378,
"step": 1495,
"valid_targets_mean": 3677.4,
"valid_targets_min": 1602
},
{
"epoch": 2.683363148479428,
"grad_norm": 0.5428678152914708,
"learning_rate": 3.101198178073189e-05,
"loss": 0.2907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2788999080657959,
"step": 1500,
"valid_targets_mean": 4050.4,
"valid_targets_min": 1841
},
{
"epoch": 2.6923076923076925,
"grad_norm": 0.5346131939463955,
"learning_rate": 3.093739057287603e-05,
"loss": 0.2943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3178672790527344,
"step": 1505,
"valid_targets_mean": 4216.1,
"valid_targets_min": 2013
},
{
"epoch": 2.701252236135957,
"grad_norm": 0.5546663057017248,
"learning_rate": 3.086258168392957e-05,
"loss": 0.2927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2941766381263733,
"step": 1510,
"valid_targets_mean": 4037.4,
"valid_targets_min": 2094
},
{
"epoch": 2.710196779964222,
"grad_norm": 0.6007631310576768,
"learning_rate": 3.0787556602774195e-05,
"loss": 0.2995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3104172348976135,
"step": 1515,
"valid_targets_mean": 3226.3,
"valid_targets_min": 699
},
{
"epoch": 2.7191413237924866,
"grad_norm": 0.5246652173150378,
"learning_rate": 3.071231682259437e-05,
"loss": 0.2993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31006383895874023,
"step": 1520,
"valid_targets_mean": 3979.1,
"valid_targets_min": 1929
},
{
"epoch": 2.7280858676207513,
"grad_norm": 0.4917003682982894,
"learning_rate": 3.063686384084756e-05,
"loss": 0.2894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3010290265083313,
"step": 1525,
"valid_targets_mean": 4885.2,
"valid_targets_min": 1695
},
{
"epoch": 2.737030411449016,
"grad_norm": 0.5164120363148196,
"learning_rate": 3.05611991592345e-05,
"loss": 0.292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28511500358581543,
"step": 1530,
"valid_targets_mean": 4332.8,
"valid_targets_min": 2130
},
{
"epoch": 2.7459749552772807,
"grad_norm": 0.546710521171786,
"learning_rate": 3.0485324283669288e-05,
"loss": 0.2976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2977195382118225,
"step": 1535,
"valid_targets_mean": 3932.6,
"valid_targets_min": 835
},
{
"epoch": 2.7549194991055455,
"grad_norm": 0.4987699796804533,
"learning_rate": 3.0409240724249334e-05,
"loss": 0.2974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28613370656967163,
"step": 1540,
"valid_targets_mean": 4534.4,
"valid_targets_min": 932
},
{
"epoch": 2.76386404293381,
"grad_norm": 0.5318282523003093,
"learning_rate": 3.033294999522545e-05,
"loss": 0.291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29021310806274414,
"step": 1545,
"valid_targets_mean": 4185.5,
"valid_targets_min": 1805
},
{
"epoch": 2.772808586762075,
"grad_norm": 0.5878956920224669,
"learning_rate": 3.0256453614971594e-05,
"loss": 0.3034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2993810772895813,
"step": 1550,
"valid_targets_mean": 3415.2,
"valid_targets_min": 715
},
{
"epoch": 2.78175313059034,
"grad_norm": 0.5178111135961665,
"learning_rate": 3.017975310595469e-05,
"loss": 0.3122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32516568899154663,
"step": 1555,
"valid_targets_mean": 4719.7,
"valid_targets_min": 2013
},
{
"epoch": 2.7906976744186047,
"grad_norm": 0.5581315425684471,
"learning_rate": 3.0102849994704343e-05,
"loss": 0.3007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2962647080421448,
"step": 1560,
"valid_targets_mean": 3870.3,
"valid_targets_min": 1774
},
{
"epoch": 2.7996422182468694,
"grad_norm": 0.6256471631470097,
"learning_rate": 3.0025745811782444e-05,
"loss": 0.3041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29967325925827026,
"step": 1565,
"valid_targets_mean": 3177.1,
"valid_targets_min": 772
},
{
"epoch": 2.808586762075134,
"grad_norm": 0.5320691282381641,
"learning_rate": 2.994844209175269e-05,
"loss": 0.2977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.331190824508667,
"step": 1570,
"valid_targets_mean": 4638.9,
"valid_targets_min": 1626
},
{
"epoch": 2.817531305903399,
"grad_norm": 0.6752470008469027,
"learning_rate": 2.987094037315008e-05,
"loss": 0.2964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3196222186088562,
"step": 1575,
"valid_targets_mean": 2458.3,
"valid_targets_min": 658
},
{
"epoch": 2.8264758497316635,
"grad_norm": 0.5531523191801033,
"learning_rate": 2.9793242198450258e-05,
"loss": 0.2781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28398263454437256,
"step": 1580,
"valid_targets_mean": 4128.9,
"valid_targets_min": 1775
},
{
"epoch": 2.8354203935599287,
"grad_norm": 0.5237471309819827,
"learning_rate": 2.9715349114038825e-05,
"loss": 0.2842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2685989737510681,
"step": 1585,
"valid_targets_mean": 5779.9,
"valid_targets_min": 1305
},
{
"epoch": 2.8443649373881934,
"grad_norm": 0.47372842550809013,
"learning_rate": 2.9637262670180597e-05,
"loss": 0.2924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29568806290626526,
"step": 1590,
"valid_targets_mean": 4608.0,
"valid_targets_min": 607
},
{
"epoch": 2.853309481216458,
"grad_norm": 0.5192555722225825,
"learning_rate": 2.955898442098869e-05,
"loss": 0.2932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28541460633277893,
"step": 1595,
"valid_targets_mean": 4063.2,
"valid_targets_min": 919
},
{
"epoch": 2.862254025044723,
"grad_norm": 0.5309547559574028,
"learning_rate": 2.948051592439363e-05,
"loss": 0.2887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31091922521591187,
"step": 1600,
"valid_targets_mean": 3888.9,
"valid_targets_min": 823
},
{
"epoch": 2.8711985688729875,
"grad_norm": 0.5461932654893836,
"learning_rate": 2.9401858742112334e-05,
"loss": 0.2952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30643460154533386,
"step": 1605,
"valid_targets_mean": 3989.2,
"valid_targets_min": 1666
},
{
"epoch": 2.8801431127012522,
"grad_norm": 0.5151199812668427,
"learning_rate": 2.9323014439617044e-05,
"loss": 0.2969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3191748559474945,
"step": 1610,
"valid_targets_mean": 4541.9,
"valid_targets_min": 2209
},
{
"epoch": 2.889087656529517,
"grad_norm": 0.452227709754697,
"learning_rate": 2.924398458610414e-05,
"loss": 0.2677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23286093771457672,
"step": 1615,
"valid_targets_mean": 4696.9,
"valid_targets_min": 2143
},
{
"epoch": 2.8980322003577816,
"grad_norm": 0.5294903977491242,
"learning_rate": 2.9164770754462926e-05,
"loss": 0.2983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27453750371932983,
"step": 1620,
"valid_targets_mean": 4409.6,
"valid_targets_min": 2448
},
{
"epoch": 2.9069767441860463,
"grad_norm": 0.5116227108871184,
"learning_rate": 2.9085374521244333e-05,
"loss": 0.2839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2921096682548523,
"step": 1625,
"valid_targets_mean": 4203.6,
"valid_targets_min": 774
},
{
"epoch": 2.915921288014311,
"grad_norm": 0.8886084421935505,
"learning_rate": 2.900579746662954e-05,
"loss": 0.2994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2785966992378235,
"step": 1630,
"valid_targets_mean": 4256.9,
"valid_targets_min": 1439
},
{
"epoch": 2.9248658318425758,
"grad_norm": 0.5165202216086147,
"learning_rate": 2.8926041174398496e-05,
"loss": 0.2903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2874126434326172,
"step": 1635,
"valid_targets_mean": 3910.6,
"valid_targets_min": 1567
},
{
"epoch": 2.933810375670841,
"grad_norm": 0.5227694759657353,
"learning_rate": 2.8846107231898445e-05,
"loss": 0.2982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2759662866592407,
"step": 1640,
"valid_targets_mean": 3917.8,
"valid_targets_min": 928
},
{
"epoch": 2.9427549194991056,
"grad_norm": 0.610425871678501,
"learning_rate": 2.8765997230012295e-05,
"loss": 0.2952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28333795070648193,
"step": 1645,
"valid_targets_mean": 4170.1,
"valid_targets_min": 2193
},
{
"epoch": 2.9516994633273703,
"grad_norm": 0.46116236306935077,
"learning_rate": 2.868571276312698e-05,
"loss": 0.2866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28075987100601196,
"step": 1650,
"valid_targets_mean": 4360.5,
"valid_targets_min": 1737
},
{
"epoch": 2.960644007155635,
"grad_norm": 0.5095418283669151,
"learning_rate": 2.860525542910171e-05,
"loss": 0.2839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2718711495399475,
"step": 1655,
"valid_targets_mean": 3928.2,
"valid_targets_min": 1604
},
{
"epoch": 2.9695885509838997,
"grad_norm": 0.5085610495904306,
"learning_rate": 2.852462682923619e-05,
"loss": 0.2815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2917214334011078,
"step": 1660,
"valid_targets_mean": 3901.8,
"valid_targets_min": 1275
},
{
"epoch": 2.9785330948121644,
"grad_norm": 0.5658892685832217,
"learning_rate": 2.844382856823872e-05,
"loss": 0.2934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29110509157180786,
"step": 1665,
"valid_targets_mean": 3285.5,
"valid_targets_min": 690
},
{
"epoch": 2.9874776386404296,
"grad_norm": 0.6573066368722159,
"learning_rate": 2.8362862254194298e-05,
"loss": 0.29,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28502312302589417,
"step": 1670,
"valid_targets_mean": 4089.2,
"valid_targets_min": 787
},
{
"epoch": 2.9964221824686943,
"grad_norm": 0.5079392607819926,
"learning_rate": 2.8281729498532574e-05,
"loss": 0.312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3002755045890808,
"step": 1675,
"valid_targets_mean": 4365.2,
"valid_targets_min": 1049
},
{
"epoch": 3.005366726296959,
"grad_norm": 0.5393232205748715,
"learning_rate": 2.8200431915995805e-05,
"loss": 0.2826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28886353969573975,
"step": 1680,
"valid_targets_mean": 3904.8,
"valid_targets_min": 863
},
{
"epoch": 3.0143112701252237,
"grad_norm": 0.5476424824827836,
"learning_rate": 2.8118971124606712e-05,
"loss": 0.2629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2710658311843872,
"step": 1685,
"valid_targets_mean": 4062.5,
"valid_targets_min": 2017
},
{
"epoch": 3.0232558139534884,
"grad_norm": 0.606499437576894,
"learning_rate": 2.8037348745636274e-05,
"loss": 0.2872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2897275388240814,
"step": 1690,
"valid_targets_mean": 3168.9,
"valid_targets_min": 1034
},
{
"epoch": 3.032200357781753,
"grad_norm": 0.5222073176909986,
"learning_rate": 2.7955566403571464e-05,
"loss": 0.2845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26425305008888245,
"step": 1695,
"valid_targets_mean": 4216.6,
"valid_targets_min": 1906
},
{
"epoch": 3.041144901610018,
"grad_norm": 0.533081866038887,
"learning_rate": 2.78736257260829e-05,
"loss": 0.2724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2789760231971741,
"step": 1700,
"valid_targets_mean": 4355.0,
"valid_targets_min": 1674
},
{
"epoch": 3.0500894454382825,
"grad_norm": 0.5395830050252504,
"learning_rate": 2.7791528343992494e-05,
"loss": 0.2914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2874540090560913,
"step": 1705,
"valid_targets_mean": 3905.8,
"valid_targets_min": 1662
},
{
"epoch": 3.0590339892665472,
"grad_norm": 0.5327375583639009,
"learning_rate": 2.7709275891240936e-05,
"loss": 0.2751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2773253917694092,
"step": 1710,
"valid_targets_mean": 3790.8,
"valid_targets_min": 1228
},
{
"epoch": 3.067978533094812,
"grad_norm": 0.5332213202740119,
"learning_rate": 2.7626870004855236e-05,
"loss": 0.2732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2752811312675476,
"step": 1715,
"valid_targets_mean": 4314.0,
"valid_targets_min": 2290
},
{
"epoch": 3.076923076923077,
"grad_norm": 0.5771000275440432,
"learning_rate": 2.7544312324916088e-05,
"loss": 0.2824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3129065930843353,
"step": 1720,
"valid_targets_mean": 3639.2,
"valid_targets_min": 1703
},
{
"epoch": 3.085867620751342,
"grad_norm": 0.4926160303249595,
"learning_rate": 2.7461604494525257e-05,
"loss": 0.2681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27431702613830566,
"step": 1725,
"valid_targets_mean": 4959.2,
"valid_targets_min": 1500
},
{
"epoch": 3.0948121645796065,
"grad_norm": 0.5440762244035418,
"learning_rate": 2.7378748159772888e-05,
"loss": 0.2668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2572042942047119,
"step": 1730,
"valid_targets_mean": 3845.3,
"valid_targets_min": 867
},
{
"epoch": 3.103756708407871,
"grad_norm": 0.5468975063253847,
"learning_rate": 2.7295744969704725e-05,
"loss": 0.2654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2830193340778351,
"step": 1735,
"valid_targets_mean": 3994.4,
"valid_targets_min": 793
},
{
"epoch": 3.112701252236136,
"grad_norm": 0.5247791983633943,
"learning_rate": 2.7212596576289264e-05,
"loss": 0.2749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25497889518737793,
"step": 1740,
"valid_targets_mean": 3932.6,
"valid_targets_min": 867
},
{
"epoch": 3.1216457960644006,
"grad_norm": 0.5097180897051293,
"learning_rate": 2.712930463438496e-05,
"loss": 0.2764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2678571343421936,
"step": 1745,
"valid_targets_mean": 4393.1,
"valid_targets_min": 1763
},
{
"epoch": 3.1305903398926653,
"grad_norm": 0.5054371550866157,
"learning_rate": 2.7045870801707194e-05,
"loss": 0.2761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2683069109916687,
"step": 1750,
"valid_targets_mean": 4437.9,
"valid_targets_min": 1725
},
{
"epoch": 3.13953488372093,
"grad_norm": 0.5389786007076532,
"learning_rate": 2.6962296738795344e-05,
"loss": 0.2906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29220160841941833,
"step": 1755,
"valid_targets_mean": 4123.8,
"valid_targets_min": 579
},
{
"epoch": 3.148479427549195,
"grad_norm": 0.5762090201207496,
"learning_rate": 2.687858410897971e-05,
"loss": 0.2636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25318244099617004,
"step": 1760,
"valid_targets_mean": 3570.9,
"valid_targets_min": 743
},
{
"epoch": 3.15742397137746,
"grad_norm": 0.5279696697699028,
"learning_rate": 2.679473457834842e-05,
"loss": 0.2916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29287105798721313,
"step": 1765,
"valid_targets_mean": 4093.7,
"valid_targets_min": 2342
},
{
"epoch": 3.1663685152057246,
"grad_norm": 0.6183882195312416,
"learning_rate": 2.6710749815714262e-05,
"loss": 0.2707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26889514923095703,
"step": 1770,
"valid_targets_mean": 3194.8,
"valid_targets_min": 676
},
{
"epoch": 3.1753130590339893,
"grad_norm": 0.5656736312850078,
"learning_rate": 2.6626631492581475e-05,
"loss": 0.2834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28966403007507324,
"step": 1775,
"valid_targets_mean": 3782.7,
"valid_targets_min": 1258
},
{
"epoch": 3.184257602862254,
"grad_norm": 0.5484222792379775,
"learning_rate": 2.654238128311249e-05,
"loss": 0.2845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2807530164718628,
"step": 1780,
"valid_targets_mean": 3794.1,
"valid_targets_min": 1944
},
{
"epoch": 3.1932021466905187,
"grad_norm": 0.5453822622258856,
"learning_rate": 2.645800086409458e-05,
"loss": 0.2761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2747189402580261,
"step": 1785,
"valid_targets_mean": 4427.3,
"valid_targets_min": 1608
},
{
"epoch": 3.2021466905187834,
"grad_norm": 0.5001051263184161,
"learning_rate": 2.637349191490654e-05,
"loss": 0.2796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2797410488128662,
"step": 1790,
"valid_targets_mean": 4777.8,
"valid_targets_min": 2640
},
{
"epoch": 3.211091234347048,
"grad_norm": 0.5575267617456836,
"learning_rate": 2.6288856117485216e-05,
"loss": 0.2896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.298971951007843,
"step": 1795,
"valid_targets_mean": 4380.4,
"valid_targets_min": 1213
},
{
"epoch": 3.220035778175313,
"grad_norm": 0.5382921298878789,
"learning_rate": 2.6204095156292048e-05,
"loss": 0.2644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26511919498443604,
"step": 1800,
"valid_targets_mean": 4108.1,
"valid_targets_min": 2044
},
{
"epoch": 3.228980322003578,
"grad_norm": 0.5252112327673899,
"learning_rate": 2.6119210718279538e-05,
"loss": 0.2798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28953590989112854,
"step": 1805,
"valid_targets_mean": 4361.9,
"valid_targets_min": 1299
},
{
"epoch": 3.2379248658318427,
"grad_norm": 0.5410954452724649,
"learning_rate": 2.60342044928577e-05,
"loss": 0.2808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30843818187713623,
"step": 1810,
"valid_targets_mean": 4546.8,
"valid_targets_min": 1329
},
{
"epoch": 3.2468694096601074,
"grad_norm": 0.581674111347238,
"learning_rate": 2.5949078171860395e-05,
"loss": 0.2845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30058762431144714,
"step": 1815,
"valid_targets_mean": 3899.8,
"valid_targets_min": 763
},
{
"epoch": 3.255813953488372,
"grad_norm": 0.5237279678403152,
"learning_rate": 2.5863833449511706e-05,
"loss": 0.2649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27064049243927,
"step": 1820,
"valid_targets_mean": 4455.4,
"valid_targets_min": 1818
},
{
"epoch": 3.264758497316637,
"grad_norm": 0.5533963196851126,
"learning_rate": 2.5778472022392184e-05,
"loss": 0.2757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2702397108078003,
"step": 1825,
"valid_targets_mean": 4271.4,
"valid_targets_min": 2002
},
{
"epoch": 3.2737030411449015,
"grad_norm": 0.5313362157055852,
"learning_rate": 2.5692995589405087e-05,
"loss": 0.2906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2803131341934204,
"step": 1830,
"valid_targets_mean": 4208.0,
"valid_targets_min": 1639
},
{
"epoch": 3.282647584973166,
"grad_norm": 0.5541192810579373,
"learning_rate": 2.5607405851742578e-05,
"loss": 0.2786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2655271291732788,
"step": 1835,
"valid_targets_mean": 4423.6,
"valid_targets_min": 1631
},
{
"epoch": 3.2915921288014314,
"grad_norm": 0.581829811898252,
"learning_rate": 2.5521704512851884e-05,
"loss": 0.2836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28082770109176636,
"step": 1840,
"valid_targets_mean": 3964.4,
"valid_targets_min": 1481
},
{
"epoch": 3.300536672629696,
"grad_norm": 0.5564304499542477,
"learning_rate": 2.5435893278401328e-05,
"loss": 0.2768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2610231637954712,
"step": 1845,
"valid_targets_mean": 3748.6,
"valid_targets_min": 1052
},
{
"epoch": 3.309481216457961,
"grad_norm": 0.5890948907758241,
"learning_rate": 2.534997385624647e-05,
"loss": 0.2651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2398790717124939,
"step": 1850,
"valid_targets_mean": 3603.0,
"valid_targets_min": 552
},
{
"epoch": 3.3184257602862255,
"grad_norm": 0.563595381422207,
"learning_rate": 2.5263947956396043e-05,
"loss": 0.2768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2689689099788666,
"step": 1855,
"valid_targets_mean": 3884.8,
"valid_targets_min": 922
},
{
"epoch": 3.32737030411449,
"grad_norm": 0.5202754657752621,
"learning_rate": 2.5177817290977967e-05,
"loss": 0.275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2853309214115143,
"step": 1860,
"valid_targets_mean": 4258.4,
"valid_targets_min": 1557
},
{
"epoch": 3.336314847942755,
"grad_norm": 0.5125955462826816,
"learning_rate": 2.5091583574205247e-05,
"loss": 0.2813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26263585686683655,
"step": 1865,
"valid_targets_mean": 4235.4,
"valid_targets_min": 2097
},
{
"epoch": 3.3452593917710196,
"grad_norm": 0.5366296714092318,
"learning_rate": 2.5005248522341868e-05,
"loss": 0.2741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2572114169597626,
"step": 1870,
"valid_targets_mean": 3658.3,
"valid_targets_min": 1843
},
{
"epoch": 3.3542039355992843,
"grad_norm": 0.5473866663101812,
"learning_rate": 2.4918813853668632e-05,
"loss": 0.2807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2796470522880554,
"step": 1875,
"valid_targets_mean": 3708.9,
"valid_targets_min": 1482
},
{
"epoch": 3.363148479427549,
"grad_norm": 0.5566454634749927,
"learning_rate": 2.483228128844896e-05,
"loss": 0.2715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2780247926712036,
"step": 1880,
"valid_targets_mean": 3811.8,
"valid_targets_min": 842
},
{
"epoch": 3.3720930232558137,
"grad_norm": 0.5573845593232436,
"learning_rate": 2.4745652548894654e-05,
"loss": 0.273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2704911231994629,
"step": 1885,
"valid_targets_mean": 4766.7,
"valid_targets_min": 2080
},
{
"epoch": 3.381037567084079,
"grad_norm": 0.5104062442322098,
"learning_rate": 2.4658929359131634e-05,
"loss": 0.273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2546011209487915,
"step": 1890,
"valid_targets_mean": 4313.2,
"valid_targets_min": 993
},
{
"epoch": 3.3899821109123436,
"grad_norm": 0.6120011359863383,
"learning_rate": 2.4572113445165603e-05,
"loss": 0.2944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29367899894714355,
"step": 1895,
"valid_targets_mean": 3432.7,
"valid_targets_min": 758
},
{
"epoch": 3.3989266547406083,
"grad_norm": 0.5470654579653317,
"learning_rate": 2.4485206534847706e-05,
"loss": 0.2786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2764478921890259,
"step": 1900,
"valid_targets_mean": 3888.6,
"valid_targets_min": 1597
},
{
"epoch": 3.407871198568873,
"grad_norm": 0.5631697298734966,
"learning_rate": 2.439821035784014e-05,
"loss": 0.2801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29474952816963196,
"step": 1905,
"valid_targets_mean": 3846.1,
"valid_targets_min": 1665
},
{
"epoch": 3.4168157423971377,
"grad_norm": 0.522999992256365,
"learning_rate": 2.431112664558173e-05,
"loss": 0.2704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2620839476585388,
"step": 1910,
"valid_targets_mean": 3582.1,
"valid_targets_min": 1304
},
{
"epoch": 3.4257602862254024,
"grad_norm": 0.49262352099697787,
"learning_rate": 2.4223957131253467e-05,
"loss": 0.2743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26315534114837646,
"step": 1915,
"valid_targets_mean": 4538.1,
"valid_targets_min": 2028
},
{
"epoch": 3.434704830053667,
"grad_norm": 0.5515685545090246,
"learning_rate": 2.4136703549744028e-05,
"loss": 0.2888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2935299873352051,
"step": 1920,
"valid_targets_mean": 4080.0,
"valid_targets_min": 794
},
{
"epoch": 3.4436493738819323,
"grad_norm": 0.48476650247349296,
"learning_rate": 2.4049367637615215e-05,
"loss": 0.2964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2544916272163391,
"step": 1925,
"valid_targets_mean": 4508.7,
"valid_targets_min": 1366
},
{
"epoch": 3.452593917710197,
"grad_norm": 0.4860033907502521,
"learning_rate": 2.396195113306742e-05,
"loss": 0.2764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2550594210624695,
"step": 1930,
"valid_targets_mean": 4433.0,
"valid_targets_min": 1985
},
{
"epoch": 3.4615384615384617,
"grad_norm": 0.5353229674635286,
"learning_rate": 2.3874455775905036e-05,
"loss": 0.2666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2665395736694336,
"step": 1935,
"valid_targets_mean": 3745.3,
"valid_targets_min": 937
},
{
"epoch": 3.4704830053667264,
"grad_norm": 0.5901472498319702,
"learning_rate": 2.3786883307501794e-05,
"loss": 0.2822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29798996448516846,
"step": 1940,
"valid_targets_mean": 4030.6,
"valid_targets_min": 1812
},
{
"epoch": 3.479427549194991,
"grad_norm": 0.5296365133279529,
"learning_rate": 2.3699235470766147e-05,
"loss": 0.2778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2898460030555725,
"step": 1945,
"valid_targets_mean": 4661.3,
"valid_targets_min": 2092
},
{
"epoch": 3.488372093023256,
"grad_norm": 0.6738643909015106,
"learning_rate": 2.3611514010106564e-05,
"loss": 0.2818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2727169990539551,
"step": 1950,
"valid_targets_mean": 4183.0,
"valid_targets_min": 1207
},
{
"epoch": 3.4973166368515205,
"grad_norm": 0.5074455770952165,
"learning_rate": 2.35237206713968e-05,
"loss": 0.265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24378815293312073,
"step": 1955,
"valid_targets_mean": 4246.9,
"valid_targets_min": 1394
},
{
"epoch": 3.506261180679785,
"grad_norm": 0.5374442471219851,
"learning_rate": 2.3435857201941172e-05,
"loss": 0.2717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27619755268096924,
"step": 1960,
"valid_targets_mean": 3896.1,
"valid_targets_min": 1301
},
{
"epoch": 3.51520572450805,
"grad_norm": 0.5087843696552686,
"learning_rate": 2.3347925350439765e-05,
"loss": 0.2799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2813979387283325,
"step": 1965,
"valid_targets_mean": 3997.4,
"valid_targets_min": 1369
},
{
"epoch": 3.5241502683363146,
"grad_norm": 0.5980560849762698,
"learning_rate": 2.3259926866953636e-05,
"loss": 0.2801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28663375973701477,
"step": 1970,
"valid_targets_mean": 3297.6,
"valid_targets_min": 1305
},
{
"epoch": 3.5330948121645798,
"grad_norm": 0.5193924325842352,
"learning_rate": 2.3171863502869993e-05,
"loss": 0.2671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26521211862564087,
"step": 1975,
"valid_targets_mean": 4117.4,
"valid_targets_min": 2056
},
{
"epoch": 3.5420393559928445,
"grad_norm": 0.5449182986186685,
"learning_rate": 2.3083737010867316e-05,
"loss": 0.2765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26807746291160583,
"step": 1980,
"valid_targets_mean": 3758.1,
"valid_targets_min": 1563
},
{
"epoch": 3.550983899821109,
"grad_norm": 0.6191157830270809,
"learning_rate": 2.2995549144880487e-05,
"loss": 0.2805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31274452805519104,
"step": 1985,
"valid_targets_mean": 3152.6,
"valid_targets_min": 710
},
{
"epoch": 3.559928443649374,
"grad_norm": 0.4986923272606033,
"learning_rate": 2.290730166006589e-05,
"loss": 0.2733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27044352889060974,
"step": 1990,
"valid_targets_mean": 4526.8,
"valid_targets_min": 1712
},
{
"epoch": 3.5688729874776386,
"grad_norm": 0.5291098132220836,
"learning_rate": 2.2818996312766474e-05,
"loss": 0.2784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28628769516944885,
"step": 1995,
"valid_targets_mean": 4237.6,
"valid_targets_min": 1300
},
{
"epoch": 3.5778175313059033,
"grad_norm": 0.5395780033336437,
"learning_rate": 2.2730634860476778e-05,
"loss": 0.2837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2602778673171997,
"step": 2000,
"valid_targets_mean": 3754.7,
"valid_targets_min": 2238
},
{
"epoch": 3.586762075134168,
"grad_norm": 0.5654796524167398,
"learning_rate": 2.264221906180798e-05,
"loss": 0.2853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26922616362571716,
"step": 2005,
"valid_targets_mean": 3893.6,
"valid_targets_min": 1565
},
{
"epoch": 3.595706618962433,
"grad_norm": 0.5747944159759851,
"learning_rate": 2.255375067645289e-05,
"loss": 0.2888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29051297903060913,
"step": 2010,
"valid_targets_mean": 3719.8,
"valid_targets_min": 1764
},
{
"epoch": 3.604651162790698,
"grad_norm": 1.076215188277447,
"learning_rate": 2.2465231465150902e-05,
"loss": 0.2711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2821960151195526,
"step": 2015,
"valid_targets_mean": 4530.9,
"valid_targets_min": 1666
},
{
"epoch": 3.6135957066189626,
"grad_norm": 0.5041678901004969,
"learning_rate": 2.2376663189653002e-05,
"loss": 0.2773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25614356994628906,
"step": 2020,
"valid_targets_mean": 4557.1,
"valid_targets_min": 2257
},
{
"epoch": 3.6225402504472273,
"grad_norm": 0.49697468351907303,
"learning_rate": 2.2288047612686655e-05,
"loss": 0.2639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2509356737136841,
"step": 2025,
"valid_targets_mean": 4656.5,
"valid_targets_min": 2178
},
{
"epoch": 3.631484794275492,
"grad_norm": 0.5593780074340731,
"learning_rate": 2.219938649792074e-05,
"loss": 0.2768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2787664532661438,
"step": 2030,
"valid_targets_mean": 3585.8,
"valid_targets_min": 725
},
{
"epoch": 3.6404293381037567,
"grad_norm": 0.6058445555907487,
"learning_rate": 2.2110681609930458e-05,
"loss": 0.283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28542840480804443,
"step": 2035,
"valid_targets_mean": 3754.0,
"valid_targets_min": 1893
},
{
"epoch": 3.6493738819320214,
"grad_norm": 0.6592434752132575,
"learning_rate": 2.2021934714162212e-05,
"loss": 0.2771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30062779784202576,
"step": 2040,
"valid_targets_mean": 3522.3,
"valid_targets_min": 527
},
{
"epoch": 3.658318425760286,
"grad_norm": 0.511485872021097,
"learning_rate": 2.1933147576898447e-05,
"loss": 0.2728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25937914848327637,
"step": 2045,
"valid_targets_mean": 3873.6,
"valid_targets_min": 1491
},
{
"epoch": 3.667262969588551,
"grad_norm": 0.5594642686607454,
"learning_rate": 2.1844321965222525e-05,
"loss": 0.2825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3036922216415405,
"step": 2050,
"valid_targets_mean": 3970.2,
"valid_targets_min": 1673
},
{
"epoch": 3.6762075134168155,
"grad_norm": 0.5162375365075016,
"learning_rate": 2.1755459646983545e-05,
"loss": 0.2824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27681976556777954,
"step": 2055,
"valid_targets_mean": 4571.4,
"valid_targets_min": 1171
},
{
"epoch": 3.6851520572450807,
"grad_norm": 0.507537692969965,
"learning_rate": 2.1666562390761147e-05,
"loss": 0.2799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2693493664264679,
"step": 2060,
"valid_targets_mean": 5078.4,
"valid_targets_min": 1264
},
{
"epoch": 3.6940966010733454,
"grad_norm": 0.5780198663275775,
"learning_rate": 2.1577631965830324e-05,
"loss": 0.2734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2515581250190735,
"step": 2065,
"valid_targets_mean": 3473.2,
"valid_targets_min": 1525
},
{
"epoch": 3.70304114490161,
"grad_norm": 0.5015533752033411,
"learning_rate": 2.1488670142126234e-05,
"loss": 0.2659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2759404182434082,
"step": 2070,
"valid_targets_mean": 4662.1,
"valid_targets_min": 1440
},
{
"epoch": 3.7119856887298748,
"grad_norm": 0.518248052496532,
"learning_rate": 2.13996786902089e-05,
"loss": 0.274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27556905150413513,
"step": 2075,
"valid_targets_mean": 4112.4,
"valid_targets_min": 2299
},
{
"epoch": 3.7209302325581395,
"grad_norm": 0.53651912472871,
"learning_rate": 2.1310659381228066e-05,
"loss": 0.2846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2784693241119385,
"step": 2080,
"valid_targets_mean": 3839.6,
"valid_targets_min": 1588
},
{
"epoch": 3.729874776386404,
"grad_norm": 0.5764048848203882,
"learning_rate": 2.122161398688788e-05,
"loss": 0.2903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28273123502731323,
"step": 2085,
"valid_targets_mean": 3669.2,
"valid_targets_min": 741
},
{
"epoch": 3.738819320214669,
"grad_norm": 0.4820289047101863,
"learning_rate": 2.1132544279411655e-05,
"loss": 0.2747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26568305492401123,
"step": 2090,
"valid_targets_mean": 4602.2,
"valid_targets_min": 786
},
{
"epoch": 3.747763864042934,
"grad_norm": 0.6120891450370751,
"learning_rate": 2.1043452031506578e-05,
"loss": 0.2807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2671006917953491,
"step": 2095,
"valid_targets_mean": 3208.0,
"valid_targets_min": 1621
},
{
"epoch": 3.7567084078711988,
"grad_norm": 0.4891187435236056,
"learning_rate": 2.0954339016328485e-05,
"loss": 0.2781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25922301411628723,
"step": 2100,
"valid_targets_mean": 4271.0,
"valid_targets_min": 1612
},
{
"epoch": 3.7656529516994635,
"grad_norm": 0.5464092724861203,
"learning_rate": 2.08652070074465e-05,
"loss": 0.2805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3047419786453247,
"step": 2105,
"valid_targets_mean": 3791.9,
"valid_targets_min": 1102
},
{
"epoch": 3.774597495527728,
"grad_norm": 0.6364819542700682,
"learning_rate": 2.077605777880778e-05,
"loss": 0.2681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31326138973236084,
"step": 2110,
"valid_targets_mean": 3016.8,
"valid_targets_min": 748
},
{
"epoch": 3.783542039355993,
"grad_norm": 0.5001257137373921,
"learning_rate": 2.0686893104702198e-05,
"loss": 0.2589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2531580328941345,
"step": 2115,
"valid_targets_mean": 4102.5,
"valid_targets_min": 1660
},
{
"epoch": 3.7924865831842576,
"grad_norm": 0.474779949675362,
"learning_rate": 2.0597714759727028e-05,
"loss": 0.2834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2678177058696747,
"step": 2120,
"valid_targets_mean": 4861.8,
"valid_targets_min": 1696
},
{
"epoch": 3.8014311270125223,
"grad_norm": 0.46813381967025147,
"learning_rate": 2.050852451875163e-05,
"loss": 0.2715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27863186597824097,
"step": 2125,
"valid_targets_mean": 4995.9,
"valid_targets_min": 715
},
{
"epoch": 3.810375670840787,
"grad_norm": 0.5646539409857256,
"learning_rate": 2.041932415688212e-05,
"loss": 0.2749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2734571099281311,
"step": 2130,
"valid_targets_mean": 4401.4,
"valid_targets_min": 1873
},
{
"epoch": 3.8193202146690517,
"grad_norm": 0.5405176564877853,
"learning_rate": 2.0330115449426054e-05,
"loss": 0.2792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30330121517181396,
"step": 2135,
"valid_targets_mean": 4075.5,
"valid_targets_min": 988
},
{
"epoch": 3.8282647584973164,
"grad_norm": 0.5063431046009021,
"learning_rate": 2.0240900171857064e-05,
"loss": 0.2892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29637011885643005,
"step": 2140,
"valid_targets_mean": 4556.2,
"valid_targets_min": 1850
},
{
"epoch": 3.8372093023255816,
"grad_norm": 0.6148280852194663,
"learning_rate": 2.0151680099779574e-05,
"loss": 0.2795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2594483494758606,
"step": 2145,
"valid_targets_mean": 3378.6,
"valid_targets_min": 943
},
{
"epoch": 3.8461538461538463,
"grad_norm": 0.5460464073665912,
"learning_rate": 2.0062457008893408e-05,
"loss": 0.2775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25146251916885376,
"step": 2150,
"valid_targets_mean": 3959.3,
"valid_targets_min": 1579
},
{
"epoch": 3.855098389982111,
"grad_norm": 0.5034957296053513,
"learning_rate": 1.9973232674958487e-05,
"loss": 0.2698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25639331340789795,
"step": 2155,
"valid_targets_mean": 4098.7,
"valid_targets_min": 1449
},
{
"epoch": 3.8640429338103757,
"grad_norm": 0.566801459570412,
"learning_rate": 1.9884008873759446e-05,
"loss": 0.2751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29593968391418457,
"step": 2160,
"valid_targets_mean": 3769.4,
"valid_targets_min": 474
},
{
"epoch": 3.8729874776386404,
"grad_norm": 0.5224664015779718,
"learning_rate": 1.979478738107035e-05,
"loss": 0.2669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2669827938079834,
"step": 2165,
"valid_targets_mean": 4153.2,
"valid_targets_min": 1824
},
{
"epoch": 3.881932021466905,
"grad_norm": 0.5346475973128151,
"learning_rate": 1.9705569972619295e-05,
"loss": 0.2837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28263264894485474,
"step": 2170,
"valid_targets_mean": 3984.6,
"valid_targets_min": 1518
},
{
"epoch": 3.89087656529517,
"grad_norm": 0.5482896143276372,
"learning_rate": 1.961635842405311e-05,
"loss": 0.2675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27248382568359375,
"step": 2175,
"valid_targets_mean": 4330.0,
"valid_targets_min": 1711
},
{
"epoch": 3.899821109123435,
"grad_norm": 0.48204226172382336,
"learning_rate": 1.9527154510901972e-05,
"loss": 0.2734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25980862975120544,
"step": 2180,
"valid_targets_mean": 4406.8,
"valid_targets_min": 1855
},
{
"epoch": 3.9087656529516996,
"grad_norm": 0.4210041453535078,
"learning_rate": 1.9437960008544126e-05,
"loss": 0.2578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2111448049545288,
"step": 2185,
"valid_targets_mean": 5192.1,
"valid_targets_min": 2200
},
{
"epoch": 3.9177101967799643,
"grad_norm": 0.5637363734690357,
"learning_rate": 1.9348776692170494e-05,
"loss": 0.2836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2881026566028595,
"step": 2190,
"valid_targets_mean": 3882.8,
"valid_targets_min": 558
},
{
"epoch": 3.926654740608229,
"grad_norm": 0.48316017438181486,
"learning_rate": 1.9259606336749374e-05,
"loss": 0.2784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2716853618621826,
"step": 2195,
"valid_targets_mean": 4683.8,
"valid_targets_min": 1674
},
{
"epoch": 3.9355992844364938,
"grad_norm": 0.45317704598781144,
"learning_rate": 1.9170450716991122e-05,
"loss": 0.2615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.236902117729187,
"step": 2200,
"valid_targets_mean": 4864.1,
"valid_targets_min": 2033
},
{
"epoch": 3.9445438282647585,
"grad_norm": 0.56647472453608,
"learning_rate": 1.90813116073128e-05,
"loss": 0.2896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30802735686302185,
"step": 2205,
"valid_targets_mean": 3714.6,
"valid_targets_min": 823
},
{
"epoch": 3.953488372093023,
"grad_norm": 0.5508322430994914,
"learning_rate": 1.899219078180289e-05,
"loss": 0.2789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29120323061943054,
"step": 2210,
"valid_targets_mean": 3726.9,
"valid_targets_min": 1807
},
{
"epoch": 3.962432915921288,
"grad_norm": 0.5708136652371602,
"learning_rate": 1.8903090014185984e-05,
"loss": 0.2706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26580384373664856,
"step": 2215,
"valid_targets_mean": 3621.6,
"valid_targets_min": 1470
},
{
"epoch": 3.9713774597495526,
"grad_norm": 0.5942416912075751,
"learning_rate": 1.881401107778744e-05,
"loss": 0.2802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30616092681884766,
"step": 2220,
"valid_targets_mean": 3367.2,
"valid_targets_min": 777
},
{
"epoch": 3.9803220035778173,
"grad_norm": 0.5144304612582596,
"learning_rate": 1.8724955745498147e-05,
"loss": 0.2689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2784048318862915,
"step": 2225,
"valid_targets_mean": 4234.6,
"valid_targets_min": 1729
},
{
"epoch": 3.9892665474060824,
"grad_norm": 0.5300804516751338,
"learning_rate": 1.863592578973921e-05,
"loss": 0.2769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27351003885269165,
"step": 2230,
"valid_targets_mean": 3583.5,
"valid_targets_min": 1324
},
{
"epoch": 3.998211091234347,
"grad_norm": 0.5329781559722259,
"learning_rate": 1.854692298242667e-05,
"loss": 0.2692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24892058968544006,
"step": 2235,
"valid_targets_mean": 3651.9,
"valid_targets_min": 1519
},
{
"epoch": 4.007155635062611,
"grad_norm": 0.4900604244331859,
"learning_rate": 1.8457949094936265e-05,
"loss": 0.2479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2408735752105713,
"step": 2240,
"valid_targets_mean": 4293.0,
"valid_targets_min": 1617
},
{
"epoch": 4.016100178890877,
"grad_norm": 0.49977219265912204,
"learning_rate": 1.8369005898068136e-05,
"loss": 0.25,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26399219036102295,
"step": 2245,
"valid_targets_mean": 5123.9,
"valid_targets_min": 667
},
{
"epoch": 4.025044722719142,
"grad_norm": 0.5502105291911087,
"learning_rate": 1.8280095162011617e-05,
"loss": 0.2608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28108128905296326,
"step": 2250,
"valid_targets_mean": 4024.1,
"valid_targets_min": 747
},
{
"epoch": 4.033989266547406,
"grad_norm": 0.5835364945002972,
"learning_rate": 1.819121865630998e-05,
"loss": 0.2627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25397148728370667,
"step": 2255,
"valid_targets_mean": 3106.8,
"valid_targets_min": 1424
},
{
"epoch": 4.042933810375671,
"grad_norm": 0.5736849669987507,
"learning_rate": 1.8102378149825242e-05,
"loss": 0.2566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25006911158561707,
"step": 2260,
"valid_targets_mean": 4338.4,
"valid_targets_min": 1212
},
{
"epoch": 4.051878354203936,
"grad_norm": 0.578856261130234,
"learning_rate": 1.801357541070294e-05,
"loss": 0.2561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2498929500579834,
"step": 2265,
"valid_targets_mean": 3711.7,
"valid_targets_min": 1454
},
{
"epoch": 4.0608228980322005,
"grad_norm": 0.570026305308228,
"learning_rate": 1.7924812206336956e-05,
"loss": 0.2641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24680036306381226,
"step": 2270,
"valid_targets_mean": 3502.1,
"valid_targets_min": 766
},
{
"epoch": 4.069767441860465,
"grad_norm": 0.5017381451878832,
"learning_rate": 1.7836090303334312e-05,
"loss": 0.2587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24516400694847107,
"step": 2275,
"valid_targets_mean": 4885.2,
"valid_targets_min": 1056
},
{
"epoch": 4.07871198568873,
"grad_norm": 0.6571441759078382,
"learning_rate": 1.7747411467480058e-05,
"loss": 0.2619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25563162565231323,
"step": 2280,
"valid_targets_mean": 4010.9,
"valid_targets_min": 1636
},
{
"epoch": 4.087656529516995,
"grad_norm": 0.5157227921600919,
"learning_rate": 1.7658777463702076e-05,
"loss": 0.2611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26061367988586426,
"step": 2285,
"valid_targets_mean": 4204.8,
"valid_targets_min": 1436
},
{
"epoch": 4.096601073345259,
"grad_norm": 0.5245851983426554,
"learning_rate": 1.7570190056035996e-05,
"loss": 0.2598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23559322953224182,
"step": 2290,
"valid_targets_mean": 4053.4,
"valid_targets_min": 722
},
{
"epoch": 4.105545617173524,
"grad_norm": 0.5917926110353966,
"learning_rate": 1.7481651007590054e-05,
"loss": 0.2706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25014737248420715,
"step": 2295,
"valid_targets_mean": 3289.2,
"valid_targets_min": 699
},
{
"epoch": 4.114490161001789,
"grad_norm": 0.5026025456498621,
"learning_rate": 1.7393162080510045e-05,
"loss": 0.2712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2548500895500183,
"step": 2300,
"valid_targets_mean": 4602.9,
"valid_targets_min": 1525
},
{
"epoch": 4.1234347048300535,
"grad_norm": 0.5164574844544229,
"learning_rate": 1.7304725035944194e-05,
"loss": 0.2549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2356826364994049,
"step": 2305,
"valid_targets_mean": 4163.1,
"valid_targets_min": 1691
},
{
"epoch": 4.132379248658318,
"grad_norm": 0.48824332711112567,
"learning_rate": 1.7216341634008168e-05,
"loss": 0.2493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25585299730300903,
"step": 2310,
"valid_targets_mean": 5345.3,
"valid_targets_min": 2336
},
{
"epoch": 4.141323792486583,
"grad_norm": 0.5908232354996049,
"learning_rate": 1.7128013633749978e-05,
"loss": 0.2713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26593607664108276,
"step": 2315,
"valid_targets_mean": 4050.5,
"valid_targets_min": 684
},
{
"epoch": 4.150268336314848,
"grad_norm": 0.5495386431735231,
"learning_rate": 1.7039742793115025e-05,
"loss": 0.2688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2615734040737152,
"step": 2320,
"valid_targets_mean": 3975.1,
"valid_targets_min": 2183
},
{
"epoch": 4.159212880143112,
"grad_norm": 0.6242915835353913,
"learning_rate": 1.6951530868911097e-05,
"loss": 0.2654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2717490792274475,
"step": 2325,
"valid_targets_mean": 3084.0,
"valid_targets_min": 737
},
{
"epoch": 4.168157423971378,
"grad_norm": 0.5070664833456054,
"learning_rate": 1.6863379616773388e-05,
"loss": 0.2641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2583721876144409,
"step": 2330,
"valid_targets_mean": 4625.7,
"valid_targets_min": 1817
},
{
"epoch": 4.177101967799643,
"grad_norm": 0.5582812233226788,
"learning_rate": 1.6775290791129567e-05,
"loss": 0.2584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2620850205421448,
"step": 2335,
"valid_targets_mean": 3869.9,
"valid_targets_min": 1570
},
{
"epoch": 4.186046511627907,
"grad_norm": 0.584227709585007,
"learning_rate": 1.668726614516488e-05,
"loss": 0.2689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25571852922439575,
"step": 2340,
"valid_targets_mean": 3331.9,
"valid_targets_min": 1615
},
{
"epoch": 4.194991055456172,
"grad_norm": 0.5175133185961949,
"learning_rate": 1.6599307430787216e-05,
"loss": 0.256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2526220977306366,
"step": 2345,
"valid_targets_mean": 4406.4,
"valid_targets_min": 1662
},
{
"epoch": 4.203935599284437,
"grad_norm": 0.49289171535932735,
"learning_rate": 1.6511416398592264e-05,
"loss": 0.2705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2843324840068817,
"step": 2350,
"valid_targets_mean": 5134.6,
"valid_targets_min": 995
},
{
"epoch": 4.212880143112701,
"grad_norm": 0.5356859083954757,
"learning_rate": 1.64235947978287e-05,
"loss": 0.2669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28424036502838135,
"step": 2355,
"valid_targets_mean": 4424.1,
"valid_targets_min": 1810
},
{
"epoch": 4.221824686940966,
"grad_norm": 0.513042991430007,
"learning_rate": 1.6335844376363295e-05,
"loss": 0.2664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2585211396217346,
"step": 2360,
"valid_targets_mean": 5082.6,
"valid_targets_min": 907
},
{
"epoch": 4.230769230769231,
"grad_norm": 0.5695128355206176,
"learning_rate": 1.6248166880646225e-05,
"loss": 0.2557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2641540467739105,
"step": 2365,
"valid_targets_mean": 3779.7,
"valid_targets_min": 1253
},
{
"epoch": 4.2397137745974955,
"grad_norm": 0.6023295149757434,
"learning_rate": 1.6160564055676235e-05,
"loss": 0.259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2857375144958496,
"step": 2370,
"valid_targets_mean": 2948.9,
"valid_targets_min": 720
},
{
"epoch": 4.24865831842576,
"grad_norm": 0.5098827801538092,
"learning_rate": 1.6073037644965938e-05,
"loss": 0.2548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23553355038166046,
"step": 2375,
"valid_targets_mean": 4315.9,
"valid_targets_min": 1473
},
{
"epoch": 4.257602862254025,
"grad_norm": 0.5243491333274759,
"learning_rate": 1.5985589390507117e-05,
"loss": 0.2627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27872568368911743,
"step": 2380,
"valid_targets_mean": 4803.7,
"valid_targets_min": 842
},
{
"epoch": 4.26654740608229,
"grad_norm": 0.5241756061317848,
"learning_rate": 1.589822103273607e-05,
"loss": 0.2633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2604633867740631,
"step": 2385,
"valid_targets_mean": 3930.9,
"valid_targets_min": 835
},
{
"epoch": 4.275491949910554,
"grad_norm": 0.4948005196786464,
"learning_rate": 1.5810934310498922e-05,
"loss": 0.2733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28036582469940186,
"step": 2390,
"valid_targets_mean": 4740.4,
"valid_targets_min": 1665
},
{
"epoch": 4.284436493738819,
"grad_norm": 0.5212209771223362,
"learning_rate": 1.5723730961017082e-05,
"loss": 0.2593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28980493545532227,
"step": 2395,
"valid_targets_mean": 4507.4,
"valid_targets_min": 1489
},
{
"epoch": 4.293381037567084,
"grad_norm": 0.5309847222961126,
"learning_rate": 1.5636612719852615e-05,
"loss": 0.2732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2707955837249756,
"step": 2400,
"valid_targets_mean": 4071.7,
"valid_targets_min": 2048
},
{
"epoch": 4.3023255813953485,
"grad_norm": 0.6436096499085671,
"learning_rate": 1.5549581320873715e-05,
"loss": 0.2596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27491945028305054,
"step": 2405,
"valid_targets_mean": 3519.8,
"valid_targets_min": 483
},
{
"epoch": 4.311270125223613,
"grad_norm": 0.6837292335134912,
"learning_rate": 1.5462638496220223e-05,
"loss": 0.2615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2572469413280487,
"step": 2410,
"valid_targets_mean": 3385.1,
"valid_targets_min": 787
},
{
"epoch": 4.320214669051879,
"grad_norm": 0.5148506938846231,
"learning_rate": 1.537578597626912e-05,
"loss": 0.2701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2704946994781494,
"step": 2415,
"valid_targets_mean": 4277.2,
"valid_targets_min": 1140
},
{
"epoch": 4.3291592128801435,
"grad_norm": 0.5488881906738768,
"learning_rate": 1.528902548960009e-05,
"loss": 0.2697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26252859830856323,
"step": 2420,
"valid_targets_mean": 4134.1,
"valid_targets_min": 697
},
{
"epoch": 4.338103756708408,
"grad_norm": 0.728874058237292,
"learning_rate": 1.5202358762961155e-05,
"loss": 0.2694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2942860424518585,
"step": 2425,
"valid_targets_mean": 2536.9,
"valid_targets_min": 629
},
{
"epoch": 4.347048300536673,
"grad_norm": 0.542241600208826,
"learning_rate": 1.511578752123426e-05,
"loss": 0.2574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2418219894170761,
"step": 2430,
"valid_targets_mean": 3832.9,
"valid_targets_min": 1764
},
{
"epoch": 4.355992844364938,
"grad_norm": 0.5211187289766209,
"learning_rate": 1.5029313487400958e-05,
"loss": 0.2681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27209898829460144,
"step": 2435,
"valid_targets_mean": 4450.8,
"valid_targets_min": 1600
},
{
"epoch": 4.364937388193202,
"grad_norm": 0.519412156562896,
"learning_rate": 1.4942938382508147e-05,
"loss": 0.2535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2514136731624603,
"step": 2440,
"valid_targets_mean": 3935.2,
"valid_targets_min": 1225
},
{
"epoch": 4.373881932021467,
"grad_norm": 0.5552648581770736,
"learning_rate": 1.4856663925633776e-05,
"loss": 0.2623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27997347712516785,
"step": 2445,
"valid_targets_mean": 3901.2,
"valid_targets_min": 656
},
{
"epoch": 4.382826475849732,
"grad_norm": 0.5765361718445776,
"learning_rate": 1.4770491833852663e-05,
"loss": 0.2663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25308501720428467,
"step": 2450,
"valid_targets_mean": 3612.2,
"valid_targets_min": 1505
},
{
"epoch": 4.391771019677996,
"grad_norm": 0.4583081364190965,
"learning_rate": 1.4684423822202297e-05,
"loss": 0.2566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2737816870212555,
"step": 2455,
"valid_targets_mean": 5324.3,
"valid_targets_min": 1435
},
{
"epoch": 4.400715563506261,
"grad_norm": 0.5330319752947505,
"learning_rate": 1.4598461603648736e-05,
"loss": 0.2692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2785816788673401,
"step": 2460,
"valid_targets_mean": 3858.1,
"valid_targets_min": 646
},
{
"epoch": 4.409660107334526,
"grad_norm": 0.5365942670180822,
"learning_rate": 1.451260688905245e-05,
"loss": 0.266,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25116056203842163,
"step": 2465,
"valid_targets_mean": 3929.6,
"valid_targets_min": 1495
},
{
"epoch": 4.4186046511627906,
"grad_norm": 0.5412560763819989,
"learning_rate": 1.4426861387134361e-05,
"loss": 0.2635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2546349763870239,
"step": 2470,
"valid_targets_mean": 3853.9,
"valid_targets_min": 1665
},
{
"epoch": 4.427549194991055,
"grad_norm": 0.49146455305384606,
"learning_rate": 1.4341226804441766e-05,
"loss": 0.2707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.284711092710495,
"step": 2475,
"valid_targets_mean": 4519.9,
"valid_targets_min": 2096
},
{
"epoch": 4.43649373881932,
"grad_norm": 0.5417709539865344,
"learning_rate": 1.4255704845314406e-05,
"loss": 0.2744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28545889258384705,
"step": 2480,
"valid_targets_mean": 4169.8,
"valid_targets_min": 1480
},
{
"epoch": 4.445438282647585,
"grad_norm": 0.580103049281134,
"learning_rate": 1.4170297211850522e-05,
"loss": 0.2597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2692874073982239,
"step": 2485,
"valid_targets_mean": 3508.5,
"valid_targets_min": 1796
},
{
"epoch": 4.454382826475849,
"grad_norm": 0.518242596266636,
"learning_rate": 1.4085005603873004e-05,
"loss": 0.2748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27401190996170044,
"step": 2490,
"valid_targets_mean": 4321.2,
"valid_targets_min": 1504
},
{
"epoch": 4.463327370304114,
"grad_norm": 0.5757017697078726,
"learning_rate": 1.3999831718895545e-05,
"loss": 0.276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28794726729393005,
"step": 2495,
"valid_targets_mean": 4045.3,
"valid_targets_min": 1123
},
{
"epoch": 4.47227191413238,
"grad_norm": 0.5507231462190035,
"learning_rate": 1.3914777252088851e-05,
"loss": 0.2666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28651851415634155,
"step": 2500,
"valid_targets_mean": 4500.8,
"valid_targets_min": 1340
},
{
"epoch": 4.481216457960644,
"grad_norm": 0.5709744504493519,
"learning_rate": 1.3829843896246917e-05,
"loss": 0.2715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2755128741264343,
"step": 2505,
"valid_targets_mean": 3492.8,
"valid_targets_min": 1623
},
{
"epoch": 4.490161001788909,
"grad_norm": 0.6042383309260438,
"learning_rate": 1.3745033341753337e-05,
"loss": 0.2687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2556525468826294,
"step": 2510,
"valid_targets_mean": 3758.3,
"valid_targets_min": 1447
},
{
"epoch": 4.499105545617174,
"grad_norm": 0.5391378624752455,
"learning_rate": 1.3660347276547645e-05,
"loss": 0.2761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2629320025444031,
"step": 2515,
"valid_targets_mean": 3977.8,
"valid_targets_min": 1561
},
{
"epoch": 4.5080500894454385,
"grad_norm": 0.5894869456529992,
"learning_rate": 1.3575787386091745e-05,
"loss": 0.2549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2664399743080139,
"step": 2520,
"valid_targets_mean": 3450.4,
"valid_targets_min": 1805
},
{
"epoch": 4.516994633273703,
"grad_norm": 0.5927649885745278,
"learning_rate": 1.3491355353336338e-05,
"loss": 0.2701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2676470875740051,
"step": 2525,
"valid_targets_mean": 3550.7,
"valid_targets_min": 741
},
{
"epoch": 4.525939177101968,
"grad_norm": 0.5460664988494238,
"learning_rate": 1.3407052858687432e-05,
"loss": 0.2693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28948739171028137,
"step": 2530,
"valid_targets_mean": 4106.0,
"valid_targets_min": 1399
},
{
"epoch": 4.534883720930233,
"grad_norm": 0.547063854344203,
"learning_rate": 1.3322881579972934e-05,
"loss": 0.2616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2661360502243042,
"step": 2535,
"valid_targets_mean": 3879.1,
"valid_targets_min": 754
},
{
"epoch": 4.543828264758497,
"grad_norm": 0.5551257878105804,
"learning_rate": 1.323884319240921e-05,
"loss": 0.2649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30140677094459534,
"step": 2540,
"valid_targets_mean": 3945.9,
"valid_targets_min": 1303
},
{
"epoch": 4.552772808586762,
"grad_norm": 0.5712690563559092,
"learning_rate": 1.3154939368567771e-05,
"loss": 0.2432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25856685638427734,
"step": 2545,
"valid_targets_mean": 3441.0,
"valid_targets_min": 1512
},
{
"epoch": 4.561717352415027,
"grad_norm": 0.5434270961027026,
"learning_rate": 1.3071171778341975e-05,
"loss": 0.2597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25168734788894653,
"step": 2550,
"valid_targets_mean": 4073.9,
"valid_targets_min": 1313
},
{
"epoch": 4.5706618962432914,
"grad_norm": 0.5497424956791681,
"learning_rate": 1.2987542088913801e-05,
"loss": 0.2587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24401748180389404,
"step": 2555,
"valid_targets_mean": 4201.8,
"valid_targets_min": 1546
},
{
"epoch": 4.579606440071556,
"grad_norm": 0.5096054278407313,
"learning_rate": 1.290405196472064e-05,
"loss": 0.265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26317811012268066,
"step": 2560,
"valid_targets_mean": 4815.1,
"valid_targets_min": 1171
},
{
"epoch": 4.588550983899821,
"grad_norm": 0.5275387474839849,
"learning_rate": 1.282070306742222e-05,
"loss": 0.265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2525607645511627,
"step": 2565,
"valid_targets_mean": 4492.8,
"valid_targets_min": 1887
},
{
"epoch": 4.597495527728086,
"grad_norm": 0.5924005743194193,
"learning_rate": 1.2737497055867482e-05,
"loss": 0.2701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2749042510986328,
"step": 2570,
"valid_targets_mean": 3256.1,
"valid_targets_min": 825
},
{
"epoch": 4.60644007155635,
"grad_norm": 0.520307087440015,
"learning_rate": 1.2654435586061604e-05,
"loss": 0.2489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23750732839107513,
"step": 2575,
"valid_targets_mean": 3960.6,
"valid_targets_min": 1329
},
{
"epoch": 4.615384615384615,
"grad_norm": 0.5616936308653787,
"learning_rate": 1.2571520311133012e-05,
"loss": 0.2627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26292529702186584,
"step": 2580,
"valid_targets_mean": 4504.7,
"valid_targets_min": 1275
},
{
"epoch": 4.624329159212881,
"grad_norm": 0.5518910049186732,
"learning_rate": 1.2488752881300514e-05,
"loss": 0.2539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2535983920097351,
"step": 2585,
"valid_targets_mean": 3939.8,
"valid_targets_min": 1386
},
{
"epoch": 4.633273703041145,
"grad_norm": 0.5256431179864964,
"learning_rate": 1.2406134943840398e-05,
"loss": 0.2496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2522655129432678,
"step": 2590,
"valid_targets_mean": 4140.9,
"valid_targets_min": 474
},
{
"epoch": 4.64221824686941,
"grad_norm": 0.5048588742383056,
"learning_rate": 1.232366814305372e-05,
"loss": 0.2498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24697677791118622,
"step": 2595,
"valid_targets_mean": 4505.9,
"valid_targets_min": 1820
},
{
"epoch": 4.651162790697675,
"grad_norm": 0.6135798826851775,
"learning_rate": 1.2241354120233527e-05,
"loss": 0.2609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27449357509613037,
"step": 2600,
"valid_targets_mean": 3534.1,
"valid_targets_min": 1231
},
{
"epoch": 4.660107334525939,
"grad_norm": 0.5407420740372647,
"learning_rate": 1.2159194513632213e-05,
"loss": 0.2619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2621440589427948,
"step": 2605,
"valid_targets_mean": 3698.6,
"valid_targets_min": 625
},
{
"epoch": 4.669051878354204,
"grad_norm": 0.5784897601072413,
"learning_rate": 1.20771909584289e-05,
"loss": 0.2683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2809554934501648,
"step": 2610,
"valid_targets_mean": 4114.5,
"valid_targets_min": 1649
},
{
"epoch": 4.677996422182469,
"grad_norm": 0.5583707405753705,
"learning_rate": 1.1995345086696919e-05,
"loss": 0.2593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.265133798122406,
"step": 2615,
"valid_targets_mean": 4105.6,
"valid_targets_min": 1769
},
{
"epoch": 4.6869409660107335,
"grad_norm": 0.5899963254378155,
"learning_rate": 1.1913658527371284e-05,
"loss": 0.2642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2800382077693939,
"step": 2620,
"valid_targets_mean": 3958.2,
"valid_targets_min": 1014
},
{
"epoch": 4.695885509838998,
"grad_norm": 0.5666305355030801,
"learning_rate": 1.1832132906216314e-05,
"loss": 0.2681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27610641717910767,
"step": 2625,
"valid_targets_mean": 3627.1,
"valid_targets_min": 734
},
{
"epoch": 4.704830053667263,
"grad_norm": 0.48544029558526913,
"learning_rate": 1.1750769845793268e-05,
"loss": 0.2629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25514447689056396,
"step": 2630,
"valid_targets_mean": 4717.1,
"valid_targets_min": 767
},
{
"epoch": 4.713774597495528,
"grad_norm": 0.5191718129231461,
"learning_rate": 1.1669570965428028e-05,
"loss": 0.2708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28754234313964844,
"step": 2635,
"valid_targets_mean": 4340.2,
"valid_targets_min": 1685
},
{
"epoch": 4.722719141323792,
"grad_norm": 0.5824564729383654,
"learning_rate": 1.1588537881178902e-05,
"loss": 0.2545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.259286105632782,
"step": 2640,
"valid_targets_mean": 3709.2,
"valid_targets_min": 1083
},
{
"epoch": 4.731663685152057,
"grad_norm": 0.6199061316983084,
"learning_rate": 1.150767220580444e-05,
"loss": 0.2628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.264919638633728,
"step": 2645,
"valid_targets_mean": 3604.6,
"valid_targets_min": 1544
},
{
"epoch": 4.740608228980322,
"grad_norm": 0.4746750054946057,
"learning_rate": 1.1426975548731329e-05,
"loss": 0.2587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21649254858493805,
"step": 2650,
"valid_targets_mean": 4358.8,
"valid_targets_min": 1497
},
{
"epoch": 4.7495527728085865,
"grad_norm": 0.6094545797228554,
"learning_rate": 1.1346449516022395e-05,
"loss": 0.2525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26640570163726807,
"step": 2655,
"valid_targets_mean": 3034.4,
"valid_targets_min": 529
},
{
"epoch": 4.758497316636851,
"grad_norm": 0.5341381722241784,
"learning_rate": 1.1266095710344611e-05,
"loss": 0.261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2599736154079437,
"step": 2660,
"valid_targets_mean": 4056.6,
"valid_targets_min": 748
},
{
"epoch": 4.767441860465116,
"grad_norm": 0.5450354818964038,
"learning_rate": 1.1185915730937209e-05,
"loss": 0.2554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2556326985359192,
"step": 2665,
"valid_targets_mean": 3869.1,
"valid_targets_min": 1724
},
{
"epoch": 4.7763864042933815,
"grad_norm": 0.5823841949915403,
"learning_rate": 1.1105911173579831e-05,
"loss": 0.2757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2735878527164459,
"step": 2670,
"valid_targets_mean": 3594.8,
"valid_targets_min": 1608
},
{
"epoch": 4.785330948121646,
"grad_norm": 0.5282126999205208,
"learning_rate": 1.1026083630560814e-05,
"loss": 0.2526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26514312624931335,
"step": 2675,
"valid_targets_mean": 4371.6,
"valid_targets_min": 1156
},
{
"epoch": 4.794275491949911,
"grad_norm": 0.5463930991787092,
"learning_rate": 1.0946434690645446e-05,
"loss": 0.2611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2594326138496399,
"step": 2680,
"valid_targets_mean": 4857.9,
"valid_targets_min": 2646
},
{
"epoch": 4.803220035778176,
"grad_norm": 0.4924897165473573,
"learning_rate": 1.08669659390444e-05,
"loss": 0.2654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2588515281677246,
"step": 2685,
"valid_targets_mean": 4642.6,
"valid_targets_min": 2325
},
{
"epoch": 4.81216457960644,
"grad_norm": 0.4976503303623363,
"learning_rate": 1.0787678957382124e-05,
"loss": 0.2516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.268010675907135,
"step": 2690,
"valid_targets_mean": 4382.6,
"valid_targets_min": 1666
},
{
"epoch": 4.821109123434705,
"grad_norm": 0.5302669946862639,
"learning_rate": 1.0708575323665422e-05,
"loss": 0.2561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25757157802581787,
"step": 2695,
"valid_targets_mean": 3814.4,
"valid_targets_min": 1832
},
{
"epoch": 4.83005366726297,
"grad_norm": 0.546113045209434,
"learning_rate": 1.062965661225201e-05,
"loss": 0.2636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2852606773376465,
"step": 2700,
"valid_targets_mean": 4466.5,
"valid_targets_min": 1706
},
{
"epoch": 4.838998211091234,
"grad_norm": 0.508464282119227,
"learning_rate": 1.0550924393819204e-05,
"loss": 0.2638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2477300763130188,
"step": 2705,
"valid_targets_mean": 4274.6,
"valid_targets_min": 1461
},
{
"epoch": 4.847942754919499,
"grad_norm": 0.5908025845080628,
"learning_rate": 1.0472380235332631e-05,
"loss": 0.2632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26860788464546204,
"step": 2710,
"valid_targets_mean": 3469.6,
"valid_targets_min": 1287
},
{
"epoch": 4.856887298747764,
"grad_norm": 0.49449536043979037,
"learning_rate": 1.0394025700015064e-05,
"loss": 0.2601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2539494037628174,
"step": 2715,
"valid_targets_mean": 5158.5,
"valid_targets_min": 1956
},
{
"epoch": 4.8658318425760285,
"grad_norm": 0.5211386908969953,
"learning_rate": 1.0315862347315314e-05,
"loss": 0.263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26820501685142517,
"step": 2720,
"valid_targets_mean": 4476.4,
"valid_targets_min": 1901
},
{
"epoch": 4.874776386404293,
"grad_norm": 0.5544257720104306,
"learning_rate": 1.0237891732877202e-05,
"loss": 0.2671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2941119372844696,
"step": 2725,
"valid_targets_mean": 4002.2,
"valid_targets_min": 1560
},
{
"epoch": 4.883720930232558,
"grad_norm": 0.5465940219798077,
"learning_rate": 1.0160115408508533e-05,
"loss": 0.2693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26257503032684326,
"step": 2730,
"valid_targets_mean": 3682.9,
"valid_targets_min": 950
},
{
"epoch": 4.892665474060823,
"grad_norm": 0.5476342559629205,
"learning_rate": 1.008253492215031e-05,
"loss": 0.2565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2684975862503052,
"step": 2735,
"valid_targets_mean": 4095.6,
"valid_targets_min": 1925
},
{
"epoch": 4.901610017889087,
"grad_norm": 0.5180846052234739,
"learning_rate": 1.0005151817845853e-05,
"loss": 0.2729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2808322012424469,
"step": 2740,
"valid_targets_mean": 4175.7,
"valid_targets_min": 2464
},
{
"epoch": 4.910554561717352,
"grad_norm": 0.5936981738189633,
"learning_rate": 9.927967635710087e-06,
"loss": 0.2516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24229755997657776,
"step": 2745,
"valid_targets_mean": 4147.9,
"valid_targets_min": 914
},
{
"epoch": 4.919499105545617,
"grad_norm": 0.5464370878938494,
"learning_rate": 9.850983911898913e-06,
"loss": 0.2657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24679221212863922,
"step": 2750,
"valid_targets_mean": 3841.9,
"valid_targets_min": 877
},
{
"epoch": 4.928443649373882,
"grad_norm": 0.5334187085612581,
"learning_rate": 9.774202178578592e-06,
"loss": 0.2531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2615172863006592,
"step": 2755,
"valid_targets_mean": 3857.0,
"valid_targets_min": 622
},
{
"epoch": 4.937388193202147,
"grad_norm": 0.5666627948297285,
"learning_rate": 9.69762396389529e-06,
"loss": 0.2637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2589084804058075,
"step": 2760,
"valid_targets_mean": 3624.9,
"valid_targets_min": 1519
},
{
"epoch": 4.946332737030412,
"grad_norm": 0.5273284504363817,
"learning_rate": 9.621250791944659e-06,
"loss": 0.2627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2510490417480469,
"step": 2765,
"valid_targets_mean": 5004.1,
"valid_targets_min": 1979
},
{
"epoch": 4.9552772808586765,
"grad_norm": 0.6220423946842822,
"learning_rate": 9.545084182741476e-06,
"loss": 0.2723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2961236536502838,
"step": 2770,
"valid_targets_mean": 3909.4,
"valid_targets_min": 657
},
{
"epoch": 4.964221824686941,
"grad_norm": 0.6418856659491654,
"learning_rate": 9.469125652189403e-06,
"loss": 0.2672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28539496660232544,
"step": 2775,
"valid_targets_mean": 3030.6,
"valid_targets_min": 575
},
{
"epoch": 4.973166368515206,
"grad_norm": 0.5309277403670316,
"learning_rate": 9.393376712050847e-06,
"loss": 0.2637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2643331289291382,
"step": 2780,
"valid_targets_mean": 4088.8,
"valid_targets_min": 848
},
{
"epoch": 4.982110912343471,
"grad_norm": 0.6124698201076337,
"learning_rate": 9.317838869916835e-06,
"loss": 0.2632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28254374861717224,
"step": 2785,
"valid_targets_mean": 3677.6,
"valid_targets_min": 1521
},
{
"epoch": 4.991055456171735,
"grad_norm": 0.7441462785686875,
"learning_rate": 9.242513629177033e-06,
"loss": 0.261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27683040499687195,
"step": 2790,
"valid_targets_mean": 3313.4,
"valid_targets_min": 627
},
{
"epoch": 5.0,
"grad_norm": 0.5230399259211697,
"learning_rate": 9.167402488989784e-06,
"loss": 0.2555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25869959592819214,
"step": 2795,
"valid_targets_mean": 3854.7,
"valid_targets_min": 743
},
{
"epoch": 5.008944543828265,
"grad_norm": 0.5549552542784999,
"learning_rate": 9.092506944252344e-06,
"loss": 0.2525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2471010535955429,
"step": 2800,
"valid_targets_mean": 4048.8,
"valid_targets_min": 1320
},
{
"epoch": 5.017889087656529,
"grad_norm": 0.5147728124256338,
"learning_rate": 9.017828485571044e-06,
"loss": 0.2399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23798583447933197,
"step": 2805,
"valid_targets_mean": 4106.8,
"valid_targets_min": 937
},
{
"epoch": 5.026833631484794,
"grad_norm": 0.5315317178738851,
"learning_rate": 8.943368599231706e-06,
"loss": 0.2644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2732792794704437,
"step": 2810,
"valid_targets_mean": 4333.1,
"valid_targets_min": 2013
},
{
"epoch": 5.035778175313059,
"grad_norm": 0.5729446923576372,
"learning_rate": 8.869128767169986e-06,
"loss": 0.2424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2487604320049286,
"step": 2815,
"valid_targets_mean": 4101.1,
"valid_targets_min": 1705
},
{
"epoch": 5.0447227191413235,
"grad_norm": 0.5034079404779742,
"learning_rate": 8.79511046694194e-06,
"loss": 0.2608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26576727628707886,
"step": 2820,
"valid_targets_mean": 5089.2,
"valid_targets_min": 2511
},
{
"epoch": 5.053667262969588,
"grad_norm": 0.6023654856445056,
"learning_rate": 8.721315171694591e-06,
"loss": 0.2452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25126317143440247,
"step": 2825,
"valid_targets_mean": 3496.4,
"valid_targets_min": 690
},
{
"epoch": 5.062611806797853,
"grad_norm": 0.6689786638114392,
"learning_rate": 8.647744350136612e-06,
"loss": 0.2462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24577105045318604,
"step": 2830,
"valid_targets_mean": 2972.4,
"valid_targets_min": 732
},
{
"epoch": 5.071556350626118,
"grad_norm": 0.5438242397653636,
"learning_rate": 8.574399466509085e-06,
"loss": 0.2551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26564639806747437,
"step": 2835,
"valid_targets_mean": 3876.6,
"valid_targets_min": 1618
},
{
"epoch": 5.080500894454383,
"grad_norm": 0.6404762750457129,
"learning_rate": 8.501281980556369e-06,
"loss": 0.2638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2322574257850647,
"step": 2840,
"valid_targets_mean": 3335.4,
"valid_targets_min": 1755
},
{
"epoch": 5.089445438282648,
"grad_norm": 0.5158771438098722,
"learning_rate": 8.428393347497057e-06,
"loss": 0.2549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2659394145011902,
"step": 2845,
"valid_targets_mean": 4493.7,
"valid_targets_min": 2239
},
{
"epoch": 5.098389982110913,
"grad_norm": 0.563631894055807,
"learning_rate": 8.355735017995011e-06,
"loss": 0.2518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23874777555465698,
"step": 2850,
"valid_targets_mean": 3666.8,
"valid_targets_min": 754
},
{
"epoch": 5.107334525939177,
"grad_norm": 0.5264091725894624,
"learning_rate": 8.283308438130458e-06,
"loss": 0.2557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28656524419784546,
"step": 2855,
"valid_targets_mean": 4860.7,
"valid_targets_min": 1880
},
{
"epoch": 5.116279069767442,
"grad_norm": 0.5531684984629897,
"learning_rate": 8.211115049371266e-06,
"loss": 0.2478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25294798612594604,
"step": 2860,
"valid_targets_mean": 4066.2,
"valid_targets_min": 634
},
{
"epoch": 5.125223613595707,
"grad_norm": 0.5887989735486293,
"learning_rate": 8.13915628854419e-06,
"loss": 0.246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27043190598487854,
"step": 2865,
"valid_targets_mean": 3563.4,
"valid_targets_min": 737
},
{
"epoch": 5.1341681574239715,
"grad_norm": 0.6198216758291454,
"learning_rate": 8.067433587806336e-06,
"loss": 0.2588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2664569318294525,
"step": 2870,
"valid_targets_mean": 3196.0,
"valid_targets_min": 646
},
{
"epoch": 5.143112701252236,
"grad_norm": 0.49039197556547504,
"learning_rate": 7.995948374616628e-06,
"loss": 0.2449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24738174676895142,
"step": 2875,
"valid_targets_mean": 4813.1,
"valid_targets_min": 1748
},
{
"epoch": 5.152057245080501,
"grad_norm": 0.5124249703499617,
"learning_rate": 7.924702071707386e-06,
"loss": 0.2482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22936435043811798,
"step": 2880,
"valid_targets_mean": 4589.9,
"valid_targets_min": 669
},
{
"epoch": 5.161001788908766,
"grad_norm": 0.5356467322668551,
"learning_rate": 7.853696097056037e-06,
"loss": 0.2582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.264324426651001,
"step": 2885,
"valid_targets_mean": 4108.2,
"valid_targets_min": 1605
},
{
"epoch": 5.16994633273703,
"grad_norm": 0.5087262397528598,
"learning_rate": 7.782931863856888e-06,
"loss": 0.248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23341549932956696,
"step": 2890,
"valid_targets_mean": 4439.1,
"valid_targets_min": 1726
},
{
"epoch": 5.178890876565295,
"grad_norm": 0.5549321487561256,
"learning_rate": 7.71241078049298e-06,
"loss": 0.2438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25444790720939636,
"step": 2895,
"valid_targets_mean": 4032.2,
"valid_targets_min": 1642
},
{
"epoch": 5.18783542039356,
"grad_norm": 0.5352806321855557,
"learning_rate": 7.642134250508069e-06,
"loss": 0.2452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24765413999557495,
"step": 2900,
"valid_targets_mean": 4077.3,
"valid_targets_min": 1757
},
{
"epoch": 5.196779964221824,
"grad_norm": 0.5518211501366974,
"learning_rate": 7.57210367257871e-06,
"loss": 0.2655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24627630412578583,
"step": 2905,
"valid_targets_mean": 4041.1,
"valid_targets_min": 1350
},
{
"epoch": 5.205724508050089,
"grad_norm": 0.5517560537112484,
"learning_rate": 7.502320440486399e-06,
"loss": 0.2516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27135342359542847,
"step": 2910,
"valid_targets_mean": 4264.5,
"valid_targets_min": 1184
},
{
"epoch": 5.214669051878354,
"grad_norm": 0.5509625444275201,
"learning_rate": 7.4327859430898445e-06,
"loss": 0.2573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2660328149795532,
"step": 2915,
"valid_targets_mean": 4360.2,
"valid_targets_min": 1551
},
{
"epoch": 5.2236135957066185,
"grad_norm": 0.5264725135537257,
"learning_rate": 7.363501564297302e-06,
"loss": 0.2503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2478117048740387,
"step": 2920,
"valid_targets_mean": 4145.1,
"valid_targets_min": 1811
},
{
"epoch": 5.232558139534884,
"grad_norm": 0.5015055063053451,
"learning_rate": 7.294468683039058e-06,
"loss": 0.2595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24327683448791504,
"step": 2925,
"valid_targets_mean": 4711.1,
"valid_targets_min": 714
},
{
"epoch": 5.241502683363149,
"grad_norm": 0.5747369854441176,
"learning_rate": 7.225688673239981e-06,
"loss": 0.2512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24569492042064667,
"step": 2930,
"valid_targets_mean": 4338.2,
"valid_targets_min": 687
},
{
"epoch": 5.2504472271914135,
"grad_norm": 0.558577994633376,
"learning_rate": 7.1571629037921804e-06,
"loss": 0.2526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28280454874038696,
"step": 2935,
"valid_targets_mean": 4211.2,
"valid_targets_min": 2352
},
{
"epoch": 5.259391771019678,
"grad_norm": 0.6144056807907267,
"learning_rate": 7.088892738527731e-06,
"loss": 0.2608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2709640562534332,
"step": 2940,
"valid_targets_mean": 4119.1,
"valid_targets_min": 1206
},
{
"epoch": 5.268336314847943,
"grad_norm": 0.5107272318888509,
"learning_rate": 7.020879536191571e-06,
"loss": 0.2497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26789391040802,
"step": 2945,
"valid_targets_mean": 4640.5,
"valid_targets_min": 1448
},
{
"epoch": 5.277280858676208,
"grad_norm": 0.5541009190577022,
"learning_rate": 6.953124650414447e-06,
"loss": 0.2512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2534041404724121,
"step": 2950,
"valid_targets_mean": 4751.1,
"valid_targets_min": 1213
},
{
"epoch": 5.286225402504472,
"grad_norm": 0.6514472569289943,
"learning_rate": 6.885629429685943e-06,
"loss": 0.2599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2853846251964569,
"step": 2955,
"valid_targets_mean": 4381.8,
"valid_targets_min": 1086
},
{
"epoch": 5.295169946332737,
"grad_norm": 0.5988322541910981,
"learning_rate": 6.818395217327696e-06,
"loss": 0.2577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25575023889541626,
"step": 2960,
"valid_targets_mean": 3193.8,
"valid_targets_min": 1521
},
{
"epoch": 5.304114490161002,
"grad_norm": 0.5670506850205758,
"learning_rate": 6.751423351466604e-06,
"loss": 0.2441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23857812583446503,
"step": 2965,
"valid_targets_mean": 4116.7,
"valid_targets_min": 2343
},
{
"epoch": 5.3130590339892665,
"grad_norm": 0.5218993251194615,
"learning_rate": 6.684715165008242e-06,
"loss": 0.2511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24250607192516327,
"step": 2970,
"valid_targets_mean": 4213.7,
"valid_targets_min": 712
},
{
"epoch": 5.322003577817531,
"grad_norm": 0.5569832821022914,
"learning_rate": 6.618271985610316e-06,
"loss": 0.2516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2601429224014282,
"step": 2975,
"valid_targets_mean": 4093.6,
"valid_targets_min": 1465
},
{
"epoch": 5.330948121645796,
"grad_norm": 0.5257447628225279,
"learning_rate": 6.552095135656211e-06,
"loss": 0.252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22466397285461426,
"step": 2980,
"valid_targets_mean": 4426.8,
"valid_targets_min": 1498
},
{
"epoch": 5.339892665474061,
"grad_norm": 0.5288226075745489,
"learning_rate": 6.486185932228732e-06,
"loss": 0.2495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23786196112632751,
"step": 2985,
"valid_targets_mean": 4234.4,
"valid_targets_min": 947
},
{
"epoch": 5.348837209302325,
"grad_norm": 0.5316983597863091,
"learning_rate": 6.420545687083823e-06,
"loss": 0.2453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2561112642288208,
"step": 2990,
"valid_targets_mean": 4393.5,
"valid_targets_min": 1639
},
{
"epoch": 5.35778175313059,
"grad_norm": 0.6336255850890024,
"learning_rate": 6.355175706624521e-06,
"loss": 0.2516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24200129508972168,
"step": 2995,
"valid_targets_mean": 2892.8,
"valid_targets_min": 1724
},
{
"epoch": 5.366726296958855,
"grad_norm": 0.5790999887623745,
"learning_rate": 6.290077291874923e-06,
"loss": 0.2472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25445109605789185,
"step": 3000,
"valid_targets_mean": 3687.9,
"valid_targets_min": 1561
},
{
"epoch": 5.375670840787119,
"grad_norm": 0.6224285293408105,
"learning_rate": 6.225251738454281e-06,
"loss": 0.2558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2375735342502594,
"step": 3005,
"valid_targets_mean": 3882.3,
"valid_targets_min": 1924
},
{
"epoch": 5.384615384615385,
"grad_norm": 0.5037477615762228,
"learning_rate": 6.160700336551246e-06,
"loss": 0.2484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22593946754932404,
"step": 3010,
"valid_targets_mean": 4476.9,
"valid_targets_min": 1419
},
{
"epoch": 5.39355992844365,
"grad_norm": 0.5857014550270156,
"learning_rate": 6.096424370898186e-06,
"loss": 0.2563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26964280009269714,
"step": 3015,
"valid_targets_mean": 3775.2,
"valid_targets_min": 942
},
{
"epoch": 5.402504472271914,
"grad_norm": 0.5658229988053839,
"learning_rate": 6.032425120745586e-06,
"loss": 0.255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2709835171699524,
"step": 3020,
"valid_targets_mean": 3667.1,
"valid_targets_min": 1957
},
{
"epoch": 5.411449016100179,
"grad_norm": 0.5988261907445214,
"learning_rate": 5.968703859836615e-06,
"loss": 0.2562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2751755118370056,
"step": 3025,
"valid_targets_mean": 3496.3,
"valid_targets_min": 671
},
{
"epoch": 5.420393559928444,
"grad_norm": 0.5141241348502327,
"learning_rate": 5.905261856381779e-06,
"loss": 0.257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2791970372200012,
"step": 3030,
"valid_targets_mean": 4357.8,
"valid_targets_min": 1171
},
{
"epoch": 5.4293381037567086,
"grad_norm": 0.5498788228367728,
"learning_rate": 5.8421003730336635e-06,
"loss": 0.2532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2511694133281708,
"step": 3035,
"valid_targets_mean": 3824.6,
"valid_targets_min": 1185
},
{
"epoch": 5.438282647584973,
"grad_norm": 0.6029343448549779,
"learning_rate": 5.77922066686182e-06,
"loss": 0.2482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.243141770362854,
"step": 3040,
"valid_targets_mean": 3373.0,
"valid_targets_min": 823
},
{
"epoch": 5.447227191413238,
"grad_norm": 0.5131367304880754,
"learning_rate": 5.716623989327723e-06,
"loss": 0.2504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2467704713344574,
"step": 3045,
"valid_targets_mean": 4253.5,
"valid_targets_min": 1483
},
{
"epoch": 5.456171735241503,
"grad_norm": 0.5805462950603849,
"learning_rate": 5.654311586259882e-06,
"loss": 0.25,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23988988995552063,
"step": 3050,
"valid_targets_mean": 4065.0,
"valid_targets_min": 2083
},
{
"epoch": 5.465116279069767,
"grad_norm": 0.5715523149741332,
"learning_rate": 5.592284697829049e-06,
"loss": 0.2435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2494080364704132,
"step": 3055,
"valid_targets_mean": 3334.1,
"valid_targets_min": 734
},
{
"epoch": 5.474060822898032,
"grad_norm": 0.5721433275869938,
"learning_rate": 5.5305445585235315e-06,
"loss": 0.2598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28742748498916626,
"step": 3060,
"valid_targets_mean": 3750.8,
"valid_targets_min": 1385
},
{
"epoch": 5.483005366726297,
"grad_norm": 0.5114459072142161,
"learning_rate": 5.469092397124609e-06,
"loss": 0.2354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2271006852388382,
"step": 3065,
"valid_targets_mean": 4397.1,
"valid_targets_min": 1489
},
{
"epoch": 5.4919499105545615,
"grad_norm": 0.5521229518692201,
"learning_rate": 5.407929436682098e-06,
"loss": 0.2433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25235363841056824,
"step": 3070,
"valid_targets_mean": 4136.6,
"valid_targets_min": 1627
},
{
"epoch": 5.500894454382826,
"grad_norm": 0.5402233613552551,
"learning_rate": 5.347056894490006e-06,
"loss": 0.2514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2618515193462372,
"step": 3075,
"valid_targets_mean": 4445.6,
"valid_targets_min": 1844
},
{
"epoch": 5.509838998211091,
"grad_norm": 0.5533934913144476,
"learning_rate": 5.286475982062283e-06,
"loss": 0.2572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26157045364379883,
"step": 3080,
"valid_targets_mean": 4031.0,
"valid_targets_min": 1056
},
{
"epoch": 5.518783542039356,
"grad_norm": 0.5110038510091776,
"learning_rate": 5.226187905108746e-06,
"loss": 0.2628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2799553871154785,
"step": 3085,
"valid_targets_mean": 4822.0,
"valid_targets_min": 1524
},
{
"epoch": 5.52772808586762,
"grad_norm": 0.6041299965242917,
"learning_rate": 5.166193863511046e-06,
"loss": 0.2478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25382912158966064,
"step": 3090,
"valid_targets_mean": 4463.2,
"valid_targets_min": 1625
},
{
"epoch": 5.536672629695886,
"grad_norm": 0.523055625256692,
"learning_rate": 5.106495051298815e-06,
"loss": 0.2601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26213690638542175,
"step": 3095,
"valid_targets_mean": 4872.1,
"valid_targets_min": 1339
},
{
"epoch": 5.545617173524151,
"grad_norm": 0.689189142486139,
"learning_rate": 5.047092656625887e-06,
"loss": 0.2464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22535747289657593,
"step": 3100,
"valid_targets_mean": 4960.2,
"valid_targets_min": 1725
},
{
"epoch": 5.554561717352415,
"grad_norm": 0.5703961451507539,
"learning_rate": 4.98798786174667e-06,
"loss": 0.2567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23777396976947784,
"step": 3105,
"valid_targets_mean": 3530.8,
"valid_targets_min": 1099
},
{
"epoch": 5.56350626118068,
"grad_norm": 0.5659413248498028,
"learning_rate": 4.9291818429925585e-06,
"loss": 0.2503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2758846580982208,
"step": 3110,
"valid_targets_mean": 3740.4,
"valid_targets_min": 1606
},
{
"epoch": 5.572450805008945,
"grad_norm": 0.6859304017050197,
"learning_rate": 4.8706757707486075e-06,
"loss": 0.2556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24378885328769684,
"step": 3115,
"valid_targets_mean": 4183.4,
"valid_targets_min": 1253
},
{
"epoch": 5.5813953488372094,
"grad_norm": 0.8010245971038674,
"learning_rate": 4.812470809430179e-06,
"loss": 0.2506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2438773214817047,
"step": 3120,
"valid_targets_mean": 4535.4,
"valid_targets_min": 1654
},
{
"epoch": 5.590339892665474,
"grad_norm": 0.48380553908118173,
"learning_rate": 4.754568117459788e-06,
"loss": 0.2514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23566769063472748,
"step": 3125,
"valid_targets_mean": 4967.9,
"valid_targets_min": 2282
},
{
"epoch": 5.599284436493739,
"grad_norm": 0.555628362724338,
"learning_rate": 4.69696884724403e-06,
"loss": 0.2587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26789629459381104,
"step": 3130,
"valid_targets_mean": 3930.6,
"valid_targets_min": 1612
},
{
"epoch": 5.608228980322004,
"grad_norm": 0.5726463627079651,
"learning_rate": 4.639674145150679e-06,
"loss": 0.2703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27078795433044434,
"step": 3135,
"valid_targets_mean": 4010.0,
"valid_targets_min": 2215
},
{
"epoch": 5.617173524150268,
"grad_norm": 0.5160136519489497,
"learning_rate": 4.582685151485826e-06,
"loss": 0.254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2637634873390198,
"step": 3140,
"valid_targets_mean": 4663.4,
"valid_targets_min": 1675
},
{
"epoch": 5.626118067978533,
"grad_norm": 0.5831172100665993,
"learning_rate": 4.526003000471238e-06,
"loss": 0.252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25619733333587646,
"step": 3145,
"valid_targets_mean": 3704.6,
"valid_targets_min": 1062
},
{
"epoch": 5.635062611806798,
"grad_norm": 0.5228549236039476,
"learning_rate": 4.469628820221723e-06,
"loss": 0.2481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25507116317749023,
"step": 3150,
"valid_targets_mean": 4272.4,
"valid_targets_min": 1740
},
{
"epoch": 5.644007155635062,
"grad_norm": 0.5442853215358627,
"learning_rate": 4.4135637327227365e-06,
"loss": 0.2489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24775390326976776,
"step": 3155,
"valid_targets_mean": 4432.6,
"valid_targets_min": 2006
},
{
"epoch": 5.652951699463327,
"grad_norm": 0.6205216192517241,
"learning_rate": 4.357808853808014e-06,
"loss": 0.2484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26101428270339966,
"step": 3160,
"valid_targets_mean": 3737.1,
"valid_targets_min": 644
},
{
"epoch": 5.661896243291592,
"grad_norm": 0.5132795398550757,
"learning_rate": 4.302365293137383e-06,
"loss": 0.2558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2703346014022827,
"step": 3165,
"valid_targets_mean": 4475.0,
"valid_targets_min": 1557
},
{
"epoch": 5.6708407871198565,
"grad_norm": 0.5446296655760452,
"learning_rate": 4.247234154174649e-06,
"loss": 0.2565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.261799693107605,
"step": 3170,
"valid_targets_mean": 4172.8,
"valid_targets_min": 823
},
{
"epoch": 5.679785330948121,
"grad_norm": 0.5219059793104994,
"learning_rate": 4.192416534165666e-06,
"loss": 0.2551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2537573277950287,
"step": 3175,
"valid_targets_mean": 4267.9,
"valid_targets_min": 579
},
{
"epoch": 5.688729874776387,
"grad_norm": 0.5461673557485848,
"learning_rate": 4.137913524116488e-06,
"loss": 0.2347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2290881723165512,
"step": 3180,
"valid_targets_mean": 4211.2,
"valid_targets_min": 818
},
{
"epoch": 5.6976744186046515,
"grad_norm": 0.517997717225711,
"learning_rate": 4.083726208771653e-06,
"loss": 0.2514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25634273886680603,
"step": 3185,
"valid_targets_mean": 4610.6,
"valid_targets_min": 1674
},
{
"epoch": 5.706618962432916,
"grad_norm": 0.5213271875253821,
"learning_rate": 4.0298556665925996e-06,
"loss": 0.2611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27138853073120117,
"step": 3190,
"valid_targets_mean": 4529.8,
"valid_targets_min": 1865
},
{
"epoch": 5.715563506261181,
"grad_norm": 0.546634737650849,
"learning_rate": 3.976302969736183e-06,
"loss": 0.2587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2496567666530609,
"step": 3195,
"valid_targets_mean": 3815.2,
"valid_targets_min": 932
},
{
"epoch": 5.724508050089446,
"grad_norm": 0.5258705612970683,
"learning_rate": 3.923069184033357e-06,
"loss": 0.2509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23271816968917847,
"step": 3200,
"valid_targets_mean": 4088.2,
"valid_targets_min": 2116
},
{
"epoch": 5.73345259391771,
"grad_norm": 0.5867279766106626,
"learning_rate": 3.870155368967963e-06,
"loss": 0.2536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25471609830856323,
"step": 3205,
"valid_targets_mean": 3395.8,
"valid_targets_min": 1808
},
{
"epoch": 5.742397137745975,
"grad_norm": 0.5656851680671992,
"learning_rate": 3.8175625776556354e-06,
"loss": 0.2578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26453453302383423,
"step": 3210,
"valid_targets_mean": 4103.0,
"valid_targets_min": 786
},
{
"epoch": 5.75134168157424,
"grad_norm": 0.5284899901213221,
"learning_rate": 3.76529185682283e-06,
"loss": 0.2562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24859002232551575,
"step": 3215,
"valid_targets_mean": 4613.4,
"valid_targets_min": 1303
},
{
"epoch": 5.7602862254025045,
"grad_norm": 0.5635253947920319,
"learning_rate": 3.7133442467860215e-06,
"loss": 0.2532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24023880064487457,
"step": 3220,
"valid_targets_mean": 3926.2,
"valid_targets_min": 822
},
{
"epoch": 5.769230769230769,
"grad_norm": 0.6683290106994736,
"learning_rate": 3.6617207814309686e-06,
"loss": 0.2535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24666255712509155,
"step": 3225,
"valid_targets_mean": 3464.2,
"valid_targets_min": 1681
},
{
"epoch": 5.778175313059034,
"grad_norm": 0.5711365259269587,
"learning_rate": 3.610422488192169e-06,
"loss": 0.2474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22737815976142883,
"step": 3230,
"valid_targets_mean": 3654.8,
"valid_targets_min": 1601
},
{
"epoch": 5.787119856887299,
"grad_norm": 0.5262566407141166,
"learning_rate": 3.559450388032355e-06,
"loss": 0.2405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23528073728084564,
"step": 3235,
"valid_targets_mean": 4000.4,
"valid_targets_min": 1795
},
{
"epoch": 5.796064400715563,
"grad_norm": 0.5857070524704964,
"learning_rate": 3.508805495422247e-06,
"loss": 0.2497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25850462913513184,
"step": 3240,
"valid_targets_mean": 3548.4,
"valid_targets_min": 2027
},
{
"epoch": 5.805008944543828,
"grad_norm": 0.5422739378299365,
"learning_rate": 3.4584888183203134e-06,
"loss": 0.2454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23234635591506958,
"step": 3245,
"valid_targets_mean": 3974.6,
"valid_targets_min": 1831
},
{
"epoch": 5.813953488372093,
"grad_norm": 0.5467138164186622,
"learning_rate": 3.4085013581527295e-06,
"loss": 0.2502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25337696075439453,
"step": 3250,
"valid_targets_mean": 3679.7,
"valid_targets_min": 1793
},
{
"epoch": 5.822898032200357,
"grad_norm": 0.5923423600872293,
"learning_rate": 3.3588441097934223e-06,
"loss": 0.2552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27606481313705444,
"step": 3255,
"valid_targets_mean": 4041.6,
"valid_targets_min": 1902
},
{
"epoch": 5.831842576028622,
"grad_norm": 0.544712722817465,
"learning_rate": 3.30951806154431e-06,
"loss": 0.2573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24701544642448425,
"step": 3260,
"valid_targets_mean": 4252.6,
"valid_targets_min": 1603
},
{
"epoch": 5.840787119856888,
"grad_norm": 0.5682646260679644,
"learning_rate": 3.260524195115595e-06,
"loss": 0.2527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2743680477142334,
"step": 3265,
"valid_targets_mean": 4033.4,
"valid_targets_min": 1567
},
{
"epoch": 5.849731663685152,
"grad_norm": 0.5053561115203649,
"learning_rate": 3.2118634856062546e-06,
"loss": 0.2515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25195997953414917,
"step": 3270,
"valid_targets_mean": 4670.6,
"valid_targets_min": 1711
},
{
"epoch": 5.858676207513417,
"grad_norm": 0.5720698542136006,
"learning_rate": 3.163536901484601e-06,
"loss": 0.2579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25598081946372986,
"step": 3275,
"valid_targets_mean": 3693.4,
"valid_targets_min": 850
},
{
"epoch": 5.867620751341682,
"grad_norm": 0.5504159278631617,
"learning_rate": 3.115545404569045e-06,
"loss": 0.2491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2605506181716919,
"step": 3280,
"valid_targets_mean": 3985.3,
"valid_targets_min": 1494
},
{
"epoch": 5.8765652951699465,
"grad_norm": 0.5073092549610757,
"learning_rate": 3.0678899500089244e-06,
"loss": 0.2593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28743916749954224,
"step": 3285,
"valid_targets_mean": 5028.8,
"valid_targets_min": 2241
},
{
"epoch": 5.885509838998211,
"grad_norm": 0.5340456565641353,
"learning_rate": 3.0205714862655135e-06,
"loss": 0.2539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2738155722618103,
"step": 3290,
"valid_targets_mean": 4406.5,
"valid_targets_min": 1014
},
{
"epoch": 5.894454382826476,
"grad_norm": 0.5891360814807866,
"learning_rate": 2.973590955093124e-06,
"loss": 0.2584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26489949226379395,
"step": 3295,
"valid_targets_mean": 3631.4,
"valid_targets_min": 1316
},
{
"epoch": 5.903398926654741,
"grad_norm": 0.606826380313794,
"learning_rate": 2.9269492915203735e-06,
"loss": 0.2528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28875553607940674,
"step": 3300,
"valid_targets_mean": 3582.3,
"valid_targets_min": 748
},
{
"epoch": 5.912343470483005,
"grad_norm": 0.5117519052350044,
"learning_rate": 2.880647423831591e-06,
"loss": 0.2548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2642664909362793,
"step": 3305,
"valid_targets_mean": 5080.2,
"valid_targets_min": 747
},
{
"epoch": 5.92128801431127,
"grad_norm": 0.5806379654175979,
"learning_rate": 2.8346862735483215e-06,
"loss": 0.2522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2645312547683716,
"step": 3310,
"valid_targets_mean": 3762.3,
"valid_targets_min": 1805
},
{
"epoch": 5.930232558139535,
"grad_norm": 0.5311509065424678,
"learning_rate": 2.789066755410994e-06,
"loss": 0.2488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2585093379020691,
"step": 3315,
"valid_targets_mean": 4278.2,
"valid_targets_min": 1326
},
{
"epoch": 5.9391771019677995,
"grad_norm": 0.5936285800316835,
"learning_rate": 2.7437897773607102e-06,
"loss": 0.2559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26041656732559204,
"step": 3320,
"valid_targets_mean": 3442.7,
"valid_targets_min": 1502
},
{
"epoch": 5.948121645796064,
"grad_norm": 0.5459969266201287,
"learning_rate": 2.698856240521173e-06,
"loss": 0.2566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25794172286987305,
"step": 3325,
"valid_targets_mean": 4014.2,
"valid_targets_min": 1551
},
{
"epoch": 5.957066189624329,
"grad_norm": 0.5630581255206843,
"learning_rate": 2.6542670391807667e-06,
"loss": 0.2533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24545322358608246,
"step": 3330,
"valid_targets_mean": 3481.9,
"valid_targets_min": 1557
},
{
"epoch": 5.966010733452594,
"grad_norm": 0.5799194413488256,
"learning_rate": 2.610023060774749e-06,
"loss": 0.2549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2724427580833435,
"step": 3335,
"valid_targets_mean": 3878.4,
"valid_targets_min": 702
},
{
"epoch": 5.974955277280858,
"grad_norm": 0.5740945458943522,
"learning_rate": 2.566125185867576e-06,
"loss": 0.2469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23313261568546295,
"step": 3340,
"valid_targets_mean": 3677.9,
"valid_targets_min": 923
},
{
"epoch": 5.983899821109123,
"grad_norm": 0.4939353323910504,
"learning_rate": 2.5225742881354043e-06,
"loss": 0.2455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23637865483760834,
"step": 3345,
"valid_targets_mean": 5144.5,
"valid_targets_min": 2196
},
{
"epoch": 5.992844364937389,
"grad_norm": 0.5709249769648037,
"learning_rate": 2.479371234348682e-06,
"loss": 0.2718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2716667056083679,
"step": 3350,
"valid_targets_mean": 4413.6,
"valid_targets_min": 1591
},
{
"epoch": 6.001788908765653,
"grad_norm": 0.49922306688966933,
"learning_rate": 2.4365168843549e-06,
"loss": 0.2583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24928270280361176,
"step": 3355,
"valid_targets_mean": 4612.2,
"valid_targets_min": 1207
},
{
"epoch": 6.010733452593918,
"grad_norm": 0.5555093196620423,
"learning_rate": 2.3940120910614774e-06,
"loss": 0.2536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2676859498023987,
"step": 3360,
"valid_targets_mean": 3853.4,
"valid_targets_min": 1449
},
{
"epoch": 6.019677996422183,
"grad_norm": 0.5566602842743498,
"learning_rate": 2.351857700418807e-06,
"loss": 0.241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2452341467142105,
"step": 3365,
"valid_targets_mean": 4434.4,
"valid_targets_min": 777
},
{
"epoch": 6.028622540250447,
"grad_norm": 0.5088695531600443,
"learning_rate": 2.310054551403391e-06,
"loss": 0.2387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2538371682167053,
"step": 3370,
"valid_targets_mean": 4775.4,
"valid_targets_min": 1902
},
{
"epoch": 6.037567084078712,
"grad_norm": 0.5558924991251052,
"learning_rate": 2.2686034760011656e-06,
"loss": 0.2435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23813003301620483,
"step": 3375,
"valid_targets_mean": 3898.2,
"valid_targets_min": 1674
},
{
"epoch": 6.046511627906977,
"grad_norm": 0.5591093005835225,
"learning_rate": 2.2275052991909218e-06,
"loss": 0.2417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21672865748405457,
"step": 3380,
"valid_targets_mean": 4234.8,
"valid_targets_min": 671
},
{
"epoch": 6.0554561717352415,
"grad_norm": 0.5260886376788583,
"learning_rate": 2.186760838927897e-06,
"loss": 0.2507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22722241282463074,
"step": 3385,
"valid_targets_mean": 4410.5,
"valid_targets_min": 575
},
{
"epoch": 6.064400715563506,
"grad_norm": 0.5613980727726008,
"learning_rate": 2.146370906127506e-06,
"loss": 0.2408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2486397624015808,
"step": 3390,
"valid_targets_mean": 3953.5,
"valid_targets_min": 1297
},
{
"epoch": 6.073345259391771,
"grad_norm": 0.5718364438676335,
"learning_rate": 2.1063363046491813e-06,
"loss": 0.2404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24342885613441467,
"step": 3395,
"valid_targets_mean": 4326.2,
"valid_targets_min": 1784
},
{
"epoch": 6.082289803220036,
"grad_norm": 0.5484733914155208,
"learning_rate": 2.0666578312803942e-06,
"loss": 0.2488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23995618522167206,
"step": 3400,
"valid_targets_mean": 4243.8,
"valid_targets_min": 1656
},
{
"epoch": 6.0912343470483,
"grad_norm": 0.6076003177346635,
"learning_rate": 2.0273362757207726e-06,
"loss": 0.2529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2636367678642273,
"step": 3405,
"valid_targets_mean": 3371.1,
"valid_targets_min": 700
},
{
"epoch": 6.100178890876565,
"grad_norm": 0.5364865052473711,
"learning_rate": 1.988372420566416e-06,
"loss": 0.2525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2631525993347168,
"step": 3410,
"valid_targets_mean": 4552.2,
"valid_targets_min": 527
},
{
"epoch": 6.10912343470483,
"grad_norm": 0.5382573273538706,
"learning_rate": 1.9497670412942835e-06,
"loss": 0.2434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25336796045303345,
"step": 3415,
"valid_targets_mean": 4031.2,
"valid_targets_min": 1500
},
{
"epoch": 6.1180679785330945,
"grad_norm": 0.5332393694448714,
"learning_rate": 1.9115209062467954e-06,
"loss": 0.248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25488486886024475,
"step": 3420,
"valid_targets_mean": 4084.2,
"valid_targets_min": 1073
},
{
"epoch": 6.127012522361359,
"grad_norm": 0.5822463874616248,
"learning_rate": 1.8736347766165086e-06,
"loss": 0.2415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25610625743865967,
"step": 3425,
"valid_targets_mean": 3508.5,
"valid_targets_min": 644
},
{
"epoch": 6.135957066189624,
"grad_norm": 0.516320931889104,
"learning_rate": 1.8361094064309993e-06,
"loss": 0.2523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26783958077430725,
"step": 3430,
"valid_targets_mean": 4032.3,
"valid_targets_min": 1287
},
{
"epoch": 6.1449016100178895,
"grad_norm": 0.5331137313762538,
"learning_rate": 1.7989455425378266e-06,
"loss": 0.2499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2545079290866852,
"step": 3435,
"valid_targets_mean": 4148.0,
"valid_targets_min": 1830
},
{
"epoch": 6.153846153846154,
"grad_norm": 0.511372820106071,
"learning_rate": 1.7621439245896943e-06,
"loss": 0.2476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25283390283584595,
"step": 3440,
"valid_targets_mean": 4522.1,
"valid_targets_min": 1614
},
{
"epoch": 6.162790697674419,
"grad_norm": 0.642569852208313,
"learning_rate": 1.7257052850296996e-06,
"loss": 0.2357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24894089996814728,
"step": 3445,
"valid_targets_mean": 3752.3,
"valid_targets_min": 697
},
{
"epoch": 6.171735241502684,
"grad_norm": 0.5666144603072086,
"learning_rate": 1.6896303490767829e-06,
"loss": 0.2418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24932259321212769,
"step": 3450,
"valid_targets_mean": 3750.7,
"valid_targets_min": 1707
},
{
"epoch": 6.180679785330948,
"grad_norm": 0.5143915126274258,
"learning_rate": 1.6539198347112884e-06,
"loss": 0.245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2590116560459137,
"step": 3455,
"valid_targets_mean": 4465.8,
"valid_targets_min": 1477
},
{
"epoch": 6.189624329159213,
"grad_norm": 0.5657080432140568,
"learning_rate": 1.6185744526606706e-06,
"loss": 0.2248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22567050158977509,
"step": 3460,
"valid_targets_mean": 4094.5,
"valid_targets_min": 1981
},
{
"epoch": 6.198568872987478,
"grad_norm": 0.6089266321722668,
"learning_rate": 1.583594906385335e-06,
"loss": 0.2516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2387622594833374,
"step": 3465,
"valid_targets_mean": 4029.4,
"valid_targets_min": 1928
},
{
"epoch": 6.207513416815742,
"grad_norm": 0.4852359479822391,
"learning_rate": 1.548981892064665e-06,
"loss": 0.2574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24283546209335327,
"step": 3470,
"valid_targets_mean": 5261.4,
"valid_targets_min": 1062
},
{
"epoch": 6.216457960644007,
"grad_norm": 0.4537685331486559,
"learning_rate": 1.5147360985831516e-06,
"loss": 0.2465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21774128079414368,
"step": 3475,
"valid_targets_mean": 5369.9,
"valid_targets_min": 3175
},
{
"epoch": 6.225402504472272,
"grad_norm": 0.5236024964731602,
"learning_rate": 1.4808582075166778e-06,
"loss": 0.2487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25047406554222107,
"step": 3480,
"valid_targets_mean": 4213.7,
"valid_targets_min": 1750
},
{
"epoch": 6.2343470483005365,
"grad_norm": 0.594758118058126,
"learning_rate": 1.447348893118965e-06,
"loss": 0.2446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2589150667190552,
"step": 3485,
"valid_targets_mean": 3918.9,
"valid_targets_min": 2197
},
{
"epoch": 6.243291592128801,
"grad_norm": 0.5390376277621793,
"learning_rate": 1.4142088223081408e-06,
"loss": 0.2441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24606183171272278,
"step": 3490,
"valid_targets_mean": 4628.6,
"valid_targets_min": 2230
},
{
"epoch": 6.252236135957066,
"grad_norm": 0.515173541243895,
"learning_rate": 1.3814386546534864e-06,
"loss": 0.253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2567700147628784,
"step": 3495,
"valid_targets_mean": 4171.9,
"valid_targets_min": 1779
},
{
"epoch": 6.261180679785331,
"grad_norm": 0.5308974195526618,
"learning_rate": 1.3490390423622856e-06,
"loss": 0.2427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22043094038963318,
"step": 3500,
"valid_targets_mean": 4421.9,
"valid_targets_min": 1412
},
{
"epoch": 6.270125223613595,
"grad_norm": 0.5045875631623113,
"learning_rate": 1.3170106302668616e-06,
"loss": 0.2455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23024529218673706,
"step": 3505,
"valid_targets_mean": 4453.3,
"valid_targets_min": 1660
},
{
"epoch": 6.27906976744186,
"grad_norm": 0.5448476578553636,
"learning_rate": 1.2853540558117272e-06,
"loss": 0.2454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24999341368675232,
"step": 3510,
"valid_targets_mean": 4241.5,
"valid_targets_min": 1712
},
{
"epoch": 6.288014311270125,
"grad_norm": 0.5759478717126266,
"learning_rate": 1.254069949040917e-06,
"loss": 0.254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25016283988952637,
"step": 3515,
"valid_targets_mean": 3847.2,
"valid_targets_min": 669
},
{
"epoch": 6.29695885509839,
"grad_norm": 0.542415226047018,
"learning_rate": 1.2231589325854354e-06,
"loss": 0.2474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2293107956647873,
"step": 3520,
"valid_targets_mean": 4337.9,
"valid_targets_min": 1502
},
{
"epoch": 6.305903398926655,
"grad_norm": 0.5091719583649115,
"learning_rate": 1.1926216216508735e-06,
"loss": 0.2565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25717687606811523,
"step": 3525,
"valid_targets_mean": 4432.9,
"valid_targets_min": 737
},
{
"epoch": 6.31484794275492,
"grad_norm": 0.4941207542833962,
"learning_rate": 1.162458624005145e-06,
"loss": 0.2525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24258843064308167,
"step": 3530,
"valid_targets_mean": 4559.1,
"valid_targets_min": 1824
},
{
"epoch": 6.3237924865831845,
"grad_norm": 0.5967014559288393,
"learning_rate": 1.1326705399664207e-06,
"loss": 0.2451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23474426567554474,
"step": 3535,
"valid_targets_mean": 3250.2,
"valid_targets_min": 1600
},
{
"epoch": 6.332737030411449,
"grad_norm": 0.5207543513220922,
"learning_rate": 1.103257962391151e-06,
"loss": 0.237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24193906784057617,
"step": 3540,
"valid_targets_mean": 4304.2,
"valid_targets_min": 763
},
{
"epoch": 6.341681574239714,
"grad_norm": 0.5920796448944554,
"learning_rate": 1.0742214766622938e-06,
"loss": 0.2523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2564089596271515,
"step": 3545,
"valid_targets_mean": 3882.9,
"valid_targets_min": 579
},
{
"epoch": 6.350626118067979,
"grad_norm": 0.5232360068927403,
"learning_rate": 1.0455616606776363e-06,
"loss": 0.2395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2539476156234741,
"step": 3550,
"valid_targets_mean": 3925.2,
"valid_targets_min": 805
},
{
"epoch": 6.359570661896243,
"grad_norm": 0.4866461666276335,
"learning_rate": 1.0172790848383141e-06,
"loss": 0.2435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24338996410369873,
"step": 3555,
"valid_targets_mean": 4900.0,
"valid_targets_min": 2526
},
{
"epoch": 6.368515205724508,
"grad_norm": 0.5299824855199575,
"learning_rate": 9.893743120374543e-07,
"loss": 0.2465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24363267421722412,
"step": 3560,
"valid_targets_mean": 3905.7,
"valid_targets_min": 1083
},
{
"epoch": 6.377459749552773,
"grad_norm": 0.5642560950283441,
"learning_rate": 9.618478976489709e-07,
"loss": 0.2517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23905110359191895,
"step": 3565,
"valid_targets_mean": 4138.6,
"valid_targets_min": 856
},
{
"epoch": 6.386404293381037,
"grad_norm": 0.5115018928118804,
"learning_rate": 9.347003895165052e-07,
"loss": 0.2448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26956266164779663,
"step": 3570,
"valid_targets_mean": 5040.1,
"valid_targets_min": 1505
},
{
"epoch": 6.395348837209302,
"grad_norm": 0.5710236424221047,
"learning_rate": 9.079323279425245e-07,
"loss": 0.2532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2561646103858948,
"step": 3575,
"valid_targets_mean": 4197.1,
"valid_targets_min": 1158
},
{
"epoch": 6.404293381037567,
"grad_norm": 0.5054247186866906,
"learning_rate": 8.815442456775835e-07,
"loss": 0.249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25438791513442993,
"step": 3580,
"valid_targets_mean": 4520.4,
"valid_targets_min": 1430
},
{
"epoch": 6.4132379248658316,
"grad_norm": 0.5325941678660696,
"learning_rate": 8.555366679097043e-07,
"loss": 0.2508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24359354376792908,
"step": 3585,
"valid_targets_mean": 4353.4,
"valid_targets_min": 1339
},
{
"epoch": 6.422182468694096,
"grad_norm": 0.5189637715129809,
"learning_rate": 8.29910112253931e-07,
"loss": 0.2492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2488621473312378,
"step": 3590,
"valid_targets_mean": 4283.8,
"valid_targets_min": 2266
},
{
"epoch": 6.431127012522361,
"grad_norm": 0.5866424542601351,
"learning_rate": 8.046650887420227e-07,
"loss": 0.2456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26135364174842834,
"step": 3595,
"valid_targets_mean": 3206.2,
"valid_targets_min": 1617
},
{
"epoch": 6.440071556350626,
"grad_norm": 0.5499318781593886,
"learning_rate": 7.798020998123101e-07,
"loss": 0.2471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2563382685184479,
"step": 3600,
"valid_targets_mean": 4393.6,
"valid_targets_min": 710
},
{
"epoch": 6.449016100178891,
"grad_norm": 0.5310211310663512,
"learning_rate": 7.55321640299691e-07,
"loss": 0.248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25477510690689087,
"step": 3605,
"valid_targets_mean": 4263.4,
"valid_targets_min": 2011
},
{
"epoch": 6.457960644007156,
"grad_norm": 0.560059078942515,
"learning_rate": 7.312241974257861e-07,
"loss": 0.2373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2293008267879486,
"step": 3610,
"valid_targets_mean": 3617.6,
"valid_targets_min": 1590
},
{
"epoch": 6.466905187835421,
"grad_norm": 0.5267478780824102,
"learning_rate": 7.075102507892295e-07,
"loss": 0.247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23703113198280334,
"step": 3615,
"valid_targets_mean": 4467.4,
"valid_targets_min": 1654
},
{
"epoch": 6.475849731663685,
"grad_norm": 0.5537266130087152,
"learning_rate": 6.841802723561408e-07,
"loss": 0.2325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.241033136844635,
"step": 3620,
"valid_targets_mean": 4434.5,
"valid_targets_min": 680
},
{
"epoch": 6.48479427549195,
"grad_norm": 0.5258675827998067,
"learning_rate": 6.612347264507257e-07,
"loss": 0.2569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23057600855827332,
"step": 3625,
"valid_targets_mean": 4508.6,
"valid_targets_min": 1675
},
{
"epoch": 6.493738819320215,
"grad_norm": 0.6060163526427282,
"learning_rate": 6.386740697460281e-07,
"loss": 0.2582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.266754686832428,
"step": 3630,
"valid_targets_mean": 3405.2,
"valid_targets_min": 1494
},
{
"epoch": 6.5026833631484795,
"grad_norm": 1.243756853379082,
"learning_rate": 6.164987512548415e-07,
"loss": 0.2425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24251213669776917,
"step": 3635,
"valid_targets_mean": 4815.0,
"valid_targets_min": 748
},
{
"epoch": 6.511627906976744,
"grad_norm": 0.4905512612650833,
"learning_rate": 5.947092123207854e-07,
"loss": 0.2458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2418278455734253,
"step": 3640,
"valid_targets_mean": 4851.4,
"valid_targets_min": 1723
},
{
"epoch": 6.520572450805009,
"grad_norm": 0.6977038416301831,
"learning_rate": 5.733058866095143e-07,
"loss": 0.2439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25958025455474854,
"step": 3645,
"valid_targets_mean": 3321.6,
"valid_targets_min": 864
},
{
"epoch": 6.529516994633274,
"grad_norm": 0.5620237411481044,
"learning_rate": 5.522892001000801e-07,
"loss": 0.247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25899815559387207,
"step": 3650,
"valid_targets_mean": 3941.6,
"valid_targets_min": 645
},
{
"epoch": 6.538461538461538,
"grad_norm": 0.5931969111624182,
"learning_rate": 5.316595710764594e-07,
"loss": 0.2485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2590034008026123,
"step": 3655,
"valid_targets_mean": 3292.1,
"valid_targets_min": 1140
},
{
"epoch": 6.547406082289803,
"grad_norm": 0.5619298957004911,
"learning_rate": 5.114174101192282e-07,
"loss": 0.2551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25470370054244995,
"step": 3660,
"valid_targets_mean": 4170.2,
"valid_targets_min": 1529
},
{
"epoch": 6.556350626118068,
"grad_norm": 0.5338888004490264,
"learning_rate": 4.915631200973958e-07,
"loss": 0.2489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23330549895763397,
"step": 3665,
"valid_targets_mean": 4152.4,
"valid_targets_min": 1548
},
{
"epoch": 6.565295169946332,
"grad_norm": 0.5029110114373035,
"learning_rate": 4.7209709616038214e-07,
"loss": 0.2413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2532098591327667,
"step": 3670,
"valid_targets_mean": 4623.9,
"valid_targets_min": 1504
},
{
"epoch": 6.574239713774597,
"grad_norm": 0.5553623774184658,
"learning_rate": 4.5301972573014163e-07,
"loss": 0.2498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25203073024749756,
"step": 3675,
"valid_targets_mean": 4177.2,
"valid_targets_min": 954
},
{
"epoch": 6.583184257602863,
"grad_norm": 0.5645036118540637,
"learning_rate": 4.3433138849347854e-07,
"loss": 0.255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25823813676834106,
"step": 3680,
"valid_targets_mean": 4475.9,
"valid_targets_min": 2315
},
{
"epoch": 6.592128801431127,
"grad_norm": 0.5703760997362556,
"learning_rate": 4.1603245639446845e-07,
"loss": 0.2475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24437285959720612,
"step": 3685,
"valid_targets_mean": 4044.4,
"valid_targets_min": 1603
},
{
"epoch": 6.601073345259392,
"grad_norm": 0.5422079585581118,
"learning_rate": 3.981232936270596e-07,
"loss": 0.2324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23096385598182678,
"step": 3690,
"valid_targets_mean": 4084.5,
"valid_targets_min": 2212
},
{
"epoch": 6.610017889087657,
"grad_norm": 0.560268180958077,
"learning_rate": 3.806042566278345e-07,
"loss": 0.2623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3074514865875244,
"step": 3695,
"valid_targets_mean": 4345.9,
"valid_targets_min": 1526
},
{
"epoch": 6.618962432915922,
"grad_norm": 0.5139061022298529,
"learning_rate": 3.6347569406890213e-07,
"loss": 0.2439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24795208871364594,
"step": 3700,
"valid_targets_mean": 4453.6,
"valid_targets_min": 2173
},
{
"epoch": 6.627906976744186,
"grad_norm": 0.5732304901299363,
"learning_rate": 3.467379468509746e-07,
"loss": 0.2512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2507464289665222,
"step": 3705,
"valid_targets_mean": 3565.4,
"valid_targets_min": 1726
},
{
"epoch": 6.636851520572451,
"grad_norm": 0.5275323599021355,
"learning_rate": 3.3039134809656594e-07,
"loss": 0.238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25029295682907104,
"step": 3710,
"valid_targets_mean": 4312.4,
"valid_targets_min": 1826
},
{
"epoch": 6.645796064400716,
"grad_norm": 0.5142402557074688,
"learning_rate": 3.144362231433706e-07,
"loss": 0.2442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24940407276153564,
"step": 3715,
"valid_targets_mean": 4422.9,
"valid_targets_min": 747
},
{
"epoch": 6.65474060822898,
"grad_norm": 0.5730417596248877,
"learning_rate": 2.9887288953778903e-07,
"loss": 0.2564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2630217671394348,
"step": 3720,
"valid_targets_mean": 4032.0,
"valid_targets_min": 1372
},
{
"epoch": 6.663685152057245,
"grad_norm": 0.554437674633871,
"learning_rate": 2.8370165702860553e-07,
"loss": 0.2451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26767322421073914,
"step": 3725,
"valid_targets_mean": 4060.4,
"valid_targets_min": 1319
},
{
"epoch": 6.67262969588551,
"grad_norm": 0.5716086807724999,
"learning_rate": 2.6892282756082246e-07,
"loss": 0.246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23963013291358948,
"step": 3730,
"valid_targets_mean": 3399.0,
"valid_targets_min": 691
},
{
"epoch": 6.6815742397137745,
"grad_norm": 0.5079641007584742,
"learning_rate": 2.545366952696582e-07,
"loss": 0.2441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2464374452829361,
"step": 3735,
"valid_targets_mean": 4499.1,
"valid_targets_min": 1971
},
{
"epoch": 6.690518783542039,
"grad_norm": 0.9402640194261683,
"learning_rate": 2.405435464746786e-07,
"loss": 0.264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27681803703308105,
"step": 3740,
"valid_targets_mean": 3995.8,
"valid_targets_min": 656
},
{
"epoch": 6.699463327370304,
"grad_norm": 0.5895147291124684,
"learning_rate": 2.2694365967411258e-07,
"loss": 0.2572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26021093130111694,
"step": 3745,
"valid_targets_mean": 3512.1,
"valid_targets_min": 922
},
{
"epoch": 6.708407871198569,
"grad_norm": 0.5247512021335333,
"learning_rate": 2.137373055393055e-07,
"loss": 0.2525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2672116756439209,
"step": 3750,
"valid_targets_mean": 4461.2,
"valid_targets_min": 1031
},
{
"epoch": 6.717352415026833,
"grad_norm": 0.5648115569047794,
"learning_rate": 2.009247469093234e-07,
"loss": 0.2372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24653485417366028,
"step": 3755,
"valid_targets_mean": 3891.8,
"valid_targets_min": 1329
},
{
"epoch": 6.726296958855098,
"grad_norm": 0.5935904883224387,
"learning_rate": 1.8850623878573505e-07,
"loss": 0.2541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2428642213344574,
"step": 3760,
"valid_targets_mean": 3706.3,
"valid_targets_min": 931
},
{
"epoch": 6.735241502683364,
"grad_norm": 0.5282006716958451,
"learning_rate": 1.7648202832752924e-07,
"loss": 0.2583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22287273406982422,
"step": 3765,
"valid_targets_mean": 4499.3,
"valid_targets_min": 1662
},
{
"epoch": 6.7441860465116275,
"grad_norm": 0.5697571140348834,
"learning_rate": 1.6485235484619665e-07,
"loss": 0.2428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25361984968185425,
"step": 3770,
"valid_targets_mean": 3464.8,
"valid_targets_min": 1843
},
{
"epoch": 6.753130590339893,
"grad_norm": 0.561107497561089,
"learning_rate": 1.5361744980096905e-07,
"loss": 0.2382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23007211089134216,
"step": 3775,
"valid_targets_mean": 3861.9,
"valid_targets_min": 1742
},
{
"epoch": 6.762075134168158,
"grad_norm": 0.5240522175257502,
"learning_rate": 1.427775367942097e-07,
"loss": 0.2564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25991159677505493,
"step": 3780,
"valid_targets_mean": 4519.6,
"valid_targets_min": 1936
},
{
"epoch": 6.7710196779964225,
"grad_norm": 0.5553928938449468,
"learning_rate": 1.3233283156696142e-07,
"loss": 0.2437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2548370659351349,
"step": 3785,
"valid_targets_mean": 3997.4,
"valid_targets_min": 621
},
{
"epoch": 6.779964221824687,
"grad_norm": 0.5074568016914366,
"learning_rate": 1.222835419946633e-07,
"loss": 0.252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23944196105003357,
"step": 3790,
"valid_targets_mean": 5238.7,
"valid_targets_min": 2620
},
{
"epoch": 6.788908765652952,
"grad_norm": 0.5333184632049403,
"learning_rate": 1.1262986808300291e-07,
"loss": 0.2485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25998786091804504,
"step": 3795,
"valid_targets_mean": 4385.2,
"valid_targets_min": 1617
},
{
"epoch": 6.797853309481217,
"grad_norm": 0.5068220624841174,
"learning_rate": 1.0337200196393505e-07,
"loss": 0.2577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25370797514915466,
"step": 3800,
"valid_targets_mean": 4350.8,
"valid_targets_min": 1473
},
{
"epoch": 6.806797853309481,
"grad_norm": 0.5340749980997674,
"learning_rate": 9.451012789186476e-08,
"loss": 0.2433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24803949892520905,
"step": 3805,
"valid_targets_mean": 4403.3,
"valid_targets_min": 784
},
{
"epoch": 6.815742397137746,
"grad_norm": 0.5465845662554875,
"learning_rate": 8.604442223998144e-08,
"loss": 0.2621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28449052572250366,
"step": 3810,
"valid_targets_mean": 4181.7,
"valid_targets_min": 1019
},
{
"epoch": 6.824686940966011,
"grad_norm": 0.5740109665058152,
"learning_rate": 7.797505349673496e-08,
"loss": 0.2428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24289534986019135,
"step": 3815,
"valid_targets_mean": 3507.5,
"valid_targets_min": 1523
},
{
"epoch": 6.833631484794275,
"grad_norm": 0.532987766803314,
"learning_rate": 7.030218226250051e-08,
"loss": 0.251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24493467807769775,
"step": 3820,
"valid_targets_mean": 4069.8,
"valid_targets_min": 795
},
{
"epoch": 6.84257602862254,
"grad_norm": 0.6131271407710378,
"learning_rate": 6.302596124636573e-08,
"loss": 0.2555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2517031729221344,
"step": 3825,
"valid_targets_mean": 4256.1,
"valid_targets_min": 741
},
{
"epoch": 6.851520572450805,
"grad_norm": 0.5260881026648205,
"learning_rate": 5.6146535263106314e-08,
"loss": 0.249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22869578003883362,
"step": 3830,
"valid_targets_mean": 4011.5,
"valid_targets_min": 1329
},
{
"epoch": 6.8604651162790695,
"grad_norm": 0.6127050009448671,
"learning_rate": 4.966404123029289e-08,
"loss": 0.2448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2303614318370819,
"step": 3835,
"valid_targets_mean": 4033.9,
"valid_targets_min": 1573
},
{
"epoch": 6.869409660107334,
"grad_norm": 0.5818917098959172,
"learning_rate": 4.357860816557091e-08,
"loss": 0.2611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2567775249481201,
"step": 3840,
"valid_targets_mean": 3792.1,
"valid_targets_min": 529
},
{
"epoch": 6.878354203935599,
"grad_norm": 0.5360181923150845,
"learning_rate": 3.789035718408718e-08,
"loss": 0.2458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24667097628116608,
"step": 3845,
"valid_targets_mean": 3941.6,
"valid_targets_min": 1016
},
{
"epoch": 6.8872987477638645,
"grad_norm": 0.596035881473606,
"learning_rate": 3.259940149609175e-08,
"loss": 0.2522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.278276652097702,
"step": 3850,
"valid_targets_mean": 3848.6,
"valid_targets_min": 884
},
{
"epoch": 6.896243291592128,
"grad_norm": 0.5426279598087133,
"learning_rate": 2.7705846404670888e-08,
"loss": 0.2362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25362810492515564,
"step": 3855,
"valid_targets_mean": 3896.8,
"valid_targets_min": 1947
},
{
"epoch": 6.905187835420394,
"grad_norm": 0.5217040663626972,
"learning_rate": 2.3209789303657582e-08,
"loss": 0.2428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24874532222747803,
"step": 3860,
"valid_targets_mean": 4455.1,
"valid_targets_min": 1374
},
{
"epoch": 6.914132379248659,
"grad_norm": 0.6253844624269363,
"learning_rate": 1.9111319675699792e-08,
"loss": 0.2447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24061639606952667,
"step": 3865,
"valid_targets_mean": 4007.6,
"valid_targets_min": 1409
},
{
"epoch": 6.923076923076923,
"grad_norm": 0.600953932839311,
"learning_rate": 1.5410519090461872e-08,
"loss": 0.2478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25711876153945923,
"step": 3870,
"valid_targets_mean": 3362.2,
"valid_targets_min": 995
},
{
"epoch": 6.932021466905188,
"grad_norm": 0.5660567298832868,
"learning_rate": 1.210746120302142e-08,
"loss": 0.2463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2501237392425537,
"step": 3875,
"valid_targets_mean": 3972.0,
"valid_targets_min": 2149
},
{
"epoch": 6.940966010733453,
"grad_norm": 0.6014456216364971,
"learning_rate": 9.202211752386003e-09,
"loss": 0.2541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25210267305374146,
"step": 3880,
"valid_targets_mean": 4391.4,
"valid_targets_min": 1615
},
{
"epoch": 6.9499105545617175,
"grad_norm": 0.5988847243290031,
"learning_rate": 6.694828560200872e-09,
"loss": 0.2572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2896597385406494,
"step": 3885,
"valid_targets_mean": 4030.7,
"valid_targets_min": 1853
},
{
"epoch": 6.958855098389982,
"grad_norm": 0.5395682499202165,
"learning_rate": 4.585361529581001e-09,
"loss": 0.2411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2411486953496933,
"step": 3890,
"valid_targets_mean": 4078.4,
"valid_targets_min": 822
},
{
"epoch": 6.967799642218247,
"grad_norm": 0.6335748048992399,
"learning_rate": 2.87385264413631e-09,
"loss": 0.2559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2603016793727875,
"step": 3895,
"valid_targets_mean": 2954.7,
"valid_targets_min": 911
},
{
"epoch": 6.976744186046512,
"grad_norm": 0.5727655803906435,
"learning_rate": 1.560335967114579e-09,
"loss": 0.2541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25090134143829346,
"step": 3900,
"valid_targets_mean": 4419.8,
"valid_targets_min": 1517
},
{
"epoch": 6.985688729874776,
"grad_norm": 0.5157971974589199,
"learning_rate": 6.4483764074863e-10,
"loss": 0.2364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2580246329307556,
"step": 3905,
"valid_targets_mean": 4267.4,
"valid_targets_min": 1483
},
{
"epoch": 6.994633273703041,
"grad_norm": 0.5412701822718862,
"learning_rate": 1.273758857145424e-10,
"loss": 0.2505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2360781729221344,
"step": 3910,
"valid_targets_mean": 3865.5,
"valid_targets_min": 653
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23571906983852386,
"step": 3913,
"total_flos": 1325319151616000.0,
"train_loss": 0.29724271997234386,
"train_runtime": 27386.6627,
"train_samples_per_second": 2.285,
"train_steps_per_second": 0.143,
"valid_targets_mean": 3601.1,
"valid_targets_min": 1303
}
],
"logging_steps": 5,
"max_steps": 3913,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 1500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1325319151616000.0,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}