diff --git "a/trainer_state.json" "b/trainer_state.json" new file mode 100644--- /dev/null +++ "b/trainer_state.json" @@ -0,0 +1,14699 @@ +{ + "best_global_step": null, + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 7.0, + "eval_steps": 500, + "global_step": 6664, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.005252100840336135, + "grad_norm": 11.793528240093083, + "learning_rate": 2.39880059970015e-07, + "loss": 0.7356, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.750144362449646, + "step": 5, + "valid_targets_mean": 3398.8, + "valid_targets_min": 746 + }, + { + "epoch": 0.01050420168067227, + "grad_norm": 9.544117410382237, + "learning_rate": 5.397301349325338e-07, + "loss": 0.6877, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5979838371276855, + "step": 10, + "valid_targets_mean": 4347.4, + "valid_targets_min": 1651 + }, + { + "epoch": 0.015756302521008403, + "grad_norm": 8.563267976325044, + "learning_rate": 8.395802098950526e-07, + "loss": 0.6892, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.607923150062561, + "step": 15, + "valid_targets_mean": 4633.2, + "valid_targets_min": 1560 + }, + { + "epoch": 0.02100840336134454, + "grad_norm": 8.188017827775615, + "learning_rate": 1.1394302848575713e-06, + "loss": 0.6695, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6504963040351868, + "step": 20, + "valid_targets_mean": 3938.1, + "valid_targets_min": 1841 + }, + { + "epoch": 0.026260504201680673, + "grad_norm": 6.523486790143655, + "learning_rate": 1.43928035982009e-06, + "loss": 0.6875, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7029379606246948, + "step": 25, + "valid_targets_mean": 3724.8, + "valid_targets_min": 1374 + }, + { + "epoch": 0.031512605042016806, + "grad_norm": 5.51646121673247, + "learning_rate": 1.7391304347826088e-06, + "loss": 0.6512, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6437787413597107, + "step": 30, + "valid_targets_mean": 3264.8, + "valid_targets_min": 1089 + }, + { + "epoch": 0.03676470588235294, + "grad_norm": 4.319516286938232, + "learning_rate": 2.0389805097451275e-06, + "loss": 0.5769, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6190094947814941, + "step": 35, + "valid_targets_mean": 3374.9, + "valid_targets_min": 627 + }, + { + "epoch": 0.04201680672268908, + "grad_norm": 3.7446317656639048, + "learning_rate": 2.3388305847076464e-06, + "loss": 0.5953, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6246620416641235, + "step": 40, + "valid_targets_mean": 3514.9, + "valid_targets_min": 1574 + }, + { + "epoch": 0.04726890756302521, + "grad_norm": 2.652464883959148, + "learning_rate": 2.6386806596701653e-06, + "loss": 0.5982, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6014484167098999, + "step": 45, + "valid_targets_mean": 3956.7, + "valid_targets_min": 1899 + }, + { + "epoch": 0.052521008403361345, + "grad_norm": 1.9872458383108076, + "learning_rate": 2.9385307346326843e-06, + "loss": 0.5479, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5268915891647339, + "step": 50, + "valid_targets_mean": 4397.6, + "valid_targets_min": 2261 + }, + { + "epoch": 0.05777310924369748, + "grad_norm": 1.6856790315793377, + "learning_rate": 3.2383808095952024e-06, + "loss": 0.5517, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.535837709903717, + "step": 55, + "valid_targets_mean": 3263.8, + "valid_targets_min": 1873 + }, + { + "epoch": 0.06302521008403361, + "grad_norm": 1.2418730665732476, + "learning_rate": 3.5382308845577213e-06, + "loss": 0.5094, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5285685658454895, + "step": 60, + "valid_targets_mean": 3430.2, + "valid_targets_min": 1013 + }, + { + "epoch": 0.06827731092436974, + "grad_norm": 0.8868118364710539, + "learning_rate": 3.83808095952024e-06, + "loss": 0.4861, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.4722723364830017, + "step": 65, + "valid_targets_mean": 4041.6, + "valid_targets_min": 1366 + }, + { + "epoch": 0.07352941176470588, + "grad_norm": 0.9428896232462224, + "learning_rate": 4.137931034482759e-06, + "loss": 0.5037, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.53287672996521, + "step": 70, + "valid_targets_mean": 3515.2, + "valid_targets_min": 2050 + }, + { + "epoch": 0.07878151260504201, + "grad_norm": 0.9383925766489141, + "learning_rate": 4.437781109445278e-06, + "loss": 0.5135, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.524086058139801, + "step": 75, + "valid_targets_mean": 3048.9, + "valid_targets_min": 746 + }, + { + "epoch": 0.08403361344537816, + "grad_norm": 0.9340541727723428, + "learning_rate": 4.737631184407796e-06, + "loss": 0.489, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5150220990180969, + "step": 80, + "valid_targets_mean": 2982.6, + "valid_targets_min": 855 + }, + { + "epoch": 0.08928571428571429, + "grad_norm": 0.7737514488505065, + "learning_rate": 5.037481259370315e-06, + "loss": 0.4923, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.498151570558548, + "step": 85, + "valid_targets_mean": 3753.4, + "valid_targets_min": 2125 + }, + { + "epoch": 0.09453781512605042, + "grad_norm": 0.8574731436330563, + "learning_rate": 5.337331334332834e-06, + "loss": 0.5013, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.4901542663574219, + "step": 90, + "valid_targets_mean": 2946.8, + "valid_targets_min": 1173 + }, + { + "epoch": 0.09978991596638656, + "grad_norm": 0.8207916191722505, + "learning_rate": 5.6371814092953526e-06, + "loss": 0.4644, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.45455610752105713, + "step": 95, + "valid_targets_mean": 3284.2, + "valid_targets_min": 1438 + }, + { + "epoch": 0.10504201680672269, + "grad_norm": 0.6890899996201467, + "learning_rate": 5.937031484257871e-06, + "loss": 0.4503, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3856987953186035, + "step": 100, + "valid_targets_mean": 3818.4, + "valid_targets_min": 1133 + }, + { + "epoch": 0.11029411764705882, + "grad_norm": 0.7375624963619357, + "learning_rate": 6.2368815592203904e-06, + "loss": 0.4597, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.42143797874450684, + "step": 105, + "valid_targets_mean": 3339.8, + "valid_targets_min": 1051 + }, + { + "epoch": 0.11554621848739496, + "grad_norm": 0.7422023625324775, + "learning_rate": 6.536731634182909e-06, + "loss": 0.449, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.47655802965164185, + "step": 110, + "valid_targets_mean": 3285.1, + "valid_targets_min": 1642 + }, + { + "epoch": 0.1207983193277311, + "grad_norm": 0.6767508461063624, + "learning_rate": 6.8365817091454274e-06, + "loss": 0.4463, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.42775917053222656, + "step": 115, + "valid_targets_mean": 3340.8, + "valid_targets_min": 1747 + }, + { + "epoch": 0.12605042016806722, + "grad_norm": 0.7262880447276591, + "learning_rate": 7.136431784107947e-06, + "loss": 0.4491, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.4421280324459076, + "step": 120, + "valid_targets_mean": 3218.2, + "valid_targets_min": 1765 + }, + { + "epoch": 0.13130252100840337, + "grad_norm": 0.7791375198049785, + "learning_rate": 7.436281859070465e-06, + "loss": 0.4446, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.4363992214202881, + "step": 125, + "valid_targets_mean": 3182.9, + "valid_targets_min": 1233 + }, + { + "epoch": 0.13655462184873948, + "grad_norm": 0.7376851052403786, + "learning_rate": 7.736131934032984e-06, + "loss": 0.4195, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.4291246831417084, + "step": 130, + "valid_targets_mean": 3020.8, + "valid_targets_min": 869 + }, + { + "epoch": 0.14180672268907563, + "grad_norm": 0.7251699149877672, + "learning_rate": 8.035982008995503e-06, + "loss": 0.4383, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.4199424982070923, + "step": 135, + "valid_targets_mean": 3269.2, + "valid_targets_min": 926 + }, + { + "epoch": 0.14705882352941177, + "grad_norm": 0.7174356234657762, + "learning_rate": 8.335832083958023e-06, + "loss": 0.4209, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3915764093399048, + "step": 140, + "valid_targets_mean": 3256.4, + "valid_targets_min": 1016 + }, + { + "epoch": 0.15231092436974789, + "grad_norm": 0.7429933172485804, + "learning_rate": 8.63568215892054e-06, + "loss": 0.4246, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.4099087417125702, + "step": 145, + "valid_targets_mean": 3058.4, + "valid_targets_min": 1367 + }, + { + "epoch": 0.15756302521008403, + "grad_norm": 0.6609884978656597, + "learning_rate": 8.93553223388306e-06, + "loss": 0.4275, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.38431763648986816, + "step": 150, + "valid_targets_mean": 3513.8, + "valid_targets_min": 761 + }, + { + "epoch": 0.16281512605042017, + "grad_norm": 0.7414117819519422, + "learning_rate": 9.235382308845579e-06, + "loss": 0.4149, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.41205519437789917, + "step": 155, + "valid_targets_mean": 2834.2, + "valid_targets_min": 1480 + }, + { + "epoch": 0.16806722689075632, + "grad_norm": 0.766190877937914, + "learning_rate": 9.535232383808097e-06, + "loss": 0.4221, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.40908199548721313, + "step": 160, + "valid_targets_mean": 2854.1, + "valid_targets_min": 1229 + }, + { + "epoch": 0.17331932773109243, + "grad_norm": 0.7322988121738653, + "learning_rate": 9.835082458770614e-06, + "loss": 0.4219, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.409344881772995, + "step": 165, + "valid_targets_mean": 3215.8, + "valid_targets_min": 1727 + }, + { + "epoch": 0.17857142857142858, + "grad_norm": 0.7036664531547118, + "learning_rate": 1.0134932533733135e-05, + "loss": 0.4117, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3934198021888733, + "step": 170, + "valid_targets_mean": 3578.9, + "valid_targets_min": 1860 + }, + { + "epoch": 0.18382352941176472, + "grad_norm": 0.7504645575443613, + "learning_rate": 1.0434782608695653e-05, + "loss": 0.4176, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.41233259439468384, + "step": 175, + "valid_targets_mean": 3121.1, + "valid_targets_min": 1145 + }, + { + "epoch": 0.18907563025210083, + "grad_norm": 0.8540338092213114, + "learning_rate": 1.0734632683658172e-05, + "loss": 0.4206, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.4257834851741791, + "step": 180, + "valid_targets_mean": 2910.1, + "valid_targets_min": 1195 + }, + { + "epoch": 0.19432773109243698, + "grad_norm": 0.672825231347177, + "learning_rate": 1.103448275862069e-05, + "loss": 0.4046, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.37902510166168213, + "step": 185, + "valid_targets_mean": 3215.2, + "valid_targets_min": 1087 + }, + { + "epoch": 0.19957983193277312, + "grad_norm": 0.7299680458741075, + "learning_rate": 1.1334332833583211e-05, + "loss": 0.4173, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3878703713417053, + "step": 190, + "valid_targets_mean": 3842.3, + "valid_targets_min": 730 + }, + { + "epoch": 0.20483193277310924, + "grad_norm": 0.7452069066845327, + "learning_rate": 1.1634182908545729e-05, + "loss": 0.4012, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.40164220333099365, + "step": 195, + "valid_targets_mean": 3112.6, + "valid_targets_min": 1097 + }, + { + "epoch": 0.21008403361344538, + "grad_norm": 0.6701617672469308, + "learning_rate": 1.1934032983508246e-05, + "loss": 0.3889, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.4067269563674927, + "step": 200, + "valid_targets_mean": 3587.6, + "valid_targets_min": 1833 + }, + { + "epoch": 0.21533613445378152, + "grad_norm": 0.6999892185242177, + "learning_rate": 1.2233883058470766e-05, + "loss": 0.4046, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.42524561285972595, + "step": 205, + "valid_targets_mean": 3660.6, + "valid_targets_min": 1182 + }, + { + "epoch": 0.22058823529411764, + "grad_norm": 0.6936596594842792, + "learning_rate": 1.2533733133433283e-05, + "loss": 0.3979, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.4341742992401123, + "step": 210, + "valid_targets_mean": 3839.4, + "valid_targets_min": 1586 + }, + { + "epoch": 0.22584033613445378, + "grad_norm": 0.7203275927233951, + "learning_rate": 1.2833583208395803e-05, + "loss": 0.4122, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.4256739020347595, + "step": 215, + "valid_targets_mean": 3062.7, + "valid_targets_min": 1714 + }, + { + "epoch": 0.23109243697478993, + "grad_norm": 0.8564716523005904, + "learning_rate": 1.313343328335832e-05, + "loss": 0.4007, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.4049715995788574, + "step": 220, + "valid_targets_mean": 3611.1, + "valid_targets_min": 1504 + }, + { + "epoch": 0.23634453781512604, + "grad_norm": 0.6563920907148093, + "learning_rate": 1.3433283358320841e-05, + "loss": 0.3885, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3269047141075134, + "step": 225, + "valid_targets_mean": 3457.1, + "valid_targets_min": 1170 + }, + { + "epoch": 0.2415966386554622, + "grad_norm": 0.7196899057898143, + "learning_rate": 1.3733133433283359e-05, + "loss": 0.3893, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.38853204250335693, + "step": 230, + "valid_targets_mean": 3089.3, + "valid_targets_min": 1436 + }, + { + "epoch": 0.24684873949579833, + "grad_norm": 0.7287732338618192, + "learning_rate": 1.4032983508245878e-05, + "loss": 0.3919, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.38699156045913696, + "step": 235, + "valid_targets_mean": 3257.2, + "valid_targets_min": 1302 + }, + { + "epoch": 0.25210084033613445, + "grad_norm": 0.7214311214899903, + "learning_rate": 1.4332833583208396e-05, + "loss": 0.3841, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.41121745109558105, + "step": 240, + "valid_targets_mean": 3425.1, + "valid_targets_min": 2023 + }, + { + "epoch": 0.25735294117647056, + "grad_norm": 0.648625366284687, + "learning_rate": 1.4632683658170917e-05, + "loss": 0.361, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3404223918914795, + "step": 245, + "valid_targets_mean": 3196.4, + "valid_targets_min": 809 + }, + { + "epoch": 0.26260504201680673, + "grad_norm": 0.7442737796844059, + "learning_rate": 1.4932533733133435e-05, + "loss": 0.3958, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.37922531366348267, + "step": 250, + "valid_targets_mean": 3197.8, + "valid_targets_min": 1059 + }, + { + "epoch": 0.26785714285714285, + "grad_norm": 0.7290285381798371, + "learning_rate": 1.5232383808095954e-05, + "loss": 0.3759, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.33683687448501587, + "step": 255, + "valid_targets_mean": 3301.7, + "valid_targets_min": 964 + }, + { + "epoch": 0.27310924369747897, + "grad_norm": 0.7658760733120059, + "learning_rate": 1.5532233883058472e-05, + "loss": 0.3864, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3716367483139038, + "step": 260, + "valid_targets_mean": 3694.2, + "valid_targets_min": 1105 + }, + { + "epoch": 0.27836134453781514, + "grad_norm": 0.8430133851017164, + "learning_rate": 1.5832083958020993e-05, + "loss": 0.3997, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.4212614893913269, + "step": 265, + "valid_targets_mean": 2612.6, + "valid_targets_min": 1491 + }, + { + "epoch": 0.28361344537815125, + "grad_norm": 0.7343320220234513, + "learning_rate": 1.613193403298351e-05, + "loss": 0.4027, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3935287594795227, + "step": 270, + "valid_targets_mean": 3110.5, + "valid_targets_min": 1091 + }, + { + "epoch": 0.28886554621848737, + "grad_norm": 0.7657356714112876, + "learning_rate": 1.6431784107946028e-05, + "loss": 0.3703, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.36865124106407166, + "step": 275, + "valid_targets_mean": 3259.2, + "valid_targets_min": 1822 + }, + { + "epoch": 0.29411764705882354, + "grad_norm": 0.6955693394366955, + "learning_rate": 1.6731634182908546e-05, + "loss": 0.3727, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.36471718549728394, + "step": 280, + "valid_targets_mean": 3547.6, + "valid_targets_min": 1625 + }, + { + "epoch": 0.29936974789915966, + "grad_norm": 0.7042195932323547, + "learning_rate": 1.7031484257871064e-05, + "loss": 0.3672, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3420675992965698, + "step": 285, + "valid_targets_mean": 3628.2, + "valid_targets_min": 1415 + }, + { + "epoch": 0.30462184873949577, + "grad_norm": 0.8809660140825649, + "learning_rate": 1.7331334332833585e-05, + "loss": 0.3791, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.35459285974502563, + "step": 290, + "valid_targets_mean": 3398.9, + "valid_targets_min": 1460 + }, + { + "epoch": 0.30987394957983194, + "grad_norm": 0.7752770337054249, + "learning_rate": 1.7631184407796102e-05, + "loss": 0.3838, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3816995620727539, + "step": 295, + "valid_targets_mean": 2947.4, + "valid_targets_min": 1079 + }, + { + "epoch": 0.31512605042016806, + "grad_norm": 0.7665849286642425, + "learning_rate": 1.7931034482758623e-05, + "loss": 0.3576, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.36882513761520386, + "step": 300, + "valid_targets_mean": 3003.0, + "valid_targets_min": 1274 + }, + { + "epoch": 0.32037815126050423, + "grad_norm": 0.7763875661157622, + "learning_rate": 1.823088455772114e-05, + "loss": 0.3735, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3900800943374634, + "step": 305, + "valid_targets_mean": 3306.3, + "valid_targets_min": 914 + }, + { + "epoch": 0.32563025210084034, + "grad_norm": 0.7724334584719763, + "learning_rate": 1.853073463268366e-05, + "loss": 0.3894, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.36286020278930664, + "step": 310, + "valid_targets_mean": 3332.2, + "valid_targets_min": 1312 + }, + { + "epoch": 0.33088235294117646, + "grad_norm": 0.8144297942259716, + "learning_rate": 1.8830584707646176e-05, + "loss": 0.377, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.395212858915329, + "step": 315, + "valid_targets_mean": 2601.3, + "valid_targets_min": 987 + }, + { + "epoch": 0.33613445378151263, + "grad_norm": 0.6210630540146885, + "learning_rate": 1.9130434782608697e-05, + "loss": 0.3653, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.34900736808776855, + "step": 320, + "valid_targets_mean": 4341.5, + "valid_targets_min": 1856 + }, + { + "epoch": 0.34138655462184875, + "grad_norm": 0.7382149230509586, + "learning_rate": 1.9430284857571215e-05, + "loss": 0.3724, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.37840932607650757, + "step": 325, + "valid_targets_mean": 3290.9, + "valid_targets_min": 1601 + }, + { + "epoch": 0.34663865546218486, + "grad_norm": 0.7441687764233078, + "learning_rate": 1.9730134932533736e-05, + "loss": 0.3807, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3847064971923828, + "step": 330, + "valid_targets_mean": 3119.4, + "valid_targets_min": 1986 + }, + { + "epoch": 0.35189075630252103, + "grad_norm": 0.6427174614521525, + "learning_rate": 2.0029985007496254e-05, + "loss": 0.3556, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.38938313722610474, + "step": 335, + "valid_targets_mean": 3777.1, + "valid_targets_min": 974 + }, + { + "epoch": 0.35714285714285715, + "grad_norm": 0.6767174257258602, + "learning_rate": 2.0329835082458775e-05, + "loss": 0.3632, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.33448052406311035, + "step": 340, + "valid_targets_mean": 2878.0, + "valid_targets_min": 512 + }, + { + "epoch": 0.36239495798319327, + "grad_norm": 0.7046783787151958, + "learning_rate": 2.0629685157421292e-05, + "loss": 0.3697, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.35749202966690063, + "step": 345, + "valid_targets_mean": 3215.4, + "valid_targets_min": 1202 + }, + { + "epoch": 0.36764705882352944, + "grad_norm": 0.7219690552414987, + "learning_rate": 2.092953523238381e-05, + "loss": 0.3881, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.37818586826324463, + "step": 350, + "valid_targets_mean": 3693.1, + "valid_targets_min": 1455 + }, + { + "epoch": 0.37289915966386555, + "grad_norm": 0.6860266938886983, + "learning_rate": 2.1229385307346328e-05, + "loss": 0.3675, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.34528088569641113, + "step": 355, + "valid_targets_mean": 3477.5, + "valid_targets_min": 1571 + }, + { + "epoch": 0.37815126050420167, + "grad_norm": 0.7609425900554888, + "learning_rate": 2.152923538230885e-05, + "loss": 0.3949, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.429862916469574, + "step": 360, + "valid_targets_mean": 2912.1, + "valid_targets_min": 1450 + }, + { + "epoch": 0.38340336134453784, + "grad_norm": 0.6848089283903739, + "learning_rate": 2.1829085457271363e-05, + "loss": 0.3669, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3468002676963806, + "step": 365, + "valid_targets_mean": 3323.0, + "valid_targets_min": 1431 + }, + { + "epoch": 0.38865546218487396, + "grad_norm": 0.7419166645990429, + "learning_rate": 2.2128935532233884e-05, + "loss": 0.3744, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3837374746799469, + "step": 370, + "valid_targets_mean": 3461.4, + "valid_targets_min": 1147 + }, + { + "epoch": 0.3939075630252101, + "grad_norm": 0.8576299436135565, + "learning_rate": 2.2428785607196405e-05, + "loss": 0.393, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.39932119846343994, + "step": 375, + "valid_targets_mean": 2641.6, + "valid_targets_min": 998 + }, + { + "epoch": 0.39915966386554624, + "grad_norm": 0.7247001275212052, + "learning_rate": 2.2728635682158923e-05, + "loss": 0.3684, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3718080520629883, + "step": 380, + "valid_targets_mean": 3260.9, + "valid_targets_min": 614 + }, + { + "epoch": 0.40441176470588236, + "grad_norm": 0.7885722026955804, + "learning_rate": 2.302848575712144e-05, + "loss": 0.3797, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.39757227897644043, + "step": 385, + "valid_targets_mean": 2796.2, + "valid_targets_min": 1005 + }, + { + "epoch": 0.4096638655462185, + "grad_norm": 0.7828630662690874, + "learning_rate": 2.3328335832083958e-05, + "loss": 0.3793, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3814929127693176, + "step": 390, + "valid_targets_mean": 3183.6, + "valid_targets_min": 2298 + }, + { + "epoch": 0.41491596638655465, + "grad_norm": 0.8409621672836618, + "learning_rate": 2.362818590704648e-05, + "loss": 0.3763, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3965279459953308, + "step": 395, + "valid_targets_mean": 2821.2, + "valid_targets_min": 617 + }, + { + "epoch": 0.42016806722689076, + "grad_norm": 0.6764711962883958, + "learning_rate": 2.3928035982009e-05, + "loss": 0.355, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3417738080024719, + "step": 400, + "valid_targets_mean": 3265.2, + "valid_targets_min": 1665 + }, + { + "epoch": 0.4254201680672269, + "grad_norm": 0.7365452834319242, + "learning_rate": 2.4227886056971515e-05, + "loss": 0.3735, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3877049684524536, + "step": 405, + "valid_targets_mean": 3019.3, + "valid_targets_min": 1076 + }, + { + "epoch": 0.43067226890756305, + "grad_norm": 0.6737132753666218, + "learning_rate": 2.4527736131934036e-05, + "loss": 0.3566, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.36130669713020325, + "step": 410, + "valid_targets_mean": 3610.8, + "valid_targets_min": 790 + }, + { + "epoch": 0.43592436974789917, + "grad_norm": 0.9130730152687944, + "learning_rate": 2.4827586206896553e-05, + "loss": 0.3783, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3609384000301361, + "step": 415, + "valid_targets_mean": 3255.8, + "valid_targets_min": 1728 + }, + { + "epoch": 0.4411764705882353, + "grad_norm": 0.8464202746590961, + "learning_rate": 2.5127436281859074e-05, + "loss": 0.3788, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.33865395188331604, + "step": 420, + "valid_targets_mean": 3377.2, + "valid_targets_min": 981 + }, + { + "epoch": 0.44642857142857145, + "grad_norm": 0.7384506566000549, + "learning_rate": 2.542728635682159e-05, + "loss": 0.3462, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3339518904685974, + "step": 425, + "valid_targets_mean": 2839.1, + "valid_targets_min": 1351 + }, + { + "epoch": 0.45168067226890757, + "grad_norm": 0.6110714780946447, + "learning_rate": 2.572713643178411e-05, + "loss": 0.3677, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3625059425830841, + "step": 430, + "valid_targets_mean": 4396.7, + "valid_targets_min": 2416 + }, + { + "epoch": 0.4569327731092437, + "grad_norm": 0.5790619763281034, + "learning_rate": 2.602698650674663e-05, + "loss": 0.3524, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.32317501306533813, + "step": 435, + "valid_targets_mean": 4668.6, + "valid_targets_min": 1233 + }, + { + "epoch": 0.46218487394957986, + "grad_norm": 0.642678687454446, + "learning_rate": 2.632683658170915e-05, + "loss": 0.3433, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3185131549835205, + "step": 440, + "valid_targets_mean": 3936.4, + "valid_targets_min": 1524 + }, + { + "epoch": 0.46743697478991597, + "grad_norm": 0.5867900140587048, + "learning_rate": 2.6626686656671666e-05, + "loss": 0.3446, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3317568600177765, + "step": 445, + "valid_targets_mean": 4389.3, + "valid_targets_min": 856 + }, + { + "epoch": 0.4726890756302521, + "grad_norm": 0.6996864572340856, + "learning_rate": 2.6926536731634184e-05, + "loss": 0.3573, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.35135549306869507, + "step": 450, + "valid_targets_mean": 3241.3, + "valid_targets_min": 906 + }, + { + "epoch": 0.47794117647058826, + "grad_norm": 0.6713569052572641, + "learning_rate": 2.7226386806596705e-05, + "loss": 0.3452, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3594322204589844, + "step": 455, + "valid_targets_mean": 3680.4, + "valid_targets_min": 832 + }, + { + "epoch": 0.4831932773109244, + "grad_norm": 0.6528374934626601, + "learning_rate": 2.752623688155922e-05, + "loss": 0.3433, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.33547288179397583, + "step": 460, + "valid_targets_mean": 3168.9, + "valid_targets_min": 1484 + }, + { + "epoch": 0.4884453781512605, + "grad_norm": 0.7585928062211041, + "learning_rate": 2.782608695652174e-05, + "loss": 0.3517, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.34602272510528564, + "step": 465, + "valid_targets_mean": 3667.5, + "valid_targets_min": 1440 + }, + { + "epoch": 0.49369747899159666, + "grad_norm": 0.7549275178598076, + "learning_rate": 2.812593703148426e-05, + "loss": 0.3689, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.40832167863845825, + "step": 470, + "valid_targets_mean": 3025.6, + "valid_targets_min": 1349 + }, + { + "epoch": 0.4989495798319328, + "grad_norm": 0.8305062206700754, + "learning_rate": 2.8425787106446782e-05, + "loss": 0.3684, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.36201930046081543, + "step": 475, + "valid_targets_mean": 2935.8, + "valid_targets_min": 1156 + }, + { + "epoch": 0.5042016806722689, + "grad_norm": 0.7148304561333289, + "learning_rate": 2.8725637181409296e-05, + "loss": 0.358, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3326527178287506, + "step": 480, + "valid_targets_mean": 3190.4, + "valid_targets_min": 993 + }, + { + "epoch": 0.509453781512605, + "grad_norm": 0.8146565793649729, + "learning_rate": 2.9025487256371818e-05, + "loss": 0.3431, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3617240786552429, + "step": 485, + "valid_targets_mean": 2785.6, + "valid_targets_min": 1275 + }, + { + "epoch": 0.5147058823529411, + "grad_norm": 0.7209287114298926, + "learning_rate": 2.9325337331334335e-05, + "loss": 0.352, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.36016473174095154, + "step": 490, + "valid_targets_mean": 3266.8, + "valid_targets_min": 1669 + }, + { + "epoch": 0.5199579831932774, + "grad_norm": 0.7172263463358715, + "learning_rate": 2.9625187406296856e-05, + "loss": 0.3609, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.36014240980148315, + "step": 495, + "valid_targets_mean": 3357.5, + "valid_targets_min": 1710 + }, + { + "epoch": 0.5252100840336135, + "grad_norm": 0.6972857671515527, + "learning_rate": 2.992503748125937e-05, + "loss": 0.3617, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.34464967250823975, + "step": 500, + "valid_targets_mean": 3468.1, + "valid_targets_min": 1685 + }, + { + "epoch": 0.5304621848739496, + "grad_norm": 0.7173833022077326, + "learning_rate": 3.022488755622189e-05, + "loss": 0.3608, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.35650789737701416, + "step": 505, + "valid_targets_mean": 3659.6, + "valid_targets_min": 1931 + }, + { + "epoch": 0.5357142857142857, + "grad_norm": 0.7592796407843059, + "learning_rate": 3.052473763118441e-05, + "loss": 0.3512, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3427087068557739, + "step": 510, + "valid_targets_mean": 3862.3, + "valid_targets_min": 2009 + }, + { + "epoch": 0.5409663865546218, + "grad_norm": 1.1258165798910273, + "learning_rate": 3.0824587706146934e-05, + "loss": 0.361, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.367844820022583, + "step": 515, + "valid_targets_mean": 1792.6, + "valid_targets_min": 777 + }, + { + "epoch": 0.5462184873949579, + "grad_norm": 1.1349526835427646, + "learning_rate": 3.112443778110945e-05, + "loss": 0.3252, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3122398853302002, + "step": 520, + "valid_targets_mean": 1354.7, + "valid_targets_min": 705 + }, + { + "epoch": 0.5514705882352942, + "grad_norm": 1.8110765728106655, + "learning_rate": 3.142428785607197e-05, + "loss": 0.3052, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3012329041957855, + "step": 525, + "valid_targets_mean": 1556.9, + "valid_targets_min": 914 + }, + { + "epoch": 0.5567226890756303, + "grad_norm": 1.1404918052705433, + "learning_rate": 3.172413793103448e-05, + "loss": 0.2933, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2664037346839905, + "step": 530, + "valid_targets_mean": 1397.1, + "valid_targets_min": 680 + }, + { + "epoch": 0.5619747899159664, + "grad_norm": 0.9458053300681202, + "learning_rate": 3.2023988005997004e-05, + "loss": 0.2891, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.289004921913147, + "step": 535, + "valid_targets_mean": 1698.1, + "valid_targets_min": 819 + }, + { + "epoch": 0.5672268907563025, + "grad_norm": 1.0086441843661589, + "learning_rate": 3.2323838080959525e-05, + "loss": 0.2798, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.26696014404296875, + "step": 540, + "valid_targets_mean": 1393.1, + "valid_targets_min": 734 + }, + { + "epoch": 0.5724789915966386, + "grad_norm": 1.0260360672408402, + "learning_rate": 3.262368815592204e-05, + "loss": 0.29, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2623750567436218, + "step": 545, + "valid_targets_mean": 1443.1, + "valid_targets_min": 655 + }, + { + "epoch": 0.5777310924369747, + "grad_norm": 0.9985074269719646, + "learning_rate": 3.292353823088456e-05, + "loss": 0.2606, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.26140543818473816, + "step": 550, + "valid_targets_mean": 1392.2, + "valid_targets_min": 737 + }, + { + "epoch": 0.582983193277311, + "grad_norm": 0.9985105336106163, + "learning_rate": 3.3223388305847075e-05, + "loss": 0.2812, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25588417053222656, + "step": 555, + "valid_targets_mean": 1386.6, + "valid_targets_min": 759 + }, + { + "epoch": 0.5882352941176471, + "grad_norm": 1.1959754188425515, + "learning_rate": 3.3523238380809596e-05, + "loss": 0.2603, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27921628952026367, + "step": 560, + "valid_targets_mean": 1442.9, + "valid_targets_min": 750 + }, + { + "epoch": 0.5934873949579832, + "grad_norm": 1.001393308800324, + "learning_rate": 3.382308845577212e-05, + "loss": 0.2606, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2664732336997986, + "step": 565, + "valid_targets_mean": 1536.1, + "valid_targets_min": 780 + }, + { + "epoch": 0.5987394957983193, + "grad_norm": 0.9505908357818789, + "learning_rate": 3.412293853073464e-05, + "loss": 0.2688, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2818218767642975, + "step": 570, + "valid_targets_mean": 1463.1, + "valid_targets_min": 679 + }, + { + "epoch": 0.6039915966386554, + "grad_norm": 1.0707192051376093, + "learning_rate": 3.442278860569715e-05, + "loss": 0.2615, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2692759931087494, + "step": 575, + "valid_targets_mean": 1292.8, + "valid_targets_min": 771 + }, + { + "epoch": 0.6092436974789915, + "grad_norm": 1.1070031492080266, + "learning_rate": 3.4722638680659673e-05, + "loss": 0.2482, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2560975253582001, + "step": 580, + "valid_targets_mean": 1542.4, + "valid_targets_min": 878 + }, + { + "epoch": 0.6144957983193278, + "grad_norm": 0.898740421578359, + "learning_rate": 3.5022488755622194e-05, + "loss": 0.2447, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23506242036819458, + "step": 585, + "valid_targets_mean": 1506.8, + "valid_targets_min": 942 + }, + { + "epoch": 0.6197478991596639, + "grad_norm": 0.9882747404397235, + "learning_rate": 3.5322338830584716e-05, + "loss": 0.2549, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2667955756187439, + "step": 590, + "valid_targets_mean": 1401.9, + "valid_targets_min": 675 + }, + { + "epoch": 0.625, + "grad_norm": 0.9973429121391257, + "learning_rate": 3.562218890554723e-05, + "loss": 0.2558, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2597658038139343, + "step": 595, + "valid_targets_mean": 1483.8, + "valid_targets_min": 892 + }, + { + "epoch": 0.6302521008403361, + "grad_norm": 1.1184131263781747, + "learning_rate": 3.592203898050975e-05, + "loss": 0.2616, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2559979557991028, + "step": 600, + "valid_targets_mean": 1356.3, + "valid_targets_min": 656 + }, + { + "epoch": 0.6355042016806722, + "grad_norm": 1.1551828432063649, + "learning_rate": 3.6221889055472265e-05, + "loss": 0.259, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2352353036403656, + "step": 605, + "valid_targets_mean": 1340.6, + "valid_targets_min": 706 + }, + { + "epoch": 0.6407563025210085, + "grad_norm": 0.9979079936759186, + "learning_rate": 3.6521739130434786e-05, + "loss": 0.2565, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.257199227809906, + "step": 610, + "valid_targets_mean": 1528.6, + "valid_targets_min": 548 + }, + { + "epoch": 0.6460084033613446, + "grad_norm": 0.9872520856471761, + "learning_rate": 3.68215892053973e-05, + "loss": 0.2478, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24192388355731964, + "step": 615, + "valid_targets_mean": 1268.9, + "valid_targets_min": 658 + }, + { + "epoch": 0.6512605042016807, + "grad_norm": 1.0290619368672818, + "learning_rate": 3.712143928035982e-05, + "loss": 0.2568, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.250153124332428, + "step": 620, + "valid_targets_mean": 1360.1, + "valid_targets_min": 650 + }, + { + "epoch": 0.6565126050420168, + "grad_norm": 0.9161121685195928, + "learning_rate": 3.742128935532234e-05, + "loss": 0.2579, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25210872292518616, + "step": 625, + "valid_targets_mean": 1452.3, + "valid_targets_min": 859 + }, + { + "epoch": 0.6617647058823529, + "grad_norm": 1.231558662443427, + "learning_rate": 3.772113943028486e-05, + "loss": 0.2355, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2508789896965027, + "step": 630, + "valid_targets_mean": 1391.3, + "valid_targets_min": 728 + }, + { + "epoch": 0.667016806722689, + "grad_norm": 0.8973325739286778, + "learning_rate": 3.802098950524738e-05, + "loss": 0.2461, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22503423690795898, + "step": 635, + "valid_targets_mean": 1344.4, + "valid_targets_min": 686 + }, + { + "epoch": 0.6722689075630253, + "grad_norm": 0.9602158780480545, + "learning_rate": 3.83208395802099e-05, + "loss": 0.2427, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2667675018310547, + "step": 640, + "valid_targets_mean": 1545.2, + "valid_targets_min": 697 + }, + { + "epoch": 0.6775210084033614, + "grad_norm": 0.9207285003363753, + "learning_rate": 3.862068965517242e-05, + "loss": 0.239, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23141629993915558, + "step": 645, + "valid_targets_mean": 1354.6, + "valid_targets_min": 779 + }, + { + "epoch": 0.6827731092436975, + "grad_norm": 0.8852191091332312, + "learning_rate": 3.8920539730134934e-05, + "loss": 0.2563, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2596163749694824, + "step": 650, + "valid_targets_mean": 1434.1, + "valid_targets_min": 729 + }, + { + "epoch": 0.6880252100840336, + "grad_norm": 0.912601154449096, + "learning_rate": 3.9220389805097455e-05, + "loss": 0.2314, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22037877142429352, + "step": 655, + "valid_targets_mean": 1388.2, + "valid_targets_min": 868 + }, + { + "epoch": 0.6932773109243697, + "grad_norm": 1.015856823111782, + "learning_rate": 3.9520239880059976e-05, + "loss": 0.2452, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23023347556591034, + "step": 660, + "valid_targets_mean": 1282.3, + "valid_targets_min": 765 + }, + { + "epoch": 0.6985294117647058, + "grad_norm": 0.9855004619555965, + "learning_rate": 3.982008995502249e-05, + "loss": 0.2467, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2527748942375183, + "step": 665, + "valid_targets_mean": 1457.2, + "valid_targets_min": 793 + }, + { + "epoch": 0.7037815126050421, + "grad_norm": 0.9177092400221334, + "learning_rate": 3.9999989022799437e-05, + "loss": 0.2481, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.26127058267593384, + "step": 670, + "valid_targets_mean": 1448.5, + "valid_targets_min": 806 + }, + { + "epoch": 0.7090336134453782, + "grad_norm": 0.8689313261706375, + "learning_rate": 3.9999865529431466e-05, + "loss": 0.2298, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2190496325492859, + "step": 675, + "valid_targets_mean": 1380.7, + "valid_targets_min": 803 + }, + { + "epoch": 0.7142857142857143, + "grad_norm": 0.8662595043279143, + "learning_rate": 3.9999604822044886e-05, + "loss": 0.2387, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22773924469947815, + "step": 680, + "valid_targets_mean": 1515.7, + "valid_targets_min": 660 + }, + { + "epoch": 0.7195378151260504, + "grad_norm": 0.9275572542299572, + "learning_rate": 3.999920690242835e-05, + "loss": 0.2194, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21551215648651123, + "step": 685, + "valid_targets_mean": 1402.0, + "valid_targets_min": 837 + }, + { + "epoch": 0.7247899159663865, + "grad_norm": 0.8209341148096483, + "learning_rate": 3.999867177331189e-05, + "loss": 0.2359, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22521734237670898, + "step": 690, + "valid_targets_mean": 1574.1, + "valid_targets_min": 719 + }, + { + "epoch": 0.7300420168067226, + "grad_norm": 0.9448587281311374, + "learning_rate": 3.9997999438366895e-05, + "loss": 0.2429, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23695966601371765, + "step": 695, + "valid_targets_mean": 1430.1, + "valid_targets_min": 765 + }, + { + "epoch": 0.7352941176470589, + "grad_norm": 0.9348888815574206, + "learning_rate": 3.9997189902206065e-05, + "loss": 0.2388, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24235057830810547, + "step": 700, + "valid_targets_mean": 1372.3, + "valid_targets_min": 727 + }, + { + "epoch": 0.740546218487395, + "grad_norm": 0.898775745123375, + "learning_rate": 3.999624317038344e-05, + "loss": 0.234, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20886942744255066, + "step": 705, + "valid_targets_mean": 1192.8, + "valid_targets_min": 655 + }, + { + "epoch": 0.7457983193277311, + "grad_norm": 0.8896703345645318, + "learning_rate": 3.9995159249394303e-05, + "loss": 0.2447, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2359616905450821, + "step": 710, + "valid_targets_mean": 1508.0, + "valid_targets_min": 669 + }, + { + "epoch": 0.7510504201680672, + "grad_norm": 0.9044856336058926, + "learning_rate": 3.999393814667517e-05, + "loss": 0.2258, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22560223937034607, + "step": 715, + "valid_targets_mean": 1430.2, + "valid_targets_min": 1046 + }, + { + "epoch": 0.7563025210084033, + "grad_norm": 0.7809432057780077, + "learning_rate": 3.9992579870603695e-05, + "loss": 0.2447, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2628813087940216, + "step": 720, + "valid_targets_mean": 1651.8, + "valid_targets_min": 692 + }, + { + "epoch": 0.7615546218487395, + "grad_norm": 0.8587913679452784, + "learning_rate": 3.999108443049869e-05, + "loss": 0.2396, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24335074424743652, + "step": 725, + "valid_targets_mean": 1540.4, + "valid_targets_min": 846 + }, + { + "epoch": 0.7668067226890757, + "grad_norm": 0.9548503644681028, + "learning_rate": 3.998945183661997e-05, + "loss": 0.2532, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2418360412120819, + "step": 730, + "valid_targets_mean": 1455.1, + "valid_targets_min": 764 + }, + { + "epoch": 0.7720588235294118, + "grad_norm": 0.8057865606417343, + "learning_rate": 3.9987682100168376e-05, + "loss": 0.2286, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21932202577590942, + "step": 735, + "valid_targets_mean": 1497.4, + "valid_targets_min": 822 + }, + { + "epoch": 0.7773109243697479, + "grad_norm": 0.8569864825362092, + "learning_rate": 3.99857752332856e-05, + "loss": 0.2326, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24598419666290283, + "step": 740, + "valid_targets_mean": 1543.8, + "valid_targets_min": 982 + }, + { + "epoch": 0.782563025210084, + "grad_norm": 0.8966461968047943, + "learning_rate": 3.998373124905418e-05, + "loss": 0.2414, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24538162350654602, + "step": 745, + "valid_targets_mean": 1346.3, + "valid_targets_min": 713 + }, + { + "epoch": 0.7878151260504201, + "grad_norm": 0.9787609428455722, + "learning_rate": 3.9981550161497375e-05, + "loss": 0.2329, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22620789706707, + "step": 750, + "valid_targets_mean": 1395.7, + "valid_targets_min": 721 + }, + { + "epoch": 0.7930672268907563, + "grad_norm": 0.8647918297737699, + "learning_rate": 3.9979231985579074e-05, + "loss": 0.2291, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22276586294174194, + "step": 755, + "valid_targets_mean": 1290.6, + "valid_targets_min": 741 + }, + { + "epoch": 0.7983193277310925, + "grad_norm": 0.8550351182526175, + "learning_rate": 3.99767767372037e-05, + "loss": 0.2309, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24379882216453552, + "step": 760, + "valid_targets_mean": 1568.1, + "valid_targets_min": 734 + }, + { + "epoch": 0.8035714285714286, + "grad_norm": 0.8680279094247919, + "learning_rate": 3.997418443321609e-05, + "loss": 0.2389, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23442883789539337, + "step": 765, + "valid_targets_mean": 1703.1, + "valid_targets_min": 744 + }, + { + "epoch": 0.8088235294117647, + "grad_norm": 0.9333899796386794, + "learning_rate": 3.997145509140138e-05, + "loss": 0.2392, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25179609656333923, + "step": 770, + "valid_targets_mean": 1652.8, + "valid_targets_min": 620 + }, + { + "epoch": 0.8140756302521008, + "grad_norm": 0.7856961011675193, + "learning_rate": 3.9968588730484896e-05, + "loss": 0.221, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.224946990609169, + "step": 775, + "valid_targets_mean": 1481.8, + "valid_targets_min": 723 + }, + { + "epoch": 0.819327731092437, + "grad_norm": 0.7761881827856689, + "learning_rate": 3.9965585370132013e-05, + "loss": 0.2298, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21191829442977905, + "step": 780, + "valid_targets_mean": 1686.5, + "valid_targets_min": 740 + }, + { + "epoch": 0.8245798319327731, + "grad_norm": 0.8321605983306755, + "learning_rate": 3.996244503094804e-05, + "loss": 0.2275, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20524507761001587, + "step": 785, + "valid_targets_mean": 1345.1, + "valid_targets_min": 711 + }, + { + "epoch": 0.8298319327731093, + "grad_norm": 0.8224185017405469, + "learning_rate": 3.995916773447804e-05, + "loss": 0.2291, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22673243284225464, + "step": 790, + "valid_targets_mean": 1619.1, + "valid_targets_min": 804 + }, + { + "epoch": 0.8350840336134454, + "grad_norm": 1.5699722200850348, + "learning_rate": 3.995575350320671e-05, + "loss": 0.2223, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2145438939332962, + "step": 795, + "valid_targets_mean": 1423.2, + "valid_targets_min": 674 + }, + { + "epoch": 0.8403361344537815, + "grad_norm": 0.8647740397931104, + "learning_rate": 3.995220236055824e-05, + "loss": 0.2149, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19764792919158936, + "step": 800, + "valid_targets_mean": 1207.4, + "valid_targets_min": 567 + }, + { + "epoch": 0.8455882352941176, + "grad_norm": 0.8208866711497894, + "learning_rate": 3.99485143308961e-05, + "loss": 0.2219, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22692370414733887, + "step": 805, + "valid_targets_mean": 1542.4, + "valid_targets_min": 912 + }, + { + "epoch": 0.8508403361344538, + "grad_norm": 0.7660210546255793, + "learning_rate": 3.994468943952296e-05, + "loss": 0.2316, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23304234445095062, + "step": 810, + "valid_targets_mean": 1591.0, + "valid_targets_min": 897 + }, + { + "epoch": 0.8560924369747899, + "grad_norm": 0.8316792538373139, + "learning_rate": 3.994072771268041e-05, + "loss": 0.2177, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2084471583366394, + "step": 815, + "valid_targets_mean": 1290.1, + "valid_targets_min": 773 + }, + { + "epoch": 0.8613445378151261, + "grad_norm": 0.8668112604053329, + "learning_rate": 3.993662917754885e-05, + "loss": 0.2325, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24037593603134155, + "step": 820, + "valid_targets_mean": 1407.2, + "valid_targets_min": 679 + }, + { + "epoch": 0.8665966386554622, + "grad_norm": 0.9891212862372226, + "learning_rate": 3.993239386224732e-05, + "loss": 0.2266, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22597835958003998, + "step": 825, + "valid_targets_mean": 1600.2, + "valid_targets_min": 818 + }, + { + "epoch": 0.8718487394957983, + "grad_norm": 0.8365460249899657, + "learning_rate": 3.992802179583322e-05, + "loss": 0.2294, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22174695134162903, + "step": 830, + "valid_targets_mean": 1442.4, + "valid_targets_min": 790 + }, + { + "epoch": 0.8771008403361344, + "grad_norm": 0.955688819196928, + "learning_rate": 3.9923513008302204e-05, + "loss": 0.2233, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23063375055789948, + "step": 835, + "valid_targets_mean": 1426.6, + "valid_targets_min": 592 + }, + { + "epoch": 0.8823529411764706, + "grad_norm": 0.7775298281309749, + "learning_rate": 3.991886753058792e-05, + "loss": 0.2239, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21736116707324982, + "step": 840, + "valid_targets_mean": 1430.9, + "valid_targets_min": 662 + }, + { + "epoch": 0.8876050420168067, + "grad_norm": 0.9219183595495097, + "learning_rate": 3.991408539456182e-05, + "loss": 0.2397, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2496243417263031, + "step": 845, + "valid_targets_mean": 1412.6, + "valid_targets_min": 622 + }, + { + "epoch": 0.8928571428571429, + "grad_norm": 0.9447703661465241, + "learning_rate": 3.990916663303293e-05, + "loss": 0.2292, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2532111406326294, + "step": 850, + "valid_targets_mean": 1372.1, + "valid_targets_min": 667 + }, + { + "epoch": 0.898109243697479, + "grad_norm": 0.7856700847441219, + "learning_rate": 3.990411127974762e-05, + "loss": 0.235, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2314455211162567, + "step": 855, + "valid_targets_mean": 1628.1, + "valid_targets_min": 1012 + }, + { + "epoch": 0.9033613445378151, + "grad_norm": 0.9349349696144393, + "learning_rate": 3.989891936938939e-05, + "loss": 0.2331, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2500951886177063, + "step": 860, + "valid_targets_mean": 1464.7, + "valid_targets_min": 635 + }, + { + "epoch": 0.9086134453781513, + "grad_norm": 0.9119192470614107, + "learning_rate": 3.9893590937578634e-05, + "loss": 0.2337, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2547591030597687, + "step": 865, + "valid_targets_mean": 1745.9, + "valid_targets_min": 689 + }, + { + "epoch": 0.9138655462184874, + "grad_norm": 0.9202449016918255, + "learning_rate": 3.9888126020872375e-05, + "loss": 0.2197, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20298632979393005, + "step": 870, + "valid_targets_mean": 1129.1, + "valid_targets_min": 697 + }, + { + "epoch": 0.9191176470588235, + "grad_norm": 0.8174032516425299, + "learning_rate": 3.988252465676401e-05, + "loss": 0.2296, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25348424911499023, + "step": 875, + "valid_targets_mean": 1624.6, + "valid_targets_min": 656 + }, + { + "epoch": 0.9243697478991597, + "grad_norm": 0.7819162668790818, + "learning_rate": 3.98767868836831e-05, + "loss": 0.23, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27575284242630005, + "step": 880, + "valid_targets_mean": 1755.8, + "valid_targets_min": 697 + }, + { + "epoch": 0.9296218487394958, + "grad_norm": 0.8141268835699211, + "learning_rate": 3.987091274099504e-05, + "loss": 0.2229, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2335035800933838, + "step": 885, + "valid_targets_mean": 1516.4, + "valid_targets_min": 820 + }, + { + "epoch": 0.9348739495798319, + "grad_norm": 0.7937591348329995, + "learning_rate": 3.986490226900084e-05, + "loss": 0.2232, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22677749395370483, + "step": 890, + "valid_targets_mean": 1391.4, + "valid_targets_min": 680 + }, + { + "epoch": 0.9401260504201681, + "grad_norm": 0.8638827876332873, + "learning_rate": 3.985875550893684e-05, + "loss": 0.2125, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2247205227613449, + "step": 895, + "valid_targets_mean": 1412.4, + "valid_targets_min": 778 + }, + { + "epoch": 0.9453781512605042, + "grad_norm": 0.7937334625060325, + "learning_rate": 3.9852472502974386e-05, + "loss": 0.2369, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25422534346580505, + "step": 900, + "valid_targets_mean": 1599.6, + "valid_targets_min": 851 + }, + { + "epoch": 0.9506302521008403, + "grad_norm": 0.7815070706059014, + "learning_rate": 3.984605329421961e-05, + "loss": 0.2211, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21097871661186218, + "step": 905, + "valid_targets_mean": 1398.4, + "valid_targets_min": 692 + }, + { + "epoch": 0.9558823529411765, + "grad_norm": 0.7673078400464335, + "learning_rate": 3.983949792671307e-05, + "loss": 0.2148, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20964649319648743, + "step": 910, + "valid_targets_mean": 1477.9, + "valid_targets_min": 741 + }, + { + "epoch": 0.9611344537815126, + "grad_norm": 0.851415365699838, + "learning_rate": 3.9832806445429486e-05, + "loss": 0.2131, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20876117050647736, + "step": 915, + "valid_targets_mean": 1299.4, + "valid_targets_min": 639 + }, + { + "epoch": 0.9663865546218487, + "grad_norm": 0.866799347417237, + "learning_rate": 3.982597889627742e-05, + "loss": 0.2056, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21439066529273987, + "step": 920, + "valid_targets_mean": 1277.9, + "valid_targets_min": 743 + }, + { + "epoch": 0.9716386554621849, + "grad_norm": 0.7220607995686592, + "learning_rate": 3.981901532609896e-05, + "loss": 0.2239, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2239415943622589, + "step": 925, + "valid_targets_mean": 1529.9, + "valid_targets_min": 610 + }, + { + "epoch": 0.976890756302521, + "grad_norm": 0.7774847164190153, + "learning_rate": 3.9811915782669406e-05, + "loss": 0.2182, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20755037665367126, + "step": 930, + "valid_targets_mean": 1331.6, + "valid_targets_min": 695 + }, + { + "epoch": 0.9821428571428571, + "grad_norm": 0.7514140462848654, + "learning_rate": 3.980468031469691e-05, + "loss": 0.2219, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2222648710012436, + "step": 935, + "valid_targets_mean": 1581.9, + "valid_targets_min": 807 + }, + { + "epoch": 0.9873949579831933, + "grad_norm": 0.7556883989929587, + "learning_rate": 3.9797308971822206e-05, + "loss": 0.2155, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2113157957792282, + "step": 940, + "valid_targets_mean": 1327.6, + "valid_targets_min": 765 + }, + { + "epoch": 0.9926470588235294, + "grad_norm": 0.7916476167495613, + "learning_rate": 3.978980180461821e-05, + "loss": 0.2245, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23679675161838531, + "step": 945, + "valid_targets_mean": 1346.4, + "valid_targets_min": 591 + }, + { + "epoch": 0.9978991596638656, + "grad_norm": 0.7026077039339454, + "learning_rate": 3.9782158864589696e-05, + "loss": 0.2291, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20915091037750244, + "step": 950, + "valid_targets_mean": 1483.2, + "valid_targets_min": 692 + }, + { + "epoch": 1.0031512605042017, + "grad_norm": 0.5638798620218901, + "learning_rate": 3.977438020417293e-05, + "loss": 0.3126, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.33122366666793823, + "step": 955, + "valid_targets_mean": 4404.5, + "valid_targets_min": 1323 + }, + { + "epoch": 1.0084033613445378, + "grad_norm": 0.5755600203933873, + "learning_rate": 3.9766465876735354e-05, + "loss": 0.3596, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3643394112586975, + "step": 960, + "valid_targets_mean": 4483.4, + "valid_targets_min": 1005 + }, + { + "epoch": 1.013655462184874, + "grad_norm": 0.5433500453139155, + "learning_rate": 3.9758415936575155e-05, + "loss": 0.3387, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3266267776489258, + "step": 965, + "valid_targets_mean": 4502.1, + "valid_targets_min": 1509 + }, + { + "epoch": 1.01890756302521, + "grad_norm": 0.6267141368025664, + "learning_rate": 3.975023043892094e-05, + "loss": 0.3404, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3264230787754059, + "step": 970, + "valid_targets_mean": 3430.2, + "valid_targets_min": 1561 + }, + { + "epoch": 1.0241596638655461, + "grad_norm": 0.607104749067981, + "learning_rate": 3.974190943993133e-05, + "loss": 0.329, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3339942693710327, + "step": 975, + "valid_targets_mean": 3385.4, + "valid_targets_min": 1184 + }, + { + "epoch": 1.0294117647058822, + "grad_norm": 0.536136082897943, + "learning_rate": 3.973345299669461e-05, + "loss": 0.3558, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3149448335170746, + "step": 980, + "valid_targets_mean": 3982.6, + "valid_targets_min": 1413 + }, + { + "epoch": 1.0346638655462186, + "grad_norm": 0.5075659675082035, + "learning_rate": 3.972486116722828e-05, + "loss": 0.3169, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.32082343101501465, + "step": 985, + "valid_targets_mean": 4911.7, + "valid_targets_min": 2160 + }, + { + "epoch": 1.0399159663865547, + "grad_norm": 0.5581426071520623, + "learning_rate": 3.971613401047872e-05, + "loss": 0.3346, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.35363245010375977, + "step": 990, + "valid_targets_mean": 3782.6, + "valid_targets_min": 1511 + }, + { + "epoch": 1.0451680672268908, + "grad_norm": 0.698413730384984, + "learning_rate": 3.970727158632075e-05, + "loss": 0.3462, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.374415785074234, + "step": 995, + "valid_targets_mean": 3030.0, + "valid_targets_min": 1462 + }, + { + "epoch": 1.050420168067227, + "grad_norm": 0.6206079287451801, + "learning_rate": 3.969827395555721e-05, + "loss": 0.3457, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3208198845386505, + "step": 1000, + "valid_targets_mean": 3772.4, + "valid_targets_min": 874 + }, + { + "epoch": 1.055672268907563, + "grad_norm": 0.6660693366788901, + "learning_rate": 3.968914117991857e-05, + "loss": 0.3445, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3395417630672455, + "step": 1005, + "valid_targets_mean": 3337.1, + "valid_targets_min": 953 + }, + { + "epoch": 1.0609243697478992, + "grad_norm": 0.6001541700551754, + "learning_rate": 3.967987332206249e-05, + "loss": 0.3465, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3561500310897827, + "step": 1010, + "valid_targets_mean": 4284.9, + "valid_targets_min": 1265 + }, + { + "epoch": 1.0661764705882353, + "grad_norm": 0.5433768685257184, + "learning_rate": 3.967047044557341e-05, + "loss": 0.3387, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3220909833908081, + "step": 1015, + "valid_targets_mean": 5010.6, + "valid_targets_min": 1596 + }, + { + "epoch": 1.0714285714285714, + "grad_norm": 0.6300742894051691, + "learning_rate": 3.966093261496208e-05, + "loss": 0.3393, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3596876561641693, + "step": 1020, + "valid_targets_mean": 3490.4, + "valid_targets_min": 1759 + }, + { + "epoch": 1.0766806722689075, + "grad_norm": 0.6791244172980975, + "learning_rate": 3.9651259895665146e-05, + "loss": 0.3504, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.36252090334892273, + "step": 1025, + "valid_targets_mean": 3264.3, + "valid_targets_min": 1353 + }, + { + "epoch": 1.0819327731092436, + "grad_norm": 0.5749237683976328, + "learning_rate": 3.9641452354044687e-05, + "loss": 0.3478, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.31524378061294556, + "step": 1030, + "valid_targets_mean": 3814.6, + "valid_targets_min": 1643 + }, + { + "epoch": 1.0871848739495797, + "grad_norm": 0.6067338424067318, + "learning_rate": 3.9631510057387765e-05, + "loss": 0.345, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.32914769649505615, + "step": 1035, + "valid_targets_mean": 3166.1, + "valid_targets_min": 1269 + }, + { + "epoch": 1.092436974789916, + "grad_norm": 0.6139160246013105, + "learning_rate": 3.962143307390596e-05, + "loss": 0.3648, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3532394766807556, + "step": 1040, + "valid_targets_mean": 3617.4, + "valid_targets_min": 1681 + }, + { + "epoch": 1.0976890756302522, + "grad_norm": 0.5852424169834737, + "learning_rate": 3.961122147273491e-05, + "loss": 0.3475, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.306821346282959, + "step": 1045, + "valid_targets_mean": 3919.8, + "valid_targets_min": 1477 + }, + { + "epoch": 1.1029411764705883, + "grad_norm": 0.6196200689994448, + "learning_rate": 3.9600875323933826e-05, + "loss": 0.3494, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.34865230321884155, + "step": 1050, + "valid_targets_mean": 3418.5, + "valid_targets_min": 662 + }, + { + "epoch": 1.1081932773109244, + "grad_norm": 0.5913392876658434, + "learning_rate": 3.959039469848502e-05, + "loss": 0.3432, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3537408113479614, + "step": 1055, + "valid_targets_mean": 3706.7, + "valid_targets_min": 2077 + }, + { + "epoch": 1.1134453781512605, + "grad_norm": 0.6771276206524633, + "learning_rate": 3.9579779668293416e-05, + "loss": 0.3249, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3203701972961426, + "step": 1060, + "valid_targets_mean": 2878.1, + "valid_targets_min": 1505 + }, + { + "epoch": 1.1186974789915967, + "grad_norm": 0.6786962469374573, + "learning_rate": 3.956903030618605e-05, + "loss": 0.3523, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.35575729608535767, + "step": 1065, + "valid_targets_mean": 3418.0, + "valid_targets_min": 1957 + }, + { + "epoch": 1.1239495798319328, + "grad_norm": 0.5934416223711014, + "learning_rate": 3.955814668591156e-05, + "loss": 0.3487, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.38778382539749146, + "step": 1070, + "valid_targets_mean": 4106.4, + "valid_targets_min": 1704 + }, + { + "epoch": 1.129201680672269, + "grad_norm": 1.3852530686455735, + "learning_rate": 3.9547128882139735e-05, + "loss": 0.3349, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3465884327888489, + "step": 1075, + "valid_targets_mean": 3046.9, + "valid_targets_min": 1422 + }, + { + "epoch": 1.134453781512605, + "grad_norm": 0.5980418747067316, + "learning_rate": 3.9535976970460925e-05, + "loss": 0.3252, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3092625141143799, + "step": 1080, + "valid_targets_mean": 3447.4, + "valid_targets_min": 1603 + }, + { + "epoch": 1.1397058823529411, + "grad_norm": 0.7839568612134259, + "learning_rate": 3.9524691027385585e-05, + "loss": 0.3504, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3626514971256256, + "step": 1085, + "valid_targets_mean": 2597.8, + "valid_targets_min": 1685 + }, + { + "epoch": 1.1449579831932772, + "grad_norm": 0.6257049596683059, + "learning_rate": 3.95132711303437e-05, + "loss": 0.3294, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3430899977684021, + "step": 1090, + "valid_targets_mean": 3290.6, + "valid_targets_min": 1208 + }, + { + "epoch": 1.1502100840336134, + "grad_norm": 0.9029010729944724, + "learning_rate": 3.9501717357684315e-05, + "loss": 0.3368, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.326965868473053, + "step": 1095, + "valid_targets_mean": 2661.8, + "valid_targets_min": 1501 + }, + { + "epoch": 1.1554621848739495, + "grad_norm": 0.6012247577775289, + "learning_rate": 3.9490029788674934e-05, + "loss": 0.3438, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3628232479095459, + "step": 1100, + "valid_targets_mean": 3849.0, + "valid_targets_min": 1866 + }, + { + "epoch": 1.1607142857142858, + "grad_norm": 0.614388950135581, + "learning_rate": 3.9478208503501e-05, + "loss": 0.3242, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.31284618377685547, + "step": 1105, + "valid_targets_mean": 3397.9, + "valid_targets_min": 1239 + }, + { + "epoch": 1.165966386554622, + "grad_norm": 0.653467443640438, + "learning_rate": 3.946625358326538e-05, + "loss": 0.3439, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.346976101398468, + "step": 1110, + "valid_targets_mean": 3155.5, + "valid_targets_min": 1177 + }, + { + "epoch": 1.171218487394958, + "grad_norm": 0.579694254639963, + "learning_rate": 3.945416510998775e-05, + "loss": 0.3355, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.32414424419403076, + "step": 1115, + "valid_targets_mean": 3594.5, + "valid_targets_min": 1270 + }, + { + "epoch": 1.1764705882352942, + "grad_norm": 0.6219350779760418, + "learning_rate": 3.944194316660406e-05, + "loss": 0.3396, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3272247314453125, + "step": 1120, + "valid_targets_mean": 3571.2, + "valid_targets_min": 1216 + }, + { + "epoch": 1.1817226890756303, + "grad_norm": 0.6292410803179813, + "learning_rate": 3.942958783696598e-05, + "loss": 0.3334, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.32565245032310486, + "step": 1125, + "valid_targets_mean": 3290.8, + "valid_targets_min": 1184 + }, + { + "epoch": 1.1869747899159664, + "grad_norm": 0.678979812159635, + "learning_rate": 3.94170992058403e-05, + "loss": 0.3349, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3311670422554016, + "step": 1130, + "valid_targets_mean": 2986.1, + "valid_targets_min": 1292 + }, + { + "epoch": 1.1922268907563025, + "grad_norm": 0.6456475043572049, + "learning_rate": 3.9404477358908354e-05, + "loss": 0.3445, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3214397132396698, + "step": 1135, + "valid_targets_mean": 3485.4, + "valid_targets_min": 1639 + }, + { + "epoch": 1.1974789915966386, + "grad_norm": 0.6695778532642306, + "learning_rate": 3.9391722382765445e-05, + "loss": 0.3281, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.35410648584365845, + "step": 1140, + "valid_targets_mean": 2959.4, + "valid_targets_min": 1394 + }, + { + "epoch": 1.2027310924369747, + "grad_norm": 0.622191556528526, + "learning_rate": 3.937883436492025e-05, + "loss": 0.3351, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3593181073665619, + "step": 1145, + "valid_targets_mean": 3428.9, + "valid_targets_min": 2280 + }, + { + "epoch": 1.2079831932773109, + "grad_norm": 0.6333880919334702, + "learning_rate": 3.9365813393794186e-05, + "loss": 0.3265, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.35325169563293457, + "step": 1150, + "valid_targets_mean": 3233.9, + "valid_targets_min": 810 + }, + { + "epoch": 1.213235294117647, + "grad_norm": 0.6223354482954172, + "learning_rate": 3.9352659558720836e-05, + "loss": 0.3196, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3268436789512634, + "step": 1155, + "valid_targets_mean": 3211.6, + "valid_targets_min": 1654 + }, + { + "epoch": 1.2184873949579833, + "grad_norm": 0.659296380097006, + "learning_rate": 3.933937294994535e-05, + "loss": 0.3341, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.320861279964447, + "step": 1160, + "valid_targets_mean": 3057.8, + "valid_targets_min": 584 + }, + { + "epoch": 1.2237394957983194, + "grad_norm": 0.636761914351194, + "learning_rate": 3.932595365862379e-05, + "loss": 0.3322, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.34962353110313416, + "step": 1165, + "valid_targets_mean": 3572.6, + "valid_targets_min": 2498 + }, + { + "epoch": 1.2289915966386555, + "grad_norm": 0.6592752073339605, + "learning_rate": 3.9312401776822504e-05, + "loss": 0.3367, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.32008883357048035, + "step": 1170, + "valid_targets_mean": 3161.1, + "valid_targets_min": 1350 + }, + { + "epoch": 1.2342436974789917, + "grad_norm": 0.6063230189221366, + "learning_rate": 3.9298717397517546e-05, + "loss": 0.3365, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3388460874557495, + "step": 1175, + "valid_targets_mean": 3486.1, + "valid_targets_min": 1624 + }, + { + "epoch": 1.2394957983193278, + "grad_norm": 0.687253883898937, + "learning_rate": 3.928490061459396e-05, + "loss": 0.3067, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3046797513961792, + "step": 1180, + "valid_targets_mean": 2769.6, + "valid_targets_min": 916 + }, + { + "epoch": 1.2447478991596639, + "grad_norm": 0.5602035515910363, + "learning_rate": 3.927095152284521e-05, + "loss": 0.331, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3130587935447693, + "step": 1185, + "valid_targets_mean": 3734.1, + "valid_targets_min": 2209 + }, + { + "epoch": 1.25, + "grad_norm": 0.6913362496913676, + "learning_rate": 3.925687021797249e-05, + "loss": 0.3228, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.32542842626571655, + "step": 1190, + "valid_targets_mean": 3107.0, + "valid_targets_min": 1259 + }, + { + "epoch": 1.2552521008403361, + "grad_norm": 0.5736429239269779, + "learning_rate": 3.924265679658407e-05, + "loss": 0.3142, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.30502641201019287, + "step": 1195, + "valid_targets_mean": 3685.6, + "valid_targets_min": 1183 + }, + { + "epoch": 1.2605042016806722, + "grad_norm": 0.577437241781624, + "learning_rate": 3.922831135619462e-05, + "loss": 0.3109, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3453516364097595, + "step": 1200, + "valid_targets_mean": 3891.3, + "valid_targets_min": 1101 + }, + { + "epoch": 1.2657563025210083, + "grad_norm": 0.5958378130959316, + "learning_rate": 3.9213833995224605e-05, + "loss": 0.3321, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3231067359447479, + "step": 1205, + "valid_targets_mean": 3877.6, + "valid_targets_min": 1658 + }, + { + "epoch": 1.2710084033613445, + "grad_norm": 0.6735908115281981, + "learning_rate": 3.919922481299952e-05, + "loss": 0.3188, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3365190923213959, + "step": 1210, + "valid_targets_mean": 3050.1, + "valid_targets_min": 1423 + }, + { + "epoch": 1.2762605042016806, + "grad_norm": 0.6601685873762229, + "learning_rate": 3.918448390974928e-05, + "loss": 0.3281, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3299792408943176, + "step": 1215, + "valid_targets_mean": 3202.4, + "valid_targets_min": 1185 + }, + { + "epoch": 1.2815126050420167, + "grad_norm": 0.6705034899134344, + "learning_rate": 3.9169611386607476e-05, + "loss": 0.3418, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.34724968671798706, + "step": 1220, + "valid_targets_mean": 3779.1, + "valid_targets_min": 1091 + }, + { + "epoch": 1.2867647058823528, + "grad_norm": 0.5833278508200939, + "learning_rate": 3.9154607345610746e-05, + "loss": 0.3194, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3058725893497467, + "step": 1225, + "valid_targets_mean": 3628.9, + "valid_targets_min": 1352 + }, + { + "epoch": 1.2920168067226891, + "grad_norm": 0.5696798688900944, + "learning_rate": 3.913947188969801e-05, + "loss": 0.3224, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.32415255904197693, + "step": 1230, + "valid_targets_mean": 4061.2, + "valid_targets_min": 1535 + }, + { + "epoch": 1.2972689075630253, + "grad_norm": 0.6650203053880857, + "learning_rate": 3.912420512270981e-05, + "loss": 0.3106, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3156277537345886, + "step": 1235, + "valid_targets_mean": 2753.1, + "valid_targets_min": 854 + }, + { + "epoch": 1.3025210084033614, + "grad_norm": 0.6404333915329682, + "learning_rate": 3.910880714938757e-05, + "loss": 0.3168, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.30156928300857544, + "step": 1240, + "valid_targets_mean": 2942.5, + "valid_targets_min": 1179 + }, + { + "epoch": 1.3077731092436975, + "grad_norm": 0.604288417212929, + "learning_rate": 3.909327807537288e-05, + "loss": 0.3221, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.30336058139801025, + "step": 1245, + "valid_targets_mean": 3598.9, + "valid_targets_min": 1290 + }, + { + "epoch": 1.3130252100840336, + "grad_norm": 0.875497325929702, + "learning_rate": 3.90776180072068e-05, + "loss": 0.3127, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.32053911685943604, + "step": 1250, + "valid_targets_mean": 2332.6, + "valid_targets_min": 642 + }, + { + "epoch": 1.3182773109243697, + "grad_norm": 0.6151615426766832, + "learning_rate": 3.906182705232909e-05, + "loss": 0.3084, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3063713312149048, + "step": 1255, + "valid_targets_mean": 3670.2, + "valid_targets_min": 1764 + }, + { + "epoch": 1.3235294117647058, + "grad_norm": 0.6686081770965902, + "learning_rate": 3.904590531907751e-05, + "loss": 0.3375, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3719046711921692, + "step": 1260, + "valid_targets_mean": 3528.6, + "valid_targets_min": 1410 + }, + { + "epoch": 1.328781512605042, + "grad_norm": 0.7395507920156082, + "learning_rate": 3.9029852916687034e-05, + "loss": 0.3145, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3327389657497406, + "step": 1265, + "valid_targets_mean": 3147.7, + "valid_targets_min": 1683 + }, + { + "epoch": 1.334033613445378, + "grad_norm": 0.709030289881482, + "learning_rate": 3.9013669955289136e-05, + "loss": 0.3181, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3167096972465515, + "step": 1270, + "valid_targets_mean": 3632.5, + "valid_targets_min": 996 + }, + { + "epoch": 1.3392857142857144, + "grad_norm": 0.6586192793197465, + "learning_rate": 3.899735654591101e-05, + "loss": 0.3171, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3190867602825165, + "step": 1275, + "valid_targets_mean": 3135.3, + "valid_targets_min": 1349 + }, + { + "epoch": 1.3445378151260505, + "grad_norm": 0.682140733121633, + "learning_rate": 3.898091280047486e-05, + "loss": 0.3167, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.33190667629241943, + "step": 1280, + "valid_targets_mean": 3391.6, + "valid_targets_min": 1248 + }, + { + "epoch": 1.3497899159663866, + "grad_norm": 0.5957692884205409, + "learning_rate": 3.896433883179703e-05, + "loss": 0.3131, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3161918520927429, + "step": 1285, + "valid_targets_mean": 3323.4, + "valid_targets_min": 1445 + }, + { + "epoch": 1.3550420168067228, + "grad_norm": 0.6350286869649353, + "learning_rate": 3.894763475358736e-05, + "loss": 0.3115, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3040814995765686, + "step": 1290, + "valid_targets_mean": 3134.3, + "valid_targets_min": 2000 + }, + { + "epoch": 1.3602941176470589, + "grad_norm": 0.6934797525878172, + "learning_rate": 3.8930800680448275e-05, + "loss": 0.3064, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.32412275671958923, + "step": 1295, + "valid_targets_mean": 2828.3, + "valid_targets_min": 1197 + }, + { + "epoch": 1.365546218487395, + "grad_norm": 0.6077199732980291, + "learning_rate": 3.891383672787411e-05, + "loss": 0.331, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.32446929812431335, + "step": 1300, + "valid_targets_mean": 3219.0, + "valid_targets_min": 1223 + }, + { + "epoch": 1.370798319327731, + "grad_norm": 0.6275476086489861, + "learning_rate": 3.889674301225025e-05, + "loss": 0.3223, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.29918792843818665, + "step": 1305, + "valid_targets_mean": 3199.2, + "valid_targets_min": 869 + }, + { + "epoch": 1.3760504201680672, + "grad_norm": 0.6746694949290901, + "learning_rate": 3.8879519650852356e-05, + "loss": 0.3256, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.33456575870513916, + "step": 1310, + "valid_targets_mean": 2817.8, + "valid_targets_min": 1603 + }, + { + "epoch": 1.3813025210084033, + "grad_norm": 0.6421028373174448, + "learning_rate": 3.886216676184555e-05, + "loss": 0.3302, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3090163767337799, + "step": 1315, + "valid_targets_mean": 2942.2, + "valid_targets_min": 1135 + }, + { + "epoch": 1.3865546218487395, + "grad_norm": 0.5573926446318049, + "learning_rate": 3.8844684464283614e-05, + "loss": 0.3167, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.33767062425613403, + "step": 1320, + "valid_targets_mean": 4077.0, + "valid_targets_min": 1994 + }, + { + "epoch": 1.3918067226890756, + "grad_norm": 0.637126836573775, + "learning_rate": 3.882707287810817e-05, + "loss": 0.3286, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.30095210671424866, + "step": 1325, + "valid_targets_mean": 3060.1, + "valid_targets_min": 1066 + }, + { + "epoch": 1.3970588235294117, + "grad_norm": 0.6321058379302512, + "learning_rate": 3.880933212414786e-05, + "loss": 0.3285, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.33812808990478516, + "step": 1330, + "valid_targets_mean": 3687.4, + "valid_targets_min": 1211 + }, + { + "epoch": 1.4023109243697478, + "grad_norm": 0.6375112145565428, + "learning_rate": 3.87914623241175e-05, + "loss": 0.3213, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3038761019706726, + "step": 1335, + "valid_targets_mean": 2972.2, + "valid_targets_min": 1195 + }, + { + "epoch": 1.407563025210084, + "grad_norm": 0.7592514428689119, + "learning_rate": 3.877346360061728e-05, + "loss": 0.3291, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3361939489841461, + "step": 1340, + "valid_targets_mean": 2429.5, + "valid_targets_min": 484 + }, + { + "epoch": 1.41281512605042, + "grad_norm": 0.6066430879087057, + "learning_rate": 3.8755336077131894e-05, + "loss": 0.3227, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3248080015182495, + "step": 1345, + "valid_targets_mean": 3851.9, + "valid_targets_min": 1257 + }, + { + "epoch": 1.4180672268907564, + "grad_norm": 0.5858554643624372, + "learning_rate": 3.873707987802967e-05, + "loss": 0.3208, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.304246723651886, + "step": 1350, + "valid_targets_mean": 3483.2, + "valid_targets_min": 1372 + }, + { + "epoch": 1.4233193277310925, + "grad_norm": 0.6612075948640241, + "learning_rate": 3.871869512856179e-05, + "loss": 0.3129, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3278389275074005, + "step": 1355, + "valid_targets_mean": 3186.8, + "valid_targets_min": 1769 + }, + { + "epoch": 1.4285714285714286, + "grad_norm": 0.6552998713136254, + "learning_rate": 3.870018195486138e-05, + "loss": 0.3158, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.31067150831222534, + "step": 1360, + "valid_targets_mean": 3407.6, + "valid_targets_min": 1074 + }, + { + "epoch": 1.4338235294117647, + "grad_norm": 0.5966743275691717, + "learning_rate": 3.868154048394262e-05, + "loss": 0.3239, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3010474741458893, + "step": 1365, + "valid_targets_mean": 3796.4, + "valid_targets_min": 980 + }, + { + "epoch": 1.4390756302521008, + "grad_norm": 0.7359011060228771, + "learning_rate": 3.8662770843699944e-05, + "loss": 0.3306, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3496723771095276, + "step": 1370, + "valid_targets_mean": 2808.1, + "valid_targets_min": 793 + }, + { + "epoch": 1.444327731092437, + "grad_norm": 0.65437369178061, + "learning_rate": 3.8643873162907086e-05, + "loss": 0.3076, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3403715491294861, + "step": 1375, + "valid_targets_mean": 3677.5, + "valid_targets_min": 1471 + }, + { + "epoch": 1.449579831932773, + "grad_norm": 0.6531132095155441, + "learning_rate": 3.862484757121627e-05, + "loss": 0.3079, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.28045761585235596, + "step": 1380, + "valid_targets_mean": 3032.6, + "valid_targets_min": 1353 + }, + { + "epoch": 1.4548319327731092, + "grad_norm": 0.7024121158190606, + "learning_rate": 3.860569419915727e-05, + "loss": 0.3108, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.31772103905677795, + "step": 1385, + "valid_targets_mean": 2601.9, + "valid_targets_min": 1084 + }, + { + "epoch": 1.4600840336134453, + "grad_norm": 0.6174258612511311, + "learning_rate": 3.858641317813653e-05, + "loss": 0.303, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3092023730278015, + "step": 1390, + "valid_targets_mean": 3280.8, + "valid_targets_min": 1428 + }, + { + "epoch": 1.4653361344537816, + "grad_norm": 0.6773260761366405, + "learning_rate": 3.8567004640436234e-05, + "loss": 0.2957, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.30377262830734253, + "step": 1395, + "valid_targets_mean": 3229.4, + "valid_targets_min": 1193 + }, + { + "epoch": 1.4705882352941178, + "grad_norm": 0.6442894382965205, + "learning_rate": 3.8547468719213476e-05, + "loss": 0.303, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2951875925064087, + "step": 1400, + "valid_targets_mean": 3519.2, + "valid_targets_min": 1614 + }, + { + "epoch": 1.4758403361344539, + "grad_norm": 0.6233027503211065, + "learning_rate": 3.852780554849925e-05, + "loss": 0.296, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2837674617767334, + "step": 1405, + "valid_targets_mean": 3699.1, + "valid_targets_min": 974 + }, + { + "epoch": 1.48109243697479, + "grad_norm": 0.6558871789844729, + "learning_rate": 3.850801526319761e-05, + "loss": 0.3004, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.277635395526886, + "step": 1410, + "valid_targets_mean": 2730.4, + "valid_targets_min": 1575 + }, + { + "epoch": 1.486344537815126, + "grad_norm": 0.5993355650257447, + "learning_rate": 3.84880979990847e-05, + "loss": 0.3028, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.289740651845932, + "step": 1415, + "valid_targets_mean": 3345.0, + "valid_targets_min": 1697 + }, + { + "epoch": 1.4915966386554622, + "grad_norm": 0.5660470420295868, + "learning_rate": 3.846805389280782e-05, + "loss": 0.3022, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2910107374191284, + "step": 1420, + "valid_targets_mean": 3602.2, + "valid_targets_min": 1970 + }, + { + "epoch": 1.4968487394957983, + "grad_norm": 0.6727298285320141, + "learning_rate": 3.844788308188452e-05, + "loss": 0.3296, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3241168260574341, + "step": 1425, + "valid_targets_mean": 3128.4, + "valid_targets_min": 887 + }, + { + "epoch": 1.5021008403361344, + "grad_norm": 0.7266333636248493, + "learning_rate": 3.8427585704701634e-05, + "loss": 0.3085, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3230634331703186, + "step": 1430, + "valid_targets_mean": 2712.2, + "valid_targets_min": 1279 + }, + { + "epoch": 1.5073529411764706, + "grad_norm": 0.625826335328431, + "learning_rate": 3.840716190051433e-05, + "loss": 0.2988, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.28237617015838623, + "step": 1435, + "valid_targets_mean": 3052.6, + "valid_targets_min": 1021 + }, + { + "epoch": 1.5126050420168067, + "grad_norm": 0.643231670297035, + "learning_rate": 3.8386611809445155e-05, + "loss": 0.3098, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.30906054377555847, + "step": 1440, + "valid_targets_mean": 3352.1, + "valid_targets_min": 654 + }, + { + "epoch": 1.5178571428571428, + "grad_norm": 0.7439322282160008, + "learning_rate": 3.8365935572483095e-05, + "loss": 0.3074, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3927016258239746, + "step": 1445, + "valid_targets_mean": 2860.6, + "valid_targets_min": 1039 + }, + { + "epoch": 1.523109243697479, + "grad_norm": 0.5906966913938343, + "learning_rate": 3.834513333148258e-05, + "loss": 0.3107, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.29975053668022156, + "step": 1450, + "valid_targets_mean": 3742.9, + "valid_targets_min": 2459 + }, + { + "epoch": 1.528361344537815, + "grad_norm": 0.5784262635567486, + "learning_rate": 3.832420522916252e-05, + "loss": 0.3133, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27920496463775635, + "step": 1455, + "valid_targets_mean": 3435.8, + "valid_targets_min": 1276 + }, + { + "epoch": 1.5336134453781511, + "grad_norm": 0.5304379397196218, + "learning_rate": 3.830315140910534e-05, + "loss": 0.3032, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2916795015335083, + "step": 1460, + "valid_targets_mean": 4335.8, + "valid_targets_min": 1572 + }, + { + "epoch": 1.5388655462184873, + "grad_norm": 0.690684220200614, + "learning_rate": 3.8281972015755965e-05, + "loss": 0.309, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.32439422607421875, + "step": 1465, + "valid_targets_mean": 2975.5, + "valid_targets_min": 791 + }, + { + "epoch": 1.5441176470588234, + "grad_norm": 0.9031172365787135, + "learning_rate": 3.826066719442086e-05, + "loss": 0.2345, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22157755494117737, + "step": 1470, + "valid_targets_mean": 1444.9, + "valid_targets_min": 740 + }, + { + "epoch": 1.5493697478991597, + "grad_norm": 0.8412510599148572, + "learning_rate": 3.823923709126701e-05, + "loss": 0.2161, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22126498818397522, + "step": 1475, + "valid_targets_mean": 1456.5, + "valid_targets_min": 612 + }, + { + "epoch": 1.5546218487394958, + "grad_norm": 1.1541206078120574, + "learning_rate": 3.821768185332095e-05, + "loss": 0.2097, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2107081413269043, + "step": 1480, + "valid_targets_mean": 1432.6, + "valid_targets_min": 826 + }, + { + "epoch": 1.559873949579832, + "grad_norm": 0.8048779001890545, + "learning_rate": 3.81960016284677e-05, + "loss": 0.2089, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.192092627286911, + "step": 1485, + "valid_targets_mean": 1432.6, + "valid_targets_min": 742 + }, + { + "epoch": 1.565126050420168, + "grad_norm": 0.8091682143521767, + "learning_rate": 3.817419656544979e-05, + "loss": 0.2141, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21445538103580475, + "step": 1490, + "valid_targets_mean": 1387.0, + "valid_targets_min": 718 + }, + { + "epoch": 1.5703781512605042, + "grad_norm": 0.8028634331257293, + "learning_rate": 3.815226681386626e-05, + "loss": 0.2181, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21761010587215424, + "step": 1495, + "valid_targets_mean": 1527.4, + "valid_targets_min": 764 + }, + { + "epoch": 1.5756302521008403, + "grad_norm": 0.7439177233189905, + "learning_rate": 3.8130212524171576e-05, + "loss": 0.2007, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19787126779556274, + "step": 1500, + "valid_targets_mean": 1353.6, + "valid_targets_min": 725 + }, + { + "epoch": 1.5808823529411766, + "grad_norm": 0.8142970979200826, + "learning_rate": 3.810803384767465e-05, + "loss": 0.2207, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1932760328054428, + "step": 1505, + "valid_targets_mean": 1309.9, + "valid_targets_min": 610 + }, + { + "epoch": 1.5861344537815127, + "grad_norm": 0.7340679359153581, + "learning_rate": 3.808573093653777e-05, + "loss": 0.2028, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19831883907318115, + "step": 1510, + "valid_targets_mean": 1465.4, + "valid_targets_min": 720 + }, + { + "epoch": 1.5913865546218489, + "grad_norm": 0.7860661366128959, + "learning_rate": 3.806330394377556e-05, + "loss": 0.2069, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19419294595718384, + "step": 1515, + "valid_targets_mean": 1379.4, + "valid_targets_min": 615 + }, + { + "epoch": 1.596638655462185, + "grad_norm": 0.8568638447176881, + "learning_rate": 3.8040753023253956e-05, + "loss": 0.2049, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2107909917831421, + "step": 1520, + "valid_targets_mean": 1158.2, + "valid_targets_min": 593 + }, + { + "epoch": 1.601890756302521, + "grad_norm": 0.6995773260097756, + "learning_rate": 3.801807832968912e-05, + "loss": 0.2085, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1988203525543213, + "step": 1525, + "valid_targets_mean": 1543.1, + "valid_targets_min": 704 + }, + { + "epoch": 1.6071428571428572, + "grad_norm": 0.7456785948304131, + "learning_rate": 3.799528001864637e-05, + "loss": 0.1984, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17537815868854523, + "step": 1530, + "valid_targets_mean": 1300.1, + "valid_targets_min": 722 + }, + { + "epoch": 1.6123949579831933, + "grad_norm": 0.8087741971757628, + "learning_rate": 3.797235824653918e-05, + "loss": 0.201, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20719020068645477, + "step": 1535, + "valid_targets_mean": 1401.3, + "valid_targets_min": 642 + }, + { + "epoch": 1.6176470588235294, + "grad_norm": 0.7888860351461294, + "learning_rate": 3.7949313170628006e-05, + "loss": 0.1935, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2095479965209961, + "step": 1540, + "valid_targets_mean": 1436.8, + "valid_targets_min": 518 + }, + { + "epoch": 1.6228991596638656, + "grad_norm": 0.767345470182285, + "learning_rate": 3.79261449490193e-05, + "loss": 0.2106, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22027720510959625, + "step": 1545, + "valid_targets_mean": 1531.6, + "valid_targets_min": 728 + }, + { + "epoch": 1.6281512605042017, + "grad_norm": 0.8137805205710857, + "learning_rate": 3.7902853740664356e-05, + "loss": 0.2073, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21532106399536133, + "step": 1550, + "valid_targets_mean": 1469.6, + "valid_targets_min": 764 + }, + { + "epoch": 1.6334033613445378, + "grad_norm": 0.9016471374390324, + "learning_rate": 3.7879439705358286e-05, + "loss": 0.2139, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23087842762470245, + "step": 1555, + "valid_targets_mean": 1437.8, + "valid_targets_min": 818 + }, + { + "epoch": 1.638655462184874, + "grad_norm": 0.8353128948745288, + "learning_rate": 3.785590300373884e-05, + "loss": 0.2004, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2092447727918625, + "step": 1560, + "valid_targets_mean": 1327.3, + "valid_targets_min": 625 + }, + { + "epoch": 1.64390756302521, + "grad_norm": 0.868105384855138, + "learning_rate": 3.7832243797285385e-05, + "loss": 0.203, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21071121096611023, + "step": 1565, + "valid_targets_mean": 1685.2, + "valid_targets_min": 790 + }, + { + "epoch": 1.6491596638655461, + "grad_norm": 0.7919143845079746, + "learning_rate": 3.780846224831775e-05, + "loss": 0.2109, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2265183925628662, + "step": 1570, + "valid_targets_mean": 1595.3, + "valid_targets_min": 891 + }, + { + "epoch": 1.6544117647058822, + "grad_norm": 0.7549544772773371, + "learning_rate": 3.7784558519995135e-05, + "loss": 0.203, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18298515677452087, + "step": 1575, + "valid_targets_mean": 1381.1, + "valid_targets_min": 719 + }, + { + "epoch": 1.6596638655462184, + "grad_norm": 0.804144396397427, + "learning_rate": 3.776053277631496e-05, + "loss": 0.197, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1860344111919403, + "step": 1580, + "valid_targets_mean": 1345.7, + "valid_targets_min": 657 + }, + { + "epoch": 1.6649159663865545, + "grad_norm": 0.9064506425487462, + "learning_rate": 3.7736385182111785e-05, + "loss": 0.1997, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20600754022598267, + "step": 1585, + "valid_targets_mean": 1342.1, + "valid_targets_min": 783 + }, + { + "epoch": 1.6701680672268906, + "grad_norm": 0.8588049760182106, + "learning_rate": 3.771211590305614e-05, + "loss": 0.1956, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1966136246919632, + "step": 1590, + "valid_targets_mean": 1450.6, + "valid_targets_min": 629 + }, + { + "epoch": 1.675420168067227, + "grad_norm": 0.7948243288514434, + "learning_rate": 3.768772510565342e-05, + "loss": 0.1987, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2040775567293167, + "step": 1595, + "valid_targets_mean": 1461.3, + "valid_targets_min": 678 + }, + { + "epoch": 1.680672268907563, + "grad_norm": 0.8255403927136926, + "learning_rate": 3.76632129572427e-05, + "loss": 0.1992, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20673060417175293, + "step": 1600, + "valid_targets_mean": 1723.1, + "valid_targets_min": 1075 + }, + { + "epoch": 1.6859243697478992, + "grad_norm": 0.7484827437017396, + "learning_rate": 3.763857962599565e-05, + "loss": 0.2019, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20060554146766663, + "step": 1605, + "valid_targets_mean": 1669.1, + "valid_targets_min": 816 + }, + { + "epoch": 1.6911764705882353, + "grad_norm": 0.7780511290517912, + "learning_rate": 3.761382528091531e-05, + "loss": 0.1956, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21109002828598022, + "step": 1610, + "valid_targets_mean": 1521.4, + "valid_targets_min": 957 + }, + { + "epoch": 1.6964285714285714, + "grad_norm": 0.8261801428366944, + "learning_rate": 3.7588950091834986e-05, + "loss": 0.1987, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18024760484695435, + "step": 1615, + "valid_targets_mean": 1282.1, + "valid_targets_min": 643 + }, + { + "epoch": 1.7016806722689075, + "grad_norm": 0.7650069206711103, + "learning_rate": 3.756395422941706e-05, + "loss": 0.2052, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20178046822547913, + "step": 1620, + "valid_targets_mean": 1499.7, + "valid_targets_min": 726 + }, + { + "epoch": 1.7069327731092439, + "grad_norm": 0.7087222035820604, + "learning_rate": 3.753883786515181e-05, + "loss": 0.1919, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19103536009788513, + "step": 1625, + "valid_targets_mean": 1621.1, + "valid_targets_min": 705 + }, + { + "epoch": 1.71218487394958, + "grad_norm": 0.8887563433958335, + "learning_rate": 3.751360117135628e-05, + "loss": 0.1956, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20276349782943726, + "step": 1630, + "valid_targets_mean": 1390.9, + "valid_targets_min": 700 + }, + { + "epoch": 1.717436974789916, + "grad_norm": 0.8362395348050953, + "learning_rate": 3.7488244321173025e-05, + "loss": 0.1854, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18552342057228088, + "step": 1635, + "valid_targets_mean": 1254.4, + "valid_targets_min": 627 + }, + { + "epoch": 1.7226890756302522, + "grad_norm": 0.8655931910128335, + "learning_rate": 3.746276748856898e-05, + "loss": 0.1951, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18865495920181274, + "step": 1640, + "valid_targets_mean": 1479.2, + "valid_targets_min": 817 + }, + { + "epoch": 1.7279411764705883, + "grad_norm": 0.792892975194453, + "learning_rate": 3.743717084833425e-05, + "loss": 0.1969, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19585290551185608, + "step": 1645, + "valid_targets_mean": 1464.4, + "valid_targets_min": 974 + }, + { + "epoch": 1.7331932773109244, + "grad_norm": 0.779810593913834, + "learning_rate": 3.741145457608093e-05, + "loss": 0.1966, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20523177087306976, + "step": 1650, + "valid_targets_mean": 1381.2, + "valid_targets_min": 657 + }, + { + "epoch": 1.7384453781512605, + "grad_norm": 0.7826687066418191, + "learning_rate": 3.738561884824183e-05, + "loss": 0.1997, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20436634123325348, + "step": 1655, + "valid_targets_mean": 1486.0, + "valid_targets_min": 746 + }, + { + "epoch": 1.7436974789915967, + "grad_norm": 0.7652636064297311, + "learning_rate": 3.735966384206936e-05, + "loss": 0.1986, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20646733045578003, + "step": 1660, + "valid_targets_mean": 1459.7, + "valid_targets_min": 739 + }, + { + "epoch": 1.7489495798319328, + "grad_norm": 0.7655125678378137, + "learning_rate": 3.733358973563425e-05, + "loss": 0.1921, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18100708723068237, + "step": 1665, + "valid_targets_mean": 1397.0, + "valid_targets_min": 682 + }, + { + "epoch": 1.754201680672269, + "grad_norm": 0.7963580538812527, + "learning_rate": 3.730739670782435e-05, + "loss": 0.1914, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19578437507152557, + "step": 1670, + "valid_targets_mean": 1288.8, + "valid_targets_min": 703 + }, + { + "epoch": 1.759453781512605, + "grad_norm": 0.8662683116944544, + "learning_rate": 3.72810849383434e-05, + "loss": 0.2051, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18982970714569092, + "step": 1675, + "valid_targets_mean": 1446.1, + "valid_targets_min": 864 + }, + { + "epoch": 1.7647058823529411, + "grad_norm": 0.783041949999934, + "learning_rate": 3.725465460770978e-05, + "loss": 0.209, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25431910157203674, + "step": 1680, + "valid_targets_mean": 1673.2, + "valid_targets_min": 734 + }, + { + "epoch": 1.7699579831932772, + "grad_norm": 0.7217643791824649, + "learning_rate": 3.7228105897255324e-05, + "loss": 0.195, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2004881650209427, + "step": 1685, + "valid_targets_mean": 1598.7, + "valid_targets_min": 607 + }, + { + "epoch": 1.7752100840336134, + "grad_norm": 0.7436378042988409, + "learning_rate": 3.7201438989124e-05, + "loss": 0.1917, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1999681144952774, + "step": 1690, + "valid_targets_mean": 1445.2, + "valid_targets_min": 551 + }, + { + "epoch": 1.7804621848739495, + "grad_norm": 0.7501915605313334, + "learning_rate": 3.717465406627074e-05, + "loss": 0.2001, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20576688647270203, + "step": 1695, + "valid_targets_mean": 1552.2, + "valid_targets_min": 791 + }, + { + "epoch": 1.7857142857142856, + "grad_norm": 0.7628246639482904, + "learning_rate": 3.714775131246011e-05, + "loss": 0.2009, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20440012216567993, + "step": 1700, + "valid_targets_mean": 1511.6, + "valid_targets_min": 825 + }, + { + "epoch": 1.7909663865546217, + "grad_norm": 0.7246985646816825, + "learning_rate": 3.71207309122651e-05, + "loss": 0.1889, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20958301424980164, + "step": 1705, + "valid_targets_mean": 1489.3, + "valid_targets_min": 859 + }, + { + "epoch": 1.7962184873949578, + "grad_norm": 0.8076167406390439, + "learning_rate": 3.709359305106585e-05, + "loss": 0.1866, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18848812580108643, + "step": 1710, + "valid_targets_mean": 1356.9, + "valid_targets_min": 737 + }, + { + "epoch": 1.8014705882352942, + "grad_norm": 0.7618349813747334, + "learning_rate": 3.7066337915048354e-05, + "loss": 0.201, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19808264076709747, + "step": 1715, + "valid_targets_mean": 1359.9, + "valid_targets_min": 791 + }, + { + "epoch": 1.8067226890756303, + "grad_norm": 0.8211165193393286, + "learning_rate": 3.7038965691203205e-05, + "loss": 0.2016, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20665648579597473, + "step": 1720, + "valid_targets_mean": 1443.4, + "valid_targets_min": 724 + }, + { + "epoch": 1.8119747899159664, + "grad_norm": 1.5195639624253412, + "learning_rate": 3.701147656732431e-05, + "loss": 0.1928, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18661421537399292, + "step": 1725, + "valid_targets_mean": 1376.3, + "valid_targets_min": 944 + }, + { + "epoch": 1.8172268907563025, + "grad_norm": 1.3672377372582318, + "learning_rate": 3.6983870732007596e-05, + "loss": 0.1883, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.171901673078537, + "step": 1730, + "valid_targets_mean": 1597.7, + "valid_targets_min": 802 + }, + { + "epoch": 1.8224789915966386, + "grad_norm": 0.7029694603857538, + "learning_rate": 3.695614837464972e-05, + "loss": 0.2015, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18585661053657532, + "step": 1735, + "valid_targets_mean": 1419.2, + "valid_targets_min": 740 + }, + { + "epoch": 1.8277310924369747, + "grad_norm": 0.7128079074101666, + "learning_rate": 3.692830968544675e-05, + "loss": 0.192, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1792781949043274, + "step": 1740, + "valid_targets_mean": 1570.5, + "valid_targets_min": 881 + }, + { + "epoch": 1.832983193277311, + "grad_norm": 0.7873525110103127, + "learning_rate": 3.690035485539291e-05, + "loss": 0.1863, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18637944757938385, + "step": 1745, + "valid_targets_mean": 1177.1, + "valid_targets_min": 636 + }, + { + "epoch": 1.8382352941176472, + "grad_norm": 0.812792057458698, + "learning_rate": 3.6872284076279205e-05, + "loss": 0.1911, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18359485268592834, + "step": 1750, + "valid_targets_mean": 1280.1, + "valid_targets_min": 814 + }, + { + "epoch": 1.8434873949579833, + "grad_norm": 0.7516261504287793, + "learning_rate": 3.684409754069215e-05, + "loss": 0.1801, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18630534410476685, + "step": 1755, + "valid_targets_mean": 1253.6, + "valid_targets_min": 604 + }, + { + "epoch": 1.8487394957983194, + "grad_norm": 0.7873312358062879, + "learning_rate": 3.681579544201244e-05, + "loss": 0.1939, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1809154450893402, + "step": 1760, + "valid_targets_mean": 1232.8, + "valid_targets_min": 661 + }, + { + "epoch": 1.8539915966386555, + "grad_norm": 0.7042638950908449, + "learning_rate": 3.6787377974413614e-05, + "loss": 0.1927, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1879248321056366, + "step": 1765, + "valid_targets_mean": 1484.8, + "valid_targets_min": 728 + }, + { + "epoch": 1.8592436974789917, + "grad_norm": 0.8708411897151677, + "learning_rate": 3.6758845332860734e-05, + "loss": 0.1897, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2018292248249054, + "step": 1770, + "valid_targets_mean": 1383.6, + "valid_targets_min": 692 + }, + { + "epoch": 1.8644957983193278, + "grad_norm": 0.727245204127273, + "learning_rate": 3.673019771310903e-05, + "loss": 0.1971, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19675494730472565, + "step": 1775, + "valid_targets_mean": 1386.2, + "valid_targets_min": 840 + }, + { + "epoch": 1.8697478991596639, + "grad_norm": 0.769303157042911, + "learning_rate": 3.670143531170258e-05, + "loss": 0.1945, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.200996533036232, + "step": 1780, + "valid_targets_mean": 1375.6, + "valid_targets_min": 772 + }, + { + "epoch": 1.875, + "grad_norm": 0.6945199303988268, + "learning_rate": 3.667255832597294e-05, + "loss": 0.1922, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19052547216415405, + "step": 1785, + "valid_targets_mean": 1612.4, + "valid_targets_min": 670 + }, + { + "epoch": 1.8802521008403361, + "grad_norm": 0.7679602226980033, + "learning_rate": 3.664356695403781e-05, + "loss": 0.1919, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18414106965065002, + "step": 1790, + "valid_targets_mean": 1427.0, + "valid_targets_min": 750 + }, + { + "epoch": 1.8855042016806722, + "grad_norm": 0.7707612142751945, + "learning_rate": 3.661446139479965e-05, + "loss": 0.1971, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20061108469963074, + "step": 1795, + "valid_targets_mean": 1479.3, + "valid_targets_min": 766 + }, + { + "epoch": 1.8907563025210083, + "grad_norm": 0.8561024756443094, + "learning_rate": 3.658524184794436e-05, + "loss": 0.1953, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16889707744121552, + "step": 1800, + "valid_targets_mean": 1241.5, + "valid_targets_min": 729 + }, + { + "epoch": 1.8960084033613445, + "grad_norm": 0.7618847795685194, + "learning_rate": 3.655590851393984e-05, + "loss": 0.1998, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20724733173847198, + "step": 1805, + "valid_targets_mean": 1410.9, + "valid_targets_min": 682 + }, + { + "epoch": 1.9012605042016806, + "grad_norm": 0.7752684468128507, + "learning_rate": 3.652646159403468e-05, + "loss": 0.206, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20427414774894714, + "step": 1810, + "valid_targets_mean": 1569.1, + "valid_targets_min": 738 + }, + { + "epoch": 1.9065126050420167, + "grad_norm": 0.7353501689368992, + "learning_rate": 3.649690129025675e-05, + "loss": 0.1986, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2081902176141739, + "step": 1815, + "valid_targets_mean": 1378.0, + "valid_targets_min": 731 + }, + { + "epoch": 1.9117647058823528, + "grad_norm": 0.7289002335110303, + "learning_rate": 3.6467227805411824e-05, + "loss": 0.1979, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21570971608161926, + "step": 1820, + "valid_targets_mean": 1620.0, + "valid_targets_min": 748 + }, + { + "epoch": 1.917016806722689, + "grad_norm": 0.7240815176489389, + "learning_rate": 3.6437441343082174e-05, + "loss": 0.1885, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18155962228775024, + "step": 1825, + "valid_targets_mean": 1355.1, + "valid_targets_min": 564 + }, + { + "epoch": 1.9222689075630253, + "grad_norm": 0.7462727456723074, + "learning_rate": 3.6407542107625167e-05, + "loss": 0.189, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18159963190555573, + "step": 1830, + "valid_targets_mean": 1419.1, + "valid_targets_min": 651 + }, + { + "epoch": 1.9275210084033614, + "grad_norm": 0.9386783714270683, + "learning_rate": 3.637753030417192e-05, + "loss": 0.2, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18306277692317963, + "step": 1835, + "valid_targets_mean": 1291.7, + "valid_targets_min": 687 + }, + { + "epoch": 1.9327731092436975, + "grad_norm": 0.725039331848806, + "learning_rate": 3.6347406138625805e-05, + "loss": 0.1896, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17465978860855103, + "step": 1840, + "valid_targets_mean": 1236.8, + "valid_targets_min": 703 + }, + { + "epoch": 1.9380252100840336, + "grad_norm": 0.7526079231589902, + "learning_rate": 3.631716981766111e-05, + "loss": 0.186, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16068580746650696, + "step": 1845, + "valid_targets_mean": 1258.9, + "valid_targets_min": 522 + }, + { + "epoch": 1.9432773109243697, + "grad_norm": 0.7599278884583646, + "learning_rate": 3.6286821548721594e-05, + "loss": 0.1901, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1918371468782425, + "step": 1850, + "valid_targets_mean": 1495.5, + "valid_targets_min": 764 + }, + { + "epoch": 1.9485294117647058, + "grad_norm": 0.7979519291571235, + "learning_rate": 3.625636154001904e-05, + "loss": 0.2073, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21574504673480988, + "step": 1855, + "valid_targets_mean": 1421.0, + "valid_targets_min": 548 + }, + { + "epoch": 1.9537815126050422, + "grad_norm": 0.7338015635554208, + "learning_rate": 3.622579000053186e-05, + "loss": 0.1853, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20440888404846191, + "step": 1860, + "valid_targets_mean": 1487.2, + "valid_targets_min": 694 + }, + { + "epoch": 1.9590336134453783, + "grad_norm": 0.7129631803753865, + "learning_rate": 3.619510714000368e-05, + "loss": 0.1916, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2010660171508789, + "step": 1865, + "valid_targets_mean": 1512.4, + "valid_targets_min": 823 + }, + { + "epoch": 1.9642857142857144, + "grad_norm": 0.6958574230399347, + "learning_rate": 3.616431316894181e-05, + "loss": 0.1671, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15293735265731812, + "step": 1870, + "valid_targets_mean": 1375.4, + "valid_targets_min": 595 + }, + { + "epoch": 1.9695378151260505, + "grad_norm": 0.8984376849635196, + "learning_rate": 3.613340829861592e-05, + "loss": 0.1902, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2001931369304657, + "step": 1875, + "valid_targets_mean": 1401.2, + "valid_targets_min": 693 + }, + { + "epoch": 1.9747899159663866, + "grad_norm": 0.796278651195792, + "learning_rate": 3.61023927410565e-05, + "loss": 0.1886, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18896615505218506, + "step": 1880, + "valid_targets_mean": 1185.6, + "valid_targets_min": 720 + }, + { + "epoch": 1.9800420168067228, + "grad_norm": 0.6919750871597347, + "learning_rate": 3.607126670905346e-05, + "loss": 0.1871, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16711284220218658, + "step": 1885, + "valid_targets_mean": 1364.2, + "valid_targets_min": 685 + }, + { + "epoch": 1.9852941176470589, + "grad_norm": 0.6805728110467865, + "learning_rate": 3.60400304161546e-05, + "loss": 0.1838, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17011727392673492, + "step": 1890, + "valid_targets_mean": 1345.2, + "valid_targets_min": 658 + }, + { + "epoch": 1.990546218487395, + "grad_norm": 0.7601178723938317, + "learning_rate": 3.600868407666426e-05, + "loss": 0.1895, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18218779563903809, + "step": 1895, + "valid_targets_mean": 1431.4, + "valid_targets_min": 686 + }, + { + "epoch": 1.995798319327731, + "grad_norm": 0.6963519557748621, + "learning_rate": 3.597722790564172e-05, + "loss": 0.1984, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19570836424827576, + "step": 1900, + "valid_targets_mean": 1505.8, + "valid_targets_min": 713 + }, + { + "epoch": 2.0010504201680672, + "grad_norm": 0.8543332754648679, + "learning_rate": 3.5945662118899824e-05, + "loss": 0.2233, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3345944881439209, + "step": 1905, + "valid_targets_mean": 2493.1, + "valid_targets_min": 954 + }, + { + "epoch": 2.0063025210084033, + "grad_norm": 0.6540945057835557, + "learning_rate": 3.5913986933003455e-05, + "loss": 0.3021, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2893906235694885, + "step": 1910, + "valid_targets_mean": 3336.9, + "valid_targets_min": 533 + }, + { + "epoch": 2.0115546218487395, + "grad_norm": 0.5859587843451456, + "learning_rate": 3.5882202565268046e-05, + "loss": 0.2897, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.30491194128990173, + "step": 1915, + "valid_targets_mean": 3515.8, + "valid_targets_min": 1635 + }, + { + "epoch": 2.0168067226890756, + "grad_norm": 0.5848592413314749, + "learning_rate": 3.58503092337581e-05, + "loss": 0.2927, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3176591992378235, + "step": 1920, + "valid_targets_mean": 3744.6, + "valid_targets_min": 777 + }, + { + "epoch": 2.0220588235294117, + "grad_norm": 0.5277378066045798, + "learning_rate": 3.5818307157285705e-05, + "loss": 0.2788, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2889269292354584, + "step": 1925, + "valid_targets_mean": 4188.5, + "valid_targets_min": 2187 + }, + { + "epoch": 2.027310924369748, + "grad_norm": 0.6598583479222365, + "learning_rate": 3.5786196555409006e-05, + "loss": 0.2979, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.30424559116363525, + "step": 1930, + "valid_targets_mean": 3188.1, + "valid_targets_min": 1432 + }, + { + "epoch": 2.032563025210084, + "grad_norm": 0.6035540307689007, + "learning_rate": 3.575397764843073e-05, + "loss": 0.2808, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2632938027381897, + "step": 1935, + "valid_targets_mean": 3703.5, + "valid_targets_min": 767 + }, + { + "epoch": 2.03781512605042, + "grad_norm": 0.6545986679555346, + "learning_rate": 3.572165065739664e-05, + "loss": 0.2807, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2869631052017212, + "step": 1940, + "valid_targets_mean": 3793.3, + "valid_targets_min": 1488 + }, + { + "epoch": 2.043067226890756, + "grad_norm": 0.5266355858459322, + "learning_rate": 3.5689215804094053e-05, + "loss": 0.2847, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2697930932044983, + "step": 1945, + "valid_targets_mean": 3814.2, + "valid_targets_min": 578 + }, + { + "epoch": 2.0483193277310923, + "grad_norm": 0.5529414922643042, + "learning_rate": 3.5656673311050285e-05, + "loss": 0.3058, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.298675537109375, + "step": 1950, + "valid_targets_mean": 3997.1, + "valid_targets_min": 1241 + }, + { + "epoch": 2.0535714285714284, + "grad_norm": 0.5889438843034916, + "learning_rate": 3.562402340153115e-05, + "loss": 0.2915, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3097384572029114, + "step": 1955, + "valid_targets_mean": 3797.0, + "valid_targets_min": 807 + }, + { + "epoch": 2.0588235294117645, + "grad_norm": 0.4888383801769635, + "learning_rate": 3.559126629953942e-05, + "loss": 0.2944, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2800885736942291, + "step": 1960, + "valid_targets_mean": 5091.3, + "valid_targets_min": 2061 + }, + { + "epoch": 2.064075630252101, + "grad_norm": 0.5549566154812772, + "learning_rate": 3.5558402229813287e-05, + "loss": 0.2964, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.28934812545776367, + "step": 1965, + "valid_targets_mean": 4230.9, + "valid_targets_min": 1329 + }, + { + "epoch": 2.069327731092437, + "grad_norm": 0.5836584192752005, + "learning_rate": 3.552543141782483e-05, + "loss": 0.2831, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2896938621997833, + "step": 1970, + "valid_targets_mean": 3577.5, + "valid_targets_min": 1412 + }, + { + "epoch": 2.0745798319327733, + "grad_norm": 0.6187434500702056, + "learning_rate": 3.549235408977843e-05, + "loss": 0.2955, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2899538576602936, + "step": 1975, + "valid_targets_mean": 3247.0, + "valid_targets_min": 1334 + }, + { + "epoch": 2.0798319327731094, + "grad_norm": 0.5443173852803067, + "learning_rate": 3.545917047260928e-05, + "loss": 0.3036, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27411580085754395, + "step": 1980, + "valid_targets_mean": 4207.9, + "valid_targets_min": 1847 + }, + { + "epoch": 2.0850840336134455, + "grad_norm": 0.6049544183292745, + "learning_rate": 3.542588079398179e-05, + "loss": 0.2962, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2940400540828705, + "step": 1985, + "valid_targets_mean": 3505.8, + "valid_targets_min": 1040 + }, + { + "epoch": 2.0903361344537816, + "grad_norm": 0.6603766972468182, + "learning_rate": 3.539248528228801e-05, + "loss": 0.3076, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3235289454460144, + "step": 1990, + "valid_targets_mean": 3247.1, + "valid_targets_min": 1269 + }, + { + "epoch": 2.0955882352941178, + "grad_norm": 0.6507849332876462, + "learning_rate": 3.535898416664611e-05, + "loss": 0.304, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.29736390709877014, + "step": 1995, + "valid_targets_mean": 2779.6, + "valid_targets_min": 1041 + }, + { + "epoch": 2.100840336134454, + "grad_norm": 0.6263414769134444, + "learning_rate": 3.5325377676898766e-05, + "loss": 0.2963, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.30523204803466797, + "step": 2000, + "valid_targets_mean": 2963.0, + "valid_targets_min": 1291 + }, + { + "epoch": 2.10609243697479, + "grad_norm": 0.7168587293071478, + "learning_rate": 3.529166604361161e-05, + "loss": 0.2933, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3294321298599243, + "step": 2005, + "valid_targets_mean": 2588.5, + "valid_targets_min": 1285 + }, + { + "epoch": 2.111344537815126, + "grad_norm": 0.7408150111837036, + "learning_rate": 3.525784949807162e-05, + "loss": 0.2856, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.28167465329170227, + "step": 2010, + "valid_targets_mean": 3554.5, + "valid_targets_min": 865 + }, + { + "epoch": 2.116596638655462, + "grad_norm": 0.6431903275157029, + "learning_rate": 3.522392827228557e-05, + "loss": 0.2898, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2769734561443329, + "step": 2015, + "valid_targets_mean": 2872.8, + "valid_targets_min": 958 + }, + { + "epoch": 2.1218487394957983, + "grad_norm": 0.6159459227356286, + "learning_rate": 3.518990259897841e-05, + "loss": 0.2991, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.30407899618148804, + "step": 2020, + "valid_targets_mean": 3317.6, + "valid_targets_min": 771 + }, + { + "epoch": 2.1271008403361344, + "grad_norm": 0.5523195230692622, + "learning_rate": 3.515577271159167e-05, + "loss": 0.2962, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2792849838733673, + "step": 2025, + "valid_targets_mean": 3849.6, + "valid_targets_min": 1631 + }, + { + "epoch": 2.1323529411764706, + "grad_norm": 0.5889011467855694, + "learning_rate": 3.512153884428188e-05, + "loss": 0.2929, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2551637589931488, + "step": 2030, + "valid_targets_mean": 3065.6, + "valid_targets_min": 908 + }, + { + "epoch": 2.1376050420168067, + "grad_norm": 0.6584415672877822, + "learning_rate": 3.5087201231918944e-05, + "loss": 0.2884, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2937019467353821, + "step": 2035, + "valid_targets_mean": 2962.0, + "valid_targets_min": 1264 + }, + { + "epoch": 2.142857142857143, + "grad_norm": 0.5843888599963277, + "learning_rate": 3.505276011008454e-05, + "loss": 0.2907, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.29179146885871887, + "step": 2040, + "valid_targets_mean": 3853.1, + "valid_targets_min": 1889 + }, + { + "epoch": 2.148109243697479, + "grad_norm": 0.6018556070826566, + "learning_rate": 3.501821571507048e-05, + "loss": 0.2867, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27817726135253906, + "step": 2045, + "valid_targets_mean": 3645.2, + "valid_targets_min": 1075 + }, + { + "epoch": 2.153361344537815, + "grad_norm": 0.7369039817083102, + "learning_rate": 3.498356828387714e-05, + "loss": 0.2908, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.28218644857406616, + "step": 2050, + "valid_targets_mean": 2874.9, + "valid_targets_min": 1036 + }, + { + "epoch": 2.158613445378151, + "grad_norm": 0.5740508320378505, + "learning_rate": 3.494881805421176e-05, + "loss": 0.2923, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2825021743774414, + "step": 2055, + "valid_targets_mean": 3808.9, + "valid_targets_min": 1162 + }, + { + "epoch": 2.1638655462184873, + "grad_norm": 0.6677586403458295, + "learning_rate": 3.4913965264486894e-05, + "loss": 0.2876, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2949675917625427, + "step": 2060, + "valid_targets_mean": 3164.9, + "valid_targets_min": 1281 + }, + { + "epoch": 2.1691176470588234, + "grad_norm": 0.583170841394605, + "learning_rate": 3.48790101538187e-05, + "loss": 0.284, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2632118761539459, + "step": 2065, + "valid_targets_mean": 3503.5, + "valid_targets_min": 1841 + }, + { + "epoch": 2.1743697478991595, + "grad_norm": 0.6659128870236808, + "learning_rate": 3.484395296202537e-05, + "loss": 0.3006, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.30187827348709106, + "step": 2070, + "valid_targets_mean": 3121.7, + "valid_targets_min": 1629 + }, + { + "epoch": 2.1796218487394956, + "grad_norm": 0.7188591131831868, + "learning_rate": 3.480879392962541e-05, + "loss": 0.2885, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2901453971862793, + "step": 2075, + "valid_targets_mean": 2668.6, + "valid_targets_min": 1254 + }, + { + "epoch": 2.184873949579832, + "grad_norm": 0.7182569920584896, + "learning_rate": 3.477353329783606e-05, + "loss": 0.2927, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.30515027046203613, + "step": 2080, + "valid_targets_mean": 3032.6, + "valid_targets_min": 1774 + }, + { + "epoch": 2.190126050420168, + "grad_norm": 0.678604840038963, + "learning_rate": 3.4738171308571595e-05, + "loss": 0.2928, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2986491322517395, + "step": 2085, + "valid_targets_mean": 3079.8, + "valid_targets_min": 1643 + }, + { + "epoch": 2.1953781512605044, + "grad_norm": 0.6392734138959271, + "learning_rate": 3.470270820444168e-05, + "loss": 0.2875, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3071242570877075, + "step": 2090, + "valid_targets_mean": 3021.6, + "valid_targets_min": 1244 + }, + { + "epoch": 2.2006302521008405, + "grad_norm": 0.585164572193224, + "learning_rate": 3.4667144228749697e-05, + "loss": 0.2878, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2744428515434265, + "step": 2095, + "valid_targets_mean": 3588.4, + "valid_targets_min": 959 + }, + { + "epoch": 2.2058823529411766, + "grad_norm": 0.5843477775486158, + "learning_rate": 3.463147962549109e-05, + "loss": 0.2826, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2655976414680481, + "step": 2100, + "valid_targets_mean": 3404.8, + "valid_targets_min": 2037 + }, + { + "epoch": 2.2111344537815127, + "grad_norm": 0.5703037332493616, + "learning_rate": 3.459571463935168e-05, + "loss": 0.2817, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2898704409599304, + "step": 2105, + "valid_targets_mean": 3745.2, + "valid_targets_min": 1168 + }, + { + "epoch": 2.216386554621849, + "grad_norm": 0.6261977462323101, + "learning_rate": 3.455984951570598e-05, + "loss": 0.2819, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2655256390571594, + "step": 2110, + "valid_targets_mean": 3479.8, + "valid_targets_min": 1700 + }, + { + "epoch": 2.221638655462185, + "grad_norm": 0.6273371865248328, + "learning_rate": 3.452388450061556e-05, + "loss": 0.2832, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25678104162216187, + "step": 2115, + "valid_targets_mean": 2905.8, + "valid_targets_min": 1261 + }, + { + "epoch": 2.226890756302521, + "grad_norm": 0.6154152263889715, + "learning_rate": 3.448781984082727e-05, + "loss": 0.2983, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2871716022491455, + "step": 2120, + "valid_targets_mean": 3363.2, + "valid_targets_min": 1124 + }, + { + "epoch": 2.232142857142857, + "grad_norm": 0.6237253157214722, + "learning_rate": 3.4451655783771625e-05, + "loss": 0.2874, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2972951829433441, + "step": 2125, + "valid_targets_mean": 3210.6, + "valid_targets_min": 1361 + }, + { + "epoch": 2.2373949579831933, + "grad_norm": 0.5944182232171416, + "learning_rate": 3.4415392577561064e-05, + "loss": 0.2727, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.26949986815452576, + "step": 2130, + "valid_targets_mean": 2948.4, + "valid_targets_min": 1555 + }, + { + "epoch": 2.2426470588235294, + "grad_norm": 0.6239663761256676, + "learning_rate": 3.4379030470988285e-05, + "loss": 0.2888, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.31491410732269287, + "step": 2135, + "valid_targets_mean": 3311.2, + "valid_targets_min": 1739 + }, + { + "epoch": 2.2478991596638656, + "grad_norm": 0.6358976127732551, + "learning_rate": 3.4342569713524496e-05, + "loss": 0.278, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2920129895210266, + "step": 2140, + "valid_targets_mean": 3192.8, + "valid_targets_min": 1278 + }, + { + "epoch": 2.2531512605042017, + "grad_norm": 0.534574837437247, + "learning_rate": 3.4306010555317735e-05, + "loss": 0.2728, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2571936249732971, + "step": 2145, + "valid_targets_mean": 3951.6, + "valid_targets_min": 1522 + }, + { + "epoch": 2.258403361344538, + "grad_norm": 0.6364635502715449, + "learning_rate": 3.4269353247191135e-05, + "loss": 0.2662, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.28747859597206116, + "step": 2150, + "valid_targets_mean": 3641.8, + "valid_targets_min": 464 + }, + { + "epoch": 2.263655462184874, + "grad_norm": 0.5854458561363409, + "learning_rate": 3.423259804064122e-05, + "loss": 0.2933, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2922632098197937, + "step": 2155, + "valid_targets_mean": 3598.4, + "valid_targets_min": 1003 + }, + { + "epoch": 2.26890756302521, + "grad_norm": 0.6600515244262581, + "learning_rate": 3.419574518783616e-05, + "loss": 0.2741, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2910274267196655, + "step": 2160, + "valid_targets_mean": 3158.1, + "valid_targets_min": 1632 + }, + { + "epoch": 2.274159663865546, + "grad_norm": 0.6099216472379927, + "learning_rate": 3.4158794941614055e-05, + "loss": 0.2822, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2801975905895233, + "step": 2165, + "valid_targets_mean": 3131.9, + "valid_targets_min": 1256 + }, + { + "epoch": 2.2794117647058822, + "grad_norm": 0.6173217093072781, + "learning_rate": 3.4121747555481216e-05, + "loss": 0.2932, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2909969091415405, + "step": 2170, + "valid_targets_mean": 3894.9, + "valid_targets_min": 1336 + }, + { + "epoch": 2.2846638655462184, + "grad_norm": 0.5395127043883584, + "learning_rate": 3.4084603283610365e-05, + "loss": 0.2944, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2728331685066223, + "step": 2175, + "valid_targets_mean": 4360.4, + "valid_targets_min": 1651 + }, + { + "epoch": 2.2899159663865545, + "grad_norm": 0.6332732127944597, + "learning_rate": 3.404736238083897e-05, + "loss": 0.2742, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2798515558242798, + "step": 2180, + "valid_targets_mean": 2921.1, + "valid_targets_min": 644 + }, + { + "epoch": 2.2951680672268906, + "grad_norm": 0.7961507640330674, + "learning_rate": 3.401002510266744e-05, + "loss": 0.2707, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.26711398363113403, + "step": 2185, + "valid_targets_mean": 2848.1, + "valid_targets_min": 1397 + }, + { + "epoch": 2.3004201680672267, + "grad_norm": 0.6593038634993043, + "learning_rate": 3.397259170525739e-05, + "loss": 0.2726, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.28789085149765015, + "step": 2190, + "valid_targets_mean": 2673.2, + "valid_targets_min": 1557 + }, + { + "epoch": 2.3056722689075633, + "grad_norm": 0.6958476283104791, + "learning_rate": 3.393506244542991e-05, + "loss": 0.2786, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.292041540145874, + "step": 2195, + "valid_targets_mean": 2930.8, + "valid_targets_min": 1405 + }, + { + "epoch": 2.310924369747899, + "grad_norm": 0.6218694808083172, + "learning_rate": 3.389743758066374e-05, + "loss": 0.2754, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2553059458732605, + "step": 2200, + "valid_targets_mean": 3421.8, + "valid_targets_min": 1042 + }, + { + "epoch": 2.3161764705882355, + "grad_norm": 0.6961575232099882, + "learning_rate": 3.385971736909357e-05, + "loss": 0.2664, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27729037404060364, + "step": 2205, + "valid_targets_mean": 3172.2, + "valid_targets_min": 858 + }, + { + "epoch": 2.3214285714285716, + "grad_norm": 0.6655059432652326, + "learning_rate": 3.382190206950822e-05, + "loss": 0.2769, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27774959802627563, + "step": 2210, + "valid_targets_mean": 3166.3, + "valid_targets_min": 1288 + }, + { + "epoch": 2.3266806722689077, + "grad_norm": 0.5920405087936736, + "learning_rate": 3.3783991941348916e-05, + "loss": 0.2892, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2696320414543152, + "step": 2215, + "valid_targets_mean": 3645.1, + "valid_targets_min": 1915 + }, + { + "epoch": 2.331932773109244, + "grad_norm": 0.6019837190284246, + "learning_rate": 3.374598724470745e-05, + "loss": 0.282, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2848033010959625, + "step": 2220, + "valid_targets_mean": 3868.2, + "valid_targets_min": 1501 + }, + { + "epoch": 2.33718487394958, + "grad_norm": 0.6419175889567692, + "learning_rate": 3.370788824032441e-05, + "loss": 0.2706, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27997952699661255, + "step": 2225, + "valid_targets_mean": 2992.5, + "valid_targets_min": 1255 + }, + { + "epoch": 2.342436974789916, + "grad_norm": 0.6429288935922298, + "learning_rate": 3.366969518958746e-05, + "loss": 0.2797, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.29206526279449463, + "step": 2230, + "valid_targets_mean": 3205.4, + "valid_targets_min": 1586 + }, + { + "epoch": 2.347689075630252, + "grad_norm": 0.5926026217237049, + "learning_rate": 3.363140835452945e-05, + "loss": 0.2777, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2542131543159485, + "step": 2235, + "valid_targets_mean": 3410.4, + "valid_targets_min": 1181 + }, + { + "epoch": 2.3529411764705883, + "grad_norm": 0.6805026667731596, + "learning_rate": 3.3593027997826654e-05, + "loss": 0.2666, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.26993298530578613, + "step": 2240, + "valid_targets_mean": 2876.6, + "valid_targets_min": 1428 + }, + { + "epoch": 2.3581932773109244, + "grad_norm": 0.6149224206718514, + "learning_rate": 3.355455438279702e-05, + "loss": 0.2674, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27489912509918213, + "step": 2245, + "valid_targets_mean": 3850.8, + "valid_targets_min": 1708 + }, + { + "epoch": 2.3634453781512605, + "grad_norm": 0.7148223911895215, + "learning_rate": 3.351598777339827e-05, + "loss": 0.2817, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.31252795457839966, + "step": 2250, + "valid_targets_mean": 3311.1, + "valid_targets_min": 1171 + }, + { + "epoch": 2.3686974789915967, + "grad_norm": 0.6343777416548871, + "learning_rate": 3.3477328434226164e-05, + "loss": 0.2884, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2894600033760071, + "step": 2255, + "valid_targets_mean": 3490.8, + "valid_targets_min": 1834 + }, + { + "epoch": 2.3739495798319328, + "grad_norm": 0.5713389821309428, + "learning_rate": 3.343857663051264e-05, + "loss": 0.2728, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.28061312437057495, + "step": 2260, + "valid_targets_mean": 4200.2, + "valid_targets_min": 1529 + }, + { + "epoch": 2.379201680672269, + "grad_norm": 0.6593813910051031, + "learning_rate": 3.339973262812403e-05, + "loss": 0.2949, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.28659868240356445, + "step": 2265, + "valid_targets_mean": 3408.4, + "valid_targets_min": 845 + }, + { + "epoch": 2.384453781512605, + "grad_norm": 0.5688545517719381, + "learning_rate": 3.336079669355921e-05, + "loss": 0.2671, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2584436535835266, + "step": 2270, + "valid_targets_mean": 3692.9, + "valid_targets_min": 2113 + }, + { + "epoch": 2.389705882352941, + "grad_norm": 0.6802358237019724, + "learning_rate": 3.332176909394777e-05, + "loss": 0.2938, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3029017448425293, + "step": 2275, + "valid_targets_mean": 2837.8, + "valid_targets_min": 802 + }, + { + "epoch": 2.3949579831932772, + "grad_norm": 0.6451243325404382, + "learning_rate": 3.3282650097048206e-05, + "loss": 0.2884, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.26884186267852783, + "step": 2280, + "valid_targets_mean": 3303.2, + "valid_targets_min": 1433 + }, + { + "epoch": 2.4002100840336134, + "grad_norm": 0.7202674984435038, + "learning_rate": 3.324343997124606e-05, + "loss": 0.2868, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3011503219604492, + "step": 2285, + "valid_targets_mean": 3398.4, + "valid_targets_min": 1035 + }, + { + "epoch": 2.4054621848739495, + "grad_norm": 0.6862578318316971, + "learning_rate": 3.3204138985552094e-05, + "loss": 0.281, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.28322312235832214, + "step": 2290, + "valid_targets_mean": 2917.6, + "valid_targets_min": 637 + }, + { + "epoch": 2.4107142857142856, + "grad_norm": 0.6876766550885656, + "learning_rate": 3.316474740960041e-05, + "loss": 0.2872, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2967104911804199, + "step": 2295, + "valid_targets_mean": 3035.1, + "valid_targets_min": 814 + }, + { + "epoch": 2.4159663865546217, + "grad_norm": 0.603593965602333, + "learning_rate": 3.312526551364667e-05, + "loss": 0.2821, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.26389676332473755, + "step": 2300, + "valid_targets_mean": 3494.5, + "valid_targets_min": 1913 + }, + { + "epoch": 2.421218487394958, + "grad_norm": 0.6258585295206295, + "learning_rate": 3.308569356856616e-05, + "loss": 0.2672, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2644697427749634, + "step": 2305, + "valid_targets_mean": 3577.7, + "valid_targets_min": 1410 + }, + { + "epoch": 2.426470588235294, + "grad_norm": 0.6298839340403605, + "learning_rate": 3.3046031845851993e-05, + "loss": 0.2848, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.26435354351997375, + "step": 2310, + "valid_targets_mean": 3195.6, + "valid_targets_min": 1390 + }, + { + "epoch": 2.43172268907563, + "grad_norm": 0.6686960769778729, + "learning_rate": 3.3006280617613214e-05, + "loss": 0.2852, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.333891898393631, + "step": 2315, + "valid_targets_mean": 3242.2, + "valid_targets_min": 611 + }, + { + "epoch": 2.4369747899159666, + "grad_norm": 0.6994882884638276, + "learning_rate": 3.296644015657295e-05, + "loss": 0.28, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.29009950160980225, + "step": 2320, + "valid_targets_mean": 3322.3, + "valid_targets_min": 1451 + }, + { + "epoch": 2.4422268907563023, + "grad_norm": 0.6022542746468339, + "learning_rate": 3.292651073606652e-05, + "loss": 0.2766, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24634996056556702, + "step": 2325, + "valid_targets_mean": 3026.8, + "valid_targets_min": 1459 + }, + { + "epoch": 2.447478991596639, + "grad_norm": 0.7597076620942451, + "learning_rate": 3.288649263003958e-05, + "loss": 0.2712, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.30025792121887207, + "step": 2330, + "valid_targets_mean": 2535.8, + "valid_targets_min": 999 + }, + { + "epoch": 2.452731092436975, + "grad_norm": 0.5901929232154103, + "learning_rate": 3.284638611304623e-05, + "loss": 0.2667, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24954357743263245, + "step": 2335, + "valid_targets_mean": 3463.1, + "valid_targets_min": 1564 + }, + { + "epoch": 2.457983193277311, + "grad_norm": 0.6305958469820415, + "learning_rate": 3.280619146024714e-05, + "loss": 0.2732, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2825808525085449, + "step": 2340, + "valid_targets_mean": 3291.3, + "valid_targets_min": 1470 + }, + { + "epoch": 2.463235294117647, + "grad_norm": 0.6407328134623678, + "learning_rate": 3.2765908947407665e-05, + "loss": 0.2567, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.26442772150039673, + "step": 2345, + "valid_targets_mean": 3654.3, + "valid_targets_min": 1935 + }, + { + "epoch": 2.4684873949579833, + "grad_norm": 0.6192241477472046, + "learning_rate": 3.2725538850895933e-05, + "loss": 0.2602, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25553327798843384, + "step": 2350, + "valid_targets_mean": 3334.8, + "valid_targets_min": 1375 + }, + { + "epoch": 2.4737394957983194, + "grad_norm": 0.5958070120631284, + "learning_rate": 3.268508144768096e-05, + "loss": 0.2704, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25967782735824585, + "step": 2355, + "valid_targets_mean": 3422.6, + "valid_targets_min": 1294 + }, + { + "epoch": 2.4789915966386555, + "grad_norm": 0.5693719485778825, + "learning_rate": 3.264453701533075e-05, + "loss": 0.2583, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25220775604248047, + "step": 2360, + "valid_targets_mean": 3406.5, + "valid_targets_min": 1496 + }, + { + "epoch": 2.4842436974789917, + "grad_norm": 0.6509477999261548, + "learning_rate": 3.260390583201041e-05, + "loss": 0.2596, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27943873405456543, + "step": 2365, + "valid_targets_mean": 3359.4, + "valid_targets_min": 1333 + }, + { + "epoch": 2.4894957983193278, + "grad_norm": 0.6327828789713742, + "learning_rate": 3.2563188176480217e-05, + "loss": 0.2618, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27448466420173645, + "step": 2370, + "valid_targets_mean": 3461.3, + "valid_targets_min": 2264 + }, + { + "epoch": 2.494747899159664, + "grad_norm": 0.6536523986307107, + "learning_rate": 3.252238432809368e-05, + "loss": 0.2801, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2812950015068054, + "step": 2375, + "valid_targets_mean": 3145.4, + "valid_targets_min": 1454 + }, + { + "epoch": 2.5, + "grad_norm": 0.6139150491194192, + "learning_rate": 3.2481494566795716e-05, + "loss": 0.2761, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27129268646240234, + "step": 2380, + "valid_targets_mean": 3347.1, + "valid_targets_min": 1712 + }, + { + "epoch": 2.505252100840336, + "grad_norm": 0.6255364740679421, + "learning_rate": 3.244051917312061e-05, + "loss": 0.2653, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2420213669538498, + "step": 2385, + "valid_targets_mean": 3450.1, + "valid_targets_min": 1433 + }, + { + "epoch": 2.5105042016806722, + "grad_norm": 0.5931305720132205, + "learning_rate": 3.239945842819018e-05, + "loss": 0.2664, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2606050372123718, + "step": 2390, + "valid_targets_mean": 3711.4, + "valid_targets_min": 1943 + }, + { + "epoch": 2.5157563025210083, + "grad_norm": 0.5818743103427734, + "learning_rate": 3.2358312613711804e-05, + "loss": 0.2649, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24495342373847961, + "step": 2395, + "valid_targets_mean": 3649.8, + "valid_targets_min": 1945 + }, + { + "epoch": 2.5210084033613445, + "grad_norm": 0.6430898542162261, + "learning_rate": 3.231708201197653e-05, + "loss": 0.2809, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2672806978225708, + "step": 2400, + "valid_targets_mean": 2710.3, + "valid_targets_min": 815 + }, + { + "epoch": 2.5262605042016806, + "grad_norm": 0.6238779450079466, + "learning_rate": 3.227576690585706e-05, + "loss": 0.2769, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.29193007946014404, + "step": 2405, + "valid_targets_mean": 3416.9, + "valid_targets_min": 809 + }, + { + "epoch": 2.5315126050420167, + "grad_norm": 0.5995241914800916, + "learning_rate": 3.223436757880591e-05, + "loss": 0.2674, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2675004005432129, + "step": 2410, + "valid_targets_mean": 3632.6, + "valid_targets_min": 1727 + }, + { + "epoch": 2.536764705882353, + "grad_norm": 0.6158294085854414, + "learning_rate": 3.219288431485337e-05, + "loss": 0.2642, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2477218508720398, + "step": 2415, + "valid_targets_mean": 2918.1, + "valid_targets_min": 1622 + }, + { + "epoch": 2.542016806722689, + "grad_norm": 0.8470134075805191, + "learning_rate": 3.2151317398605646e-05, + "loss": 0.2375, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1993420273065567, + "step": 2420, + "valid_targets_mean": 1337.4, + "valid_targets_min": 788 + }, + { + "epoch": 2.5472689075630255, + "grad_norm": 0.7459112191461049, + "learning_rate": 3.2109667115242815e-05, + "loss": 0.1872, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18858204782009125, + "step": 2425, + "valid_targets_mean": 1537.9, + "valid_targets_min": 957 + }, + { + "epoch": 2.552521008403361, + "grad_norm": 0.764955976635607, + "learning_rate": 3.206793375051694e-05, + "loss": 0.1806, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17688506841659546, + "step": 2430, + "valid_targets_mean": 1386.6, + "valid_targets_min": 796 + }, + { + "epoch": 2.5577731092436977, + "grad_norm": 0.9461176823521338, + "learning_rate": 3.2026117590750086e-05, + "loss": 0.1832, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18542060256004333, + "step": 2435, + "valid_targets_mean": 1313.4, + "valid_targets_min": 697 + }, + { + "epoch": 2.5630252100840334, + "grad_norm": 0.7925028804553308, + "learning_rate": 3.198421892283235e-05, + "loss": 0.1811, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18615254759788513, + "step": 2440, + "valid_targets_mean": 1576.1, + "valid_targets_min": 638 + }, + { + "epoch": 2.56827731092437, + "grad_norm": 0.7519556440109215, + "learning_rate": 3.1942238034219885e-05, + "loss": 0.1794, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18748995661735535, + "step": 2445, + "valid_targets_mean": 1508.0, + "valid_targets_min": 727 + }, + { + "epoch": 2.5735294117647056, + "grad_norm": 0.7720688633693402, + "learning_rate": 3.190017521293296e-05, + "loss": 0.1859, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16558489203453064, + "step": 2450, + "valid_targets_mean": 1276.2, + "valid_targets_min": 761 + }, + { + "epoch": 2.578781512605042, + "grad_norm": 0.8326618926243746, + "learning_rate": 3.185803074755395e-05, + "loss": 0.17, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1751636564731598, + "step": 2455, + "valid_targets_mean": 1297.8, + "valid_targets_min": 714 + }, + { + "epoch": 2.5840336134453783, + "grad_norm": 0.7347796399611563, + "learning_rate": 3.1815804927225363e-05, + "loss": 0.1901, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1736968755722046, + "step": 2460, + "valid_targets_mean": 1447.1, + "valid_targets_min": 741 + }, + { + "epoch": 2.5892857142857144, + "grad_norm": 0.7982508928947285, + "learning_rate": 3.1773498041647876e-05, + "loss": 0.1796, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20142167806625366, + "step": 2465, + "valid_targets_mean": 1720.9, + "valid_targets_min": 663 + }, + { + "epoch": 2.5945378151260505, + "grad_norm": 0.7855892482872033, + "learning_rate": 3.173111038107834e-05, + "loss": 0.1727, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18200182914733887, + "step": 2470, + "valid_targets_mean": 1435.6, + "valid_targets_min": 632 + }, + { + "epoch": 2.5997899159663866, + "grad_norm": 0.7759266996305735, + "learning_rate": 3.168864223632776e-05, + "loss": 0.1783, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17558130621910095, + "step": 2475, + "valid_targets_mean": 1619.9, + "valid_targets_min": 933 + }, + { + "epoch": 2.6050420168067228, + "grad_norm": 0.6783776091632051, + "learning_rate": 3.1646093898759334e-05, + "loss": 0.1783, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16645342111587524, + "step": 2480, + "valid_targets_mean": 1491.7, + "valid_targets_min": 717 + }, + { + "epoch": 2.610294117647059, + "grad_norm": 0.7711910637914073, + "learning_rate": 3.160346566028645e-05, + "loss": 0.1673, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16639794409275055, + "step": 2485, + "valid_targets_mean": 1278.4, + "valid_targets_min": 659 + }, + { + "epoch": 2.615546218487395, + "grad_norm": 0.7139740512846204, + "learning_rate": 3.156075781337068e-05, + "loss": 0.1657, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15931686758995056, + "step": 2490, + "valid_targets_mean": 1346.2, + "valid_targets_min": 642 + }, + { + "epoch": 2.620798319327731, + "grad_norm": 0.7301516156278756, + "learning_rate": 3.1517970651019735e-05, + "loss": 0.1709, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1589939445257187, + "step": 2495, + "valid_targets_mean": 1324.8, + "valid_targets_min": 765 + }, + { + "epoch": 2.6260504201680672, + "grad_norm": 0.8269901402636304, + "learning_rate": 3.1475104466785536e-05, + "loss": 0.1823, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1824565976858139, + "step": 2500, + "valid_targets_mean": 1293.7, + "valid_targets_min": 631 + }, + { + "epoch": 2.6313025210084033, + "grad_norm": 0.8200023743718566, + "learning_rate": 3.143215955476211e-05, + "loss": 0.1829, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19661253690719604, + "step": 2505, + "valid_targets_mean": 1490.3, + "valid_targets_min": 623 + }, + { + "epoch": 2.6365546218487395, + "grad_norm": 0.7270060792013762, + "learning_rate": 3.138913620958365e-05, + "loss": 0.1796, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1958092451095581, + "step": 2510, + "valid_targets_mean": 1748.8, + "valid_targets_min": 818 + }, + { + "epoch": 2.6418067226890756, + "grad_norm": 0.728759015109214, + "learning_rate": 3.134603472642244e-05, + "loss": 0.1742, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16739603877067566, + "step": 2515, + "valid_targets_mean": 1434.9, + "valid_targets_min": 776 + }, + { + "epoch": 2.6470588235294117, + "grad_norm": 0.8025983924576464, + "learning_rate": 3.1302855400986866e-05, + "loss": 0.1765, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17958450317382812, + "step": 2520, + "valid_targets_mean": 1402.4, + "valid_targets_min": 623 + }, + { + "epoch": 2.652310924369748, + "grad_norm": 0.7842835266150214, + "learning_rate": 3.1259598529519336e-05, + "loss": 0.1771, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18177050352096558, + "step": 2525, + "valid_targets_mean": 1400.9, + "valid_targets_min": 693 + }, + { + "epoch": 2.657563025210084, + "grad_norm": 0.7753249562445936, + "learning_rate": 3.121626440879432e-05, + "loss": 0.1705, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1475217640399933, + "step": 2530, + "valid_targets_mean": 1109.4, + "valid_targets_min": 611 + }, + { + "epoch": 2.66281512605042, + "grad_norm": 0.7722564104049819, + "learning_rate": 3.117285333611625e-05, + "loss": 0.1691, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18021240830421448, + "step": 2535, + "valid_targets_mean": 1552.2, + "valid_targets_min": 793 + }, + { + "epoch": 2.668067226890756, + "grad_norm": 0.8324884710244702, + "learning_rate": 3.112936560931752e-05, + "loss": 0.1678, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1621646136045456, + "step": 2540, + "valid_targets_mean": 1393.4, + "valid_targets_min": 563 + }, + { + "epoch": 2.6733193277310923, + "grad_norm": 0.745079772832585, + "learning_rate": 3.108580152675642e-05, + "loss": 0.1715, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16466446220874786, + "step": 2545, + "valid_targets_mean": 1476.5, + "valid_targets_min": 837 + }, + { + "epoch": 2.678571428571429, + "grad_norm": 0.7667224190162166, + "learning_rate": 3.104216138731511e-05, + "loss": 0.1689, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17364142835140228, + "step": 2550, + "valid_targets_mean": 1660.7, + "valid_targets_min": 1107 + }, + { + "epoch": 2.6838235294117645, + "grad_norm": 0.8705202254035619, + "learning_rate": 3.0998445490397546e-05, + "loss": 0.1821, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17687436938285828, + "step": 2555, + "valid_targets_mean": 1498.9, + "valid_targets_min": 680 + }, + { + "epoch": 2.689075630252101, + "grad_norm": 0.7422198641689959, + "learning_rate": 3.095465413592743e-05, + "loss": 0.1637, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1798504889011383, + "step": 2560, + "valid_targets_mean": 1571.8, + "valid_targets_min": 803 + }, + { + "epoch": 2.6943277310924367, + "grad_norm": 0.8053104805546935, + "learning_rate": 3.091078762434616e-05, + "loss": 0.1717, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.175202876329422, + "step": 2565, + "valid_targets_mean": 1496.6, + "valid_targets_min": 631 + }, + { + "epoch": 2.6995798319327733, + "grad_norm": 0.7483069663873031, + "learning_rate": 3.086684625661081e-05, + "loss": 0.1719, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16679367423057556, + "step": 2570, + "valid_targets_mean": 1476.0, + "valid_targets_min": 804 + }, + { + "epoch": 2.7048319327731094, + "grad_norm": 0.7649264183537576, + "learning_rate": 3.082283033419197e-05, + "loss": 0.1764, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16266639530658722, + "step": 2575, + "valid_targets_mean": 1448.8, + "valid_targets_min": 675 + }, + { + "epoch": 2.7100840336134455, + "grad_norm": 0.7515149499265241, + "learning_rate": 3.077874015907174e-05, + "loss": 0.1657, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18091100454330444, + "step": 2580, + "valid_targets_mean": 1305.0, + "valid_targets_min": 856 + }, + { + "epoch": 2.7153361344537816, + "grad_norm": 0.7377534312107921, + "learning_rate": 3.073457603374167e-05, + "loss": 0.1655, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1628911793231964, + "step": 2585, + "valid_targets_mean": 1487.6, + "valid_targets_min": 715 + }, + { + "epoch": 2.7205882352941178, + "grad_norm": 0.7717568619128692, + "learning_rate": 3.069033826120066e-05, + "loss": 0.1615, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1856994479894638, + "step": 2590, + "valid_targets_mean": 1619.1, + "valid_targets_min": 678 + }, + { + "epoch": 2.725840336134454, + "grad_norm": 0.9267036067403248, + "learning_rate": 3.064602714495286e-05, + "loss": 0.1696, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19266122579574585, + "step": 2595, + "valid_targets_mean": 1382.1, + "valid_targets_min": 676 + }, + { + "epoch": 2.73109243697479, + "grad_norm": 0.7500546233055486, + "learning_rate": 3.060164298900565e-05, + "loss": 0.1689, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1605774164199829, + "step": 2600, + "valid_targets_mean": 1260.2, + "valid_targets_min": 794 + }, + { + "epoch": 2.736344537815126, + "grad_norm": 0.9445550576448264, + "learning_rate": 3.055718609786749e-05, + "loss": 0.17, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16394124925136566, + "step": 2605, + "valid_targets_mean": 1414.1, + "valid_targets_min": 607 + }, + { + "epoch": 2.741596638655462, + "grad_norm": 0.7880924622108275, + "learning_rate": 3.051265677654585e-05, + "loss": 0.1683, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1700436919927597, + "step": 2610, + "valid_targets_mean": 1450.9, + "valid_targets_min": 741 + }, + { + "epoch": 2.7468487394957983, + "grad_norm": 0.7995324958770467, + "learning_rate": 3.0468055330545162e-05, + "loss": 0.1769, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18648771941661835, + "step": 2615, + "valid_targets_mean": 1626.9, + "valid_targets_min": 858 + }, + { + "epoch": 2.7521008403361344, + "grad_norm": 0.776585890510735, + "learning_rate": 3.0423382065864653e-05, + "loss": 0.1587, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16372038424015045, + "step": 2620, + "valid_targets_mean": 1370.7, + "valid_targets_min": 689 + }, + { + "epoch": 2.7573529411764706, + "grad_norm": 0.8233797828888295, + "learning_rate": 3.0378637288996304e-05, + "loss": 0.1754, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1707250475883484, + "step": 2625, + "valid_targets_mean": 1327.7, + "valid_targets_min": 690 + }, + { + "epoch": 2.7626050420168067, + "grad_norm": 0.7313593178890555, + "learning_rate": 3.033382130692269e-05, + "loss": 0.1718, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16939744353294373, + "step": 2630, + "valid_targets_mean": 1433.4, + "valid_targets_min": 718 + }, + { + "epoch": 2.767857142857143, + "grad_norm": 0.7983600909257519, + "learning_rate": 3.0288934427114955e-05, + "loss": 0.1794, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16010600328445435, + "step": 2635, + "valid_targets_mean": 1398.2, + "valid_targets_min": 618 + }, + { + "epoch": 2.773109243697479, + "grad_norm": 0.7280785441425935, + "learning_rate": 3.0243976957530602e-05, + "loss": 0.1629, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16162815690040588, + "step": 2640, + "valid_targets_mean": 1479.6, + "valid_targets_min": 629 + }, + { + "epoch": 2.778361344537815, + "grad_norm": 0.7839303867427334, + "learning_rate": 3.0198949206611475e-05, + "loss": 0.1695, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18356014788150787, + "step": 2645, + "valid_targets_mean": 1549.6, + "valid_targets_min": 650 + }, + { + "epoch": 2.783613445378151, + "grad_norm": 0.7391305503246356, + "learning_rate": 3.0153851483281582e-05, + "loss": 0.1702, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16755986213684082, + "step": 2650, + "valid_targets_mean": 1363.6, + "valid_targets_min": 677 + }, + { + "epoch": 2.7888655462184873, + "grad_norm": 0.7900413678108272, + "learning_rate": 3.010868409694499e-05, + "loss": 0.1672, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1623220145702362, + "step": 2655, + "valid_targets_mean": 1367.9, + "valid_targets_min": 679 + }, + { + "epoch": 2.7941176470588234, + "grad_norm": 0.7222759869118193, + "learning_rate": 3.0063447357483712e-05, + "loss": 0.165, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16432425379753113, + "step": 2660, + "valid_targets_mean": 1393.1, + "valid_targets_min": 504 + }, + { + "epoch": 2.79936974789916, + "grad_norm": 0.7458633773608461, + "learning_rate": 3.0018141575255587e-05, + "loss": 0.167, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16822689771652222, + "step": 2665, + "valid_targets_mean": 1577.6, + "valid_targets_min": 1006 + }, + { + "epoch": 2.8046218487394956, + "grad_norm": 0.7555827595039865, + "learning_rate": 2.9972767061092107e-05, + "loss": 0.1725, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15489238500595093, + "step": 2670, + "valid_targets_mean": 1338.3, + "valid_targets_min": 661 + }, + { + "epoch": 2.809873949579832, + "grad_norm": 0.6713741267521114, + "learning_rate": 2.9927324126296352e-05, + "loss": 0.1752, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1501934975385666, + "step": 2675, + "valid_targets_mean": 1335.4, + "valid_targets_min": 886 + }, + { + "epoch": 2.815126050420168, + "grad_norm": 0.677528061579685, + "learning_rate": 2.98818130826408e-05, + "loss": 0.1694, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1680719256401062, + "step": 2680, + "valid_targets_mean": 1633.0, + "valid_targets_min": 909 + }, + { + "epoch": 2.8203781512605044, + "grad_norm": 0.8220892091600075, + "learning_rate": 2.9836234242365204e-05, + "loss": 0.1728, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17720499634742737, + "step": 2685, + "valid_targets_mean": 1308.2, + "valid_targets_min": 793 + }, + { + "epoch": 2.82563025210084, + "grad_norm": 0.8315780706625598, + "learning_rate": 2.979058791817447e-05, + "loss": 0.1678, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1801975965499878, + "step": 2690, + "valid_targets_mean": 1479.8, + "valid_targets_min": 861 + }, + { + "epoch": 2.8308823529411766, + "grad_norm": 0.7948697249631214, + "learning_rate": 2.974487442323647e-05, + "loss": 0.1653, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16297297179698944, + "step": 2695, + "valid_targets_mean": 1284.6, + "valid_targets_min": 752 + }, + { + "epoch": 2.8361344537815127, + "grad_norm": 0.7446282359364188, + "learning_rate": 2.9699094071179938e-05, + "loss": 0.1677, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18304650485515594, + "step": 2700, + "valid_targets_mean": 1584.1, + "valid_targets_min": 830 + }, + { + "epoch": 2.841386554621849, + "grad_norm": 0.718619587429062, + "learning_rate": 2.9653247176092286e-05, + "loss": 0.1528, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1484600156545639, + "step": 2705, + "valid_targets_mean": 1445.1, + "valid_targets_min": 638 + }, + { + "epoch": 2.846638655462185, + "grad_norm": 0.8381765419273387, + "learning_rate": 2.9607334052517466e-05, + "loss": 0.1681, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1818123310804367, + "step": 2710, + "valid_targets_mean": 1449.8, + "valid_targets_min": 605 + }, + { + "epoch": 2.851890756302521, + "grad_norm": 0.7250086940420657, + "learning_rate": 2.9561355015453803e-05, + "loss": 0.1685, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16832154989242554, + "step": 2715, + "valid_targets_mean": 1551.5, + "valid_targets_min": 746 + }, + { + "epoch": 2.857142857142857, + "grad_norm": 0.7099316939262316, + "learning_rate": 2.9515310380351847e-05, + "loss": 0.1605, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16392531991004944, + "step": 2720, + "valid_targets_mean": 1306.3, + "valid_targets_min": 723 + }, + { + "epoch": 2.8623949579831933, + "grad_norm": 0.7472866347997246, + "learning_rate": 2.9469200463112186e-05, + "loss": 0.1714, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17414012551307678, + "step": 2725, + "valid_targets_mean": 1487.9, + "valid_targets_min": 855 + }, + { + "epoch": 2.8676470588235294, + "grad_norm": 0.7126081269612909, + "learning_rate": 2.9423025580083298e-05, + "loss": 0.168, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15881696343421936, + "step": 2730, + "valid_targets_mean": 1503.1, + "valid_targets_min": 902 + }, + { + "epoch": 2.8728991596638656, + "grad_norm": 0.7172891409501757, + "learning_rate": 2.937678604805938e-05, + "loss": 0.1724, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16258196532726288, + "step": 2735, + "valid_targets_mean": 1501.8, + "valid_targets_min": 798 + }, + { + "epoch": 2.8781512605042017, + "grad_norm": 0.7828132309340979, + "learning_rate": 2.9330482184278168e-05, + "loss": 0.1667, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1718115508556366, + "step": 2740, + "valid_targets_mean": 1378.9, + "valid_targets_min": 740 + }, + { + "epoch": 2.883403361344538, + "grad_norm": 0.7837917980983125, + "learning_rate": 2.9284114306418758e-05, + "loss": 0.1614, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1576087772846222, + "step": 2745, + "valid_targets_mean": 1222.1, + "valid_targets_min": 244 + }, + { + "epoch": 2.888655462184874, + "grad_norm": 0.7472309237344245, + "learning_rate": 2.923768273259942e-05, + "loss": 0.1743, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15255385637283325, + "step": 2750, + "valid_targets_mean": 1328.9, + "valid_targets_min": 714 + }, + { + "epoch": 2.89390756302521, + "grad_norm": 0.796880354826496, + "learning_rate": 2.919118778137546e-05, + "loss": 0.1691, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15773728489875793, + "step": 2755, + "valid_targets_mean": 1268.8, + "valid_targets_min": 585 + }, + { + "epoch": 2.899159663865546, + "grad_norm": 0.7916812281947033, + "learning_rate": 2.9144629771736954e-05, + "loss": 0.1816, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18590059876441956, + "step": 2760, + "valid_targets_mean": 1596.2, + "valid_targets_min": 1041 + }, + { + "epoch": 2.9044117647058822, + "grad_norm": 0.7189169579851691, + "learning_rate": 2.9098009023106645e-05, + "loss": 0.1706, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15632124245166779, + "step": 2765, + "valid_targets_mean": 1373.1, + "valid_targets_min": 657 + }, + { + "epoch": 2.9096638655462184, + "grad_norm": 0.7049554537703587, + "learning_rate": 2.9051325855337684e-05, + "loss": 0.1717, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15910044312477112, + "step": 2770, + "valid_targets_mean": 1468.1, + "valid_targets_min": 959 + }, + { + "epoch": 2.9149159663865545, + "grad_norm": 0.7054773517266925, + "learning_rate": 2.90045805887115e-05, + "loss": 0.166, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1691712886095047, + "step": 2775, + "valid_targets_mean": 1426.8, + "valid_targets_min": 620 + }, + { + "epoch": 2.9201680672268906, + "grad_norm": 0.8510450051223593, + "learning_rate": 2.8957773543935518e-05, + "loss": 0.1674, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1627202183008194, + "step": 2780, + "valid_targets_mean": 1360.6, + "valid_targets_min": 732 + }, + { + "epoch": 2.9254201680672267, + "grad_norm": 0.7255441493487386, + "learning_rate": 2.8910905042141046e-05, + "loss": 0.1715, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17565231025218964, + "step": 2785, + "valid_targets_mean": 1550.9, + "valid_targets_min": 732 + }, + { + "epoch": 2.9306722689075633, + "grad_norm": 0.7448004871056576, + "learning_rate": 2.8863975404881022e-05, + "loss": 0.166, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.170585036277771, + "step": 2790, + "valid_targets_mean": 1635.2, + "valid_targets_min": 682 + }, + { + "epoch": 2.935924369747899, + "grad_norm": 0.8125236767167314, + "learning_rate": 2.881698495412781e-05, + "loss": 0.1626, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16882717609405518, + "step": 2795, + "valid_targets_mean": 1338.4, + "valid_targets_min": 596 + }, + { + "epoch": 2.9411764705882355, + "grad_norm": 0.7100556725806012, + "learning_rate": 2.8769934012271004e-05, + "loss": 0.16, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1684436947107315, + "step": 2800, + "valid_targets_mean": 1609.4, + "valid_targets_min": 747 + }, + { + "epoch": 2.946428571428571, + "grad_norm": 0.742789781874144, + "learning_rate": 2.8722822902115228e-05, + "loss": 0.1778, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1685582548379898, + "step": 2805, + "valid_targets_mean": 1568.2, + "valid_targets_min": 820 + }, + { + "epoch": 2.9516806722689077, + "grad_norm": 0.7211288410702199, + "learning_rate": 2.8675651946877884e-05, + "loss": 0.1657, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17647072672843933, + "step": 2810, + "valid_targets_mean": 1670.1, + "valid_targets_min": 799 + }, + { + "epoch": 2.956932773109244, + "grad_norm": 0.7463660696176379, + "learning_rate": 2.862842147018696e-05, + "loss": 0.16, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17189790308475494, + "step": 2815, + "valid_targets_mean": 1533.6, + "valid_targets_min": 1047 + }, + { + "epoch": 2.96218487394958, + "grad_norm": 0.7064510545820726, + "learning_rate": 2.858113179607881e-05, + "loss": 0.1556, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1601008176803589, + "step": 2820, + "valid_targets_mean": 1528.5, + "valid_targets_min": 741 + }, + { + "epoch": 2.967436974789916, + "grad_norm": 0.7179205966287691, + "learning_rate": 2.8533783248995938e-05, + "loss": 0.1522, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15484890341758728, + "step": 2825, + "valid_targets_mean": 1404.0, + "valid_targets_min": 720 + }, + { + "epoch": 2.972689075630252, + "grad_norm": 0.7844547172494378, + "learning_rate": 2.848637615378475e-05, + "loss": 0.1693, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16542135179042816, + "step": 2830, + "valid_targets_mean": 1366.3, + "valid_targets_min": 892 + }, + { + "epoch": 2.9779411764705883, + "grad_norm": 0.7331691954809272, + "learning_rate": 2.8438910835693314e-05, + "loss": 0.165, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17777270078659058, + "step": 2835, + "valid_targets_mean": 1436.8, + "valid_targets_min": 684 + }, + { + "epoch": 2.9831932773109244, + "grad_norm": 0.6822641232454941, + "learning_rate": 2.8391387620369192e-05, + "loss": 0.1587, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1580207496881485, + "step": 2840, + "valid_targets_mean": 1425.5, + "valid_targets_min": 874 + }, + { + "epoch": 2.9884453781512605, + "grad_norm": 0.7108579727414756, + "learning_rate": 2.834380683385714e-05, + "loss": 0.1616, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16222992539405823, + "step": 2845, + "valid_targets_mean": 1604.8, + "valid_targets_min": 1280 + }, + { + "epoch": 2.9936974789915967, + "grad_norm": 0.7199485862107549, + "learning_rate": 2.8296168802596892e-05, + "loss": 0.1667, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16997018456459045, + "step": 2850, + "valid_targets_mean": 1522.8, + "valid_targets_min": 589 + }, + { + "epoch": 2.9989495798319328, + "grad_norm": 0.7245690379476749, + "learning_rate": 2.8248473853420933e-05, + "loss": 0.171, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18465590476989746, + "step": 2855, + "valid_targets_mean": 1654.8, + "valid_targets_min": 918 + }, + { + "epoch": 3.004201680672269, + "grad_norm": 0.6536431805707318, + "learning_rate": 2.8200722313552247e-05, + "loss": 0.2481, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2750670313835144, + "step": 2860, + "valid_targets_mean": 3678.0, + "valid_targets_min": 702 + }, + { + "epoch": 3.009453781512605, + "grad_norm": 0.5616581452948703, + "learning_rate": 2.8152914510602073e-05, + "loss": 0.2663, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2694254219532013, + "step": 2865, + "valid_targets_mean": 4133.2, + "valid_targets_min": 1550 + }, + { + "epoch": 3.014705882352941, + "grad_norm": 0.5914552324016616, + "learning_rate": 2.810505077256765e-05, + "loss": 0.2531, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.26886335015296936, + "step": 2870, + "valid_targets_mean": 3929.9, + "valid_targets_min": 1296 + }, + { + "epoch": 3.0199579831932772, + "grad_norm": 0.5617545432111057, + "learning_rate": 2.8057131427829983e-05, + "loss": 0.2488, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23543497920036316, + "step": 2875, + "valid_targets_mean": 4362.6, + "valid_targets_min": 1681 + }, + { + "epoch": 3.0252100840336134, + "grad_norm": 0.5909970139213782, + "learning_rate": 2.800915680515157e-05, + "loss": 0.2512, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.269046425819397, + "step": 2880, + "valid_targets_mean": 3591.2, + "valid_targets_min": 1044 + }, + { + "epoch": 3.0304621848739495, + "grad_norm": 0.548113977574793, + "learning_rate": 2.7961127233674167e-05, + "loss": 0.2608, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2423868477344513, + "step": 2885, + "valid_targets_mean": 3697.8, + "valid_targets_min": 920 + }, + { + "epoch": 3.0357142857142856, + "grad_norm": 0.5485874887437441, + "learning_rate": 2.7913043042916513e-05, + "loss": 0.2389, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25993612408638, + "step": 2890, + "valid_targets_mean": 5826.4, + "valid_targets_min": 2060 + }, + { + "epoch": 3.0409663865546217, + "grad_norm": 0.5329423434447529, + "learning_rate": 2.786490456277208e-05, + "loss": 0.2544, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24909579753875732, + "step": 2895, + "valid_targets_mean": 4033.6, + "valid_targets_min": 467 + }, + { + "epoch": 3.046218487394958, + "grad_norm": 0.5983501432535179, + "learning_rate": 2.7816712123506796e-05, + "loss": 0.2631, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2781432271003723, + "step": 2900, + "valid_targets_mean": 3789.9, + "valid_targets_min": 1689 + }, + { + "epoch": 3.051470588235294, + "grad_norm": 0.5971903589113992, + "learning_rate": 2.776846605575681e-05, + "loss": 0.2551, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2563186287879944, + "step": 2905, + "valid_targets_mean": 3695.6, + "valid_targets_min": 1477 + }, + { + "epoch": 3.05672268907563, + "grad_norm": 0.5806312781845833, + "learning_rate": 2.772016669052618e-05, + "loss": 0.2649, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2883797883987427, + "step": 2910, + "valid_targets_mean": 4019.2, + "valid_targets_min": 1223 + }, + { + "epoch": 3.0619747899159666, + "grad_norm": 0.5300497777002529, + "learning_rate": 2.767181435918464e-05, + "loss": 0.2572, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27011632919311523, + "step": 2915, + "valid_targets_mean": 4429.1, + "valid_targets_min": 1552 + }, + { + "epoch": 3.0672268907563027, + "grad_norm": 0.6074007571412762, + "learning_rate": 2.7623409393465298e-05, + "loss": 0.2513, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2498617321252823, + "step": 2920, + "valid_targets_mean": 3706.6, + "valid_targets_min": 1439 + }, + { + "epoch": 3.072478991596639, + "grad_norm": 0.626168733306276, + "learning_rate": 2.7574952125462386e-05, + "loss": 0.2522, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23380611836910248, + "step": 2925, + "valid_targets_mean": 3199.5, + "valid_targets_min": 1402 + }, + { + "epoch": 3.077731092436975, + "grad_norm": 0.6268290865377733, + "learning_rate": 2.7526442887628962e-05, + "loss": 0.2704, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27413225173950195, + "step": 2930, + "valid_targets_mean": 3583.0, + "valid_targets_min": 1586 + }, + { + "epoch": 3.082983193277311, + "grad_norm": 0.6176358259961854, + "learning_rate": 2.7477882012774633e-05, + "loss": 0.2567, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2532740831375122, + "step": 2935, + "valid_targets_mean": 3411.6, + "valid_targets_min": 1538 + }, + { + "epoch": 3.088235294117647, + "grad_norm": 0.6568380568558851, + "learning_rate": 2.742926983406328e-05, + "loss": 0.2605, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2723920941352844, + "step": 2940, + "valid_targets_mean": 2824.4, + "valid_targets_min": 1058 + }, + { + "epoch": 3.0934873949579833, + "grad_norm": 0.6596581392165033, + "learning_rate": 2.7380606685010767e-05, + "loss": 0.2743, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2707256078720093, + "step": 2945, + "valid_targets_mean": 2777.6, + "valid_targets_min": 1205 + }, + { + "epoch": 3.0987394957983194, + "grad_norm": 0.6126808354592166, + "learning_rate": 2.7331892899482654e-05, + "loss": 0.2574, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.266759991645813, + "step": 2950, + "valid_targets_mean": 3421.2, + "valid_targets_min": 1165 + }, + { + "epoch": 3.1039915966386555, + "grad_norm": 0.6307476273476691, + "learning_rate": 2.7283128811691893e-05, + "loss": 0.2605, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2549319565296173, + "step": 2955, + "valid_targets_mean": 3220.3, + "valid_targets_min": 1267 + }, + { + "epoch": 3.1092436974789917, + "grad_norm": 0.6279599813034801, + "learning_rate": 2.7234314756196564e-05, + "loss": 0.255, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24072325229644775, + "step": 2960, + "valid_targets_mean": 3117.6, + "valid_targets_min": 1026 + }, + { + "epoch": 3.1144957983193278, + "grad_norm": 0.612911115813002, + "learning_rate": 2.718545106789755e-05, + "loss": 0.2471, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25921279191970825, + "step": 2965, + "valid_targets_mean": 3350.1, + "valid_targets_min": 1345 + }, + { + "epoch": 3.119747899159664, + "grad_norm": 0.6086001253575483, + "learning_rate": 2.713653808203626e-05, + "loss": 0.2625, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24595654010772705, + "step": 2970, + "valid_targets_mean": 3563.4, + "valid_targets_min": 2050 + }, + { + "epoch": 3.125, + "grad_norm": 0.6022736229918767, + "learning_rate": 2.7087576134192305e-05, + "loss": 0.263, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23543179035186768, + "step": 2975, + "valid_targets_mean": 3142.4, + "valid_targets_min": 1166 + }, + { + "epoch": 3.130252100840336, + "grad_norm": 0.6154494544856133, + "learning_rate": 2.7038565560281252e-05, + "loss": 0.2626, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2742067575454712, + "step": 2980, + "valid_targets_mean": 3220.9, + "valid_targets_min": 997 + }, + { + "epoch": 3.1355042016806722, + "grad_norm": 0.6742689274132734, + "learning_rate": 2.6989506696552224e-05, + "loss": 0.2457, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2767985463142395, + "step": 2985, + "valid_targets_mean": 2980.7, + "valid_targets_min": 1293 + }, + { + "epoch": 3.1407563025210083, + "grad_norm": 0.6039332698980796, + "learning_rate": 2.6940399879585685e-05, + "loss": 0.255, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23629191517829895, + "step": 2990, + "valid_targets_mean": 3027.2, + "valid_targets_min": 1732 + }, + { + "epoch": 3.1460084033613445, + "grad_norm": 0.6818227952934203, + "learning_rate": 2.6891245446291093e-05, + "loss": 0.2566, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27924174070358276, + "step": 2995, + "valid_targets_mean": 3159.9, + "valid_targets_min": 1108 + }, + { + "epoch": 3.1512605042016806, + "grad_norm": 0.6924339005528242, + "learning_rate": 2.6842043733904578e-05, + "loss": 0.2517, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25699329376220703, + "step": 3000, + "valid_targets_mean": 3364.2, + "valid_targets_min": 571 + }, + { + "epoch": 3.1565126050420167, + "grad_norm": 0.675775810675891, + "learning_rate": 2.6792795079986634e-05, + "loss": 0.258, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25223487615585327, + "step": 3005, + "valid_targets_mean": 2891.1, + "valid_targets_min": 738 + }, + { + "epoch": 3.161764705882353, + "grad_norm": 0.7118892851934508, + "learning_rate": 2.6743499822419833e-05, + "loss": 0.246, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.26765280961990356, + "step": 3010, + "valid_targets_mean": 2982.2, + "valid_targets_min": 1798 + }, + { + "epoch": 3.167016806722689, + "grad_norm": 0.6135998796483827, + "learning_rate": 2.669415829940646e-05, + "loss": 0.2528, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24437305331230164, + "step": 3015, + "valid_targets_mean": 3367.0, + "valid_targets_min": 1338 + }, + { + "epoch": 3.172268907563025, + "grad_norm": 0.6308992296328928, + "learning_rate": 2.6644770849466226e-05, + "loss": 0.2566, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.26935499906539917, + "step": 3020, + "valid_targets_mean": 3564.4, + "valid_targets_min": 1276 + }, + { + "epoch": 3.177521008403361, + "grad_norm": 0.6604476871808482, + "learning_rate": 2.6595337811433925e-05, + "loss": 0.2546, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25287342071533203, + "step": 3025, + "valid_targets_mean": 3842.9, + "valid_targets_min": 1668 + }, + { + "epoch": 3.1827731092436973, + "grad_norm": 0.5864716374259419, + "learning_rate": 2.654585952445714e-05, + "loss": 0.2538, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2597090005874634, + "step": 3030, + "valid_targets_mean": 3920.2, + "valid_targets_min": 1373 + }, + { + "epoch": 3.1880252100840334, + "grad_norm": 0.6138428018636582, + "learning_rate": 2.6496336327993882e-05, + "loss": 0.2572, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2661425769329071, + "step": 3035, + "valid_targets_mean": 3629.1, + "valid_targets_min": 1858 + }, + { + "epoch": 3.19327731092437, + "grad_norm": 0.5951194931237926, + "learning_rate": 2.6446768561810264e-05, + "loss": 0.2559, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2323005348443985, + "step": 3040, + "valid_targets_mean": 3384.1, + "valid_targets_min": 922 + }, + { + "epoch": 3.198529411764706, + "grad_norm": 0.6617141663860238, + "learning_rate": 2.6397156565978198e-05, + "loss": 0.2537, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.28470370173454285, + "step": 3045, + "valid_targets_mean": 3499.2, + "valid_targets_min": 2483 + }, + { + "epoch": 3.203781512605042, + "grad_norm": 0.6472312935786627, + "learning_rate": 2.6347500680873043e-05, + "loss": 0.2491, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24719394743442535, + "step": 3050, + "valid_targets_mean": 2993.0, + "valid_targets_min": 977 + }, + { + "epoch": 3.2090336134453783, + "grad_norm": 0.5796753467452805, + "learning_rate": 2.6297801247171258e-05, + "loss": 0.2403, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2180900275707245, + "step": 3055, + "valid_targets_mean": 3620.9, + "valid_targets_min": 1856 + }, + { + "epoch": 3.2142857142857144, + "grad_norm": 0.663197194188445, + "learning_rate": 2.6248058605848097e-05, + "loss": 0.2469, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24358363449573517, + "step": 3060, + "valid_targets_mean": 3015.3, + "valid_targets_min": 1200 + }, + { + "epoch": 3.2195378151260505, + "grad_norm": 0.5921044967379778, + "learning_rate": 2.6198273098175234e-05, + "loss": 0.2468, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21505384147167206, + "step": 3065, + "valid_targets_mean": 3572.4, + "valid_targets_min": 1607 + }, + { + "epoch": 3.2247899159663866, + "grad_norm": 0.656610014798293, + "learning_rate": 2.614844506571844e-05, + "loss": 0.2586, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24926620721817017, + "step": 3070, + "valid_targets_mean": 2880.9, + "valid_targets_min": 1358 + }, + { + "epoch": 3.2300420168067228, + "grad_norm": 0.6222197525250114, + "learning_rate": 2.609857485033525e-05, + "loss": 0.2518, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2442103624343872, + "step": 3075, + "valid_targets_mean": 3209.0, + "valid_targets_min": 1219 + }, + { + "epoch": 3.235294117647059, + "grad_norm": 0.587521968482715, + "learning_rate": 2.6048662794172595e-05, + "loss": 0.2545, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23662276566028595, + "step": 3080, + "valid_targets_mean": 3512.0, + "valid_targets_min": 1168 + }, + { + "epoch": 3.240546218487395, + "grad_norm": 0.6685246266555611, + "learning_rate": 2.599870923966447e-05, + "loss": 0.2345, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2525354027748108, + "step": 3085, + "valid_targets_mean": 2764.2, + "valid_targets_min": 474 + }, + { + "epoch": 3.245798319327731, + "grad_norm": 0.6202106667084994, + "learning_rate": 2.5948714529529565e-05, + "loss": 0.2481, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24517540633678436, + "step": 3090, + "valid_targets_mean": 3665.3, + "valid_targets_min": 1140 + }, + { + "epoch": 3.2510504201680672, + "grad_norm": 0.5785793477278848, + "learning_rate": 2.5898679006768958e-05, + "loss": 0.2418, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22179822623729706, + "step": 3095, + "valid_targets_mean": 3486.1, + "valid_targets_min": 1482 + }, + { + "epoch": 3.2563025210084033, + "grad_norm": 0.6033278556859933, + "learning_rate": 2.5848603014663702e-05, + "loss": 0.2375, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21563810110092163, + "step": 3100, + "valid_targets_mean": 3097.8, + "valid_targets_min": 904 + }, + { + "epoch": 3.2615546218487395, + "grad_norm": 0.6455004631708245, + "learning_rate": 2.579848689677252e-05, + "loss": 0.2513, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.29056334495544434, + "step": 3105, + "valid_targets_mean": 3727.6, + "valid_targets_min": 1194 + }, + { + "epoch": 3.2668067226890756, + "grad_norm": 0.5925539085498962, + "learning_rate": 2.5748330996929414e-05, + "loss": 0.2471, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2517462372779846, + "step": 3110, + "valid_targets_mean": 3901.4, + "valid_targets_min": 1527 + }, + { + "epoch": 3.2720588235294117, + "grad_norm": 0.6625252347137165, + "learning_rate": 2.5698135659241334e-05, + "loss": 0.2458, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2597498893737793, + "step": 3115, + "valid_targets_mean": 3953.8, + "valid_targets_min": 1428 + }, + { + "epoch": 3.277310924369748, + "grad_norm": 0.6869236027507247, + "learning_rate": 2.564790122808579e-05, + "loss": 0.2531, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27155032753944397, + "step": 3120, + "valid_targets_mean": 3239.1, + "valid_targets_min": 1460 + }, + { + "epoch": 3.282563025210084, + "grad_norm": 0.641846245505168, + "learning_rate": 2.5597628048108504e-05, + "loss": 0.2653, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.26535165309906006, + "step": 3125, + "valid_targets_mean": 3494.8, + "valid_targets_min": 1172 + }, + { + "epoch": 3.28781512605042, + "grad_norm": 0.6112401795648174, + "learning_rate": 2.5547316464221058e-05, + "loss": 0.2422, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2558062672615051, + "step": 3130, + "valid_targets_mean": 3518.0, + "valid_targets_min": 1229 + }, + { + "epoch": 3.293067226890756, + "grad_norm": 0.5712486962165064, + "learning_rate": 2.5496966821598493e-05, + "loss": 0.24, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23176561295986176, + "step": 3135, + "valid_targets_mean": 3590.5, + "valid_targets_min": 1523 + }, + { + "epoch": 3.2983193277310923, + "grad_norm": 0.6085435476900142, + "learning_rate": 2.5446579465676977e-05, + "loss": 0.2376, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23727688193321228, + "step": 3140, + "valid_targets_mean": 3541.0, + "valid_targets_min": 997 + }, + { + "epoch": 3.3035714285714284, + "grad_norm": 0.6531904825025399, + "learning_rate": 2.5396154742151407e-05, + "loss": 0.2383, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2473251223564148, + "step": 3145, + "valid_targets_mean": 3417.0, + "valid_targets_min": 621 + }, + { + "epoch": 3.3088235294117645, + "grad_norm": 0.6509222958342396, + "learning_rate": 2.5345692996973075e-05, + "loss": 0.2445, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24736976623535156, + "step": 3150, + "valid_targets_mean": 3183.2, + "valid_targets_min": 1282 + }, + { + "epoch": 3.314075630252101, + "grad_norm": 0.5707923779013074, + "learning_rate": 2.5295194576347233e-05, + "loss": 0.229, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21255888044834137, + "step": 3155, + "valid_targets_mean": 3807.4, + "valid_targets_min": 1143 + }, + { + "epoch": 3.3193277310924367, + "grad_norm": 0.638283494349549, + "learning_rate": 2.5244659826730774e-05, + "loss": 0.2369, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23158839344978333, + "step": 3160, + "valid_targets_mean": 3191.6, + "valid_targets_min": 1438 + }, + { + "epoch": 3.3245798319327733, + "grad_norm": 0.5983879302794481, + "learning_rate": 2.519408909482984e-05, + "loss": 0.2587, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23230604827404022, + "step": 3165, + "valid_targets_mean": 3549.1, + "valid_targets_min": 2091 + }, + { + "epoch": 3.3298319327731094, + "grad_norm": 0.6356003504281118, + "learning_rate": 2.5143482727597427e-05, + "loss": 0.2408, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23692654073238373, + "step": 3170, + "valid_targets_mean": 3175.4, + "valid_targets_min": 1305 + }, + { + "epoch": 3.3350840336134455, + "grad_norm": 0.5822669278425938, + "learning_rate": 2.509284107223102e-05, + "loss": 0.2441, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2323712259531021, + "step": 3175, + "valid_targets_mean": 3699.6, + "valid_targets_min": 1428 + }, + { + "epoch": 3.3403361344537816, + "grad_norm": 0.6034461853939603, + "learning_rate": 2.50421644761702e-05, + "loss": 0.242, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2210870236158371, + "step": 3180, + "valid_targets_mean": 3405.7, + "valid_targets_min": 1388 + }, + { + "epoch": 3.3455882352941178, + "grad_norm": 0.6142007275077153, + "learning_rate": 2.499145328709429e-05, + "loss": 0.2497, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25747138261795044, + "step": 3185, + "valid_targets_mean": 3644.9, + "valid_targets_min": 1823 + }, + { + "epoch": 3.350840336134454, + "grad_norm": 0.6119837836741985, + "learning_rate": 2.4940707852919924e-05, + "loss": 0.2296, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2111436128616333, + "step": 3190, + "valid_targets_mean": 3011.4, + "valid_targets_min": 1109 + }, + { + "epoch": 3.35609243697479, + "grad_norm": 0.6533534419454151, + "learning_rate": 2.488992852179868e-05, + "loss": 0.2436, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23850302398204803, + "step": 3195, + "valid_targets_mean": 3141.6, + "valid_targets_min": 1649 + }, + { + "epoch": 3.361344537815126, + "grad_norm": 0.7140300662865305, + "learning_rate": 2.483911564211472e-05, + "loss": 0.2366, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.26096731424331665, + "step": 3200, + "valid_targets_mean": 2904.2, + "valid_targets_min": 1249 + }, + { + "epoch": 3.366596638655462, + "grad_norm": 0.7251927942844403, + "learning_rate": 2.4788269562482355e-05, + "loss": 0.2531, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.26130279898643494, + "step": 3205, + "valid_targets_mean": 3641.2, + "valid_targets_min": 1793 + }, + { + "epoch": 3.3718487394957983, + "grad_norm": 0.6421393556947993, + "learning_rate": 2.4737390631743675e-05, + "loss": 0.2463, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2507364749908447, + "step": 3210, + "valid_targets_mean": 3154.0, + "valid_targets_min": 1054 + }, + { + "epoch": 3.3771008403361344, + "grad_norm": 0.6437737473605846, + "learning_rate": 2.4686479198966146e-05, + "loss": 0.2458, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24308231472969055, + "step": 3215, + "valid_targets_mean": 3276.6, + "valid_targets_min": 1055 + }, + { + "epoch": 3.3823529411764706, + "grad_norm": 0.6571399883695811, + "learning_rate": 2.463553561344024e-05, + "loss": 0.2507, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24305208027362823, + "step": 3220, + "valid_targets_mean": 3750.0, + "valid_targets_min": 1241 + }, + { + "epoch": 3.3876050420168067, + "grad_norm": 0.650161760454692, + "learning_rate": 2.4584560224677013e-05, + "loss": 0.2453, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24910904467105865, + "step": 3225, + "valid_targets_mean": 3649.5, + "valid_targets_min": 1174 + }, + { + "epoch": 3.392857142857143, + "grad_norm": 0.645357588744853, + "learning_rate": 2.4533553382405702e-05, + "loss": 0.2565, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2722882926464081, + "step": 3230, + "valid_targets_mean": 3284.9, + "valid_targets_min": 992 + }, + { + "epoch": 3.398109243697479, + "grad_norm": 0.6297523245044137, + "learning_rate": 2.4482515436571365e-05, + "loss": 0.2473, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25592392683029175, + "step": 3235, + "valid_targets_mean": 3817.9, + "valid_targets_min": 1133 + }, + { + "epoch": 3.403361344537815, + "grad_norm": 0.6382149094735594, + "learning_rate": 2.4431446737332437e-05, + "loss": 0.2478, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2542281150817871, + "step": 3240, + "valid_targets_mean": 3242.6, + "valid_targets_min": 1409 + }, + { + "epoch": 3.408613445378151, + "grad_norm": 0.726502424494956, + "learning_rate": 2.438034763505833e-05, + "loss": 0.2499, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25886449217796326, + "step": 3245, + "valid_targets_mean": 3062.4, + "valid_targets_min": 719 + }, + { + "epoch": 3.4138655462184873, + "grad_norm": 0.659719001774402, + "learning_rate": 2.432921848032707e-05, + "loss": 0.2515, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25948482751846313, + "step": 3250, + "valid_targets_mean": 3307.1, + "valid_targets_min": 1239 + }, + { + "epoch": 3.4191176470588234, + "grad_norm": 0.6125599642876945, + "learning_rate": 2.427805962392286e-05, + "loss": 0.2416, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24624377489089966, + "step": 3255, + "valid_targets_mean": 3635.1, + "valid_targets_min": 1349 + }, + { + "epoch": 3.4243697478991595, + "grad_norm": 0.6755501860373633, + "learning_rate": 2.4226871416833683e-05, + "loss": 0.2453, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2604214549064636, + "step": 3260, + "valid_targets_mean": 3250.2, + "valid_targets_min": 1434 + }, + { + "epoch": 3.4296218487394956, + "grad_norm": 0.6523430203235168, + "learning_rate": 2.4175654210248848e-05, + "loss": 0.2408, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23800113797187805, + "step": 3265, + "valid_targets_mean": 3233.2, + "valid_targets_min": 521 + }, + { + "epoch": 3.434873949579832, + "grad_norm": 0.6487475032548123, + "learning_rate": 2.4124408355556677e-05, + "loss": 0.2548, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2616475224494934, + "step": 3270, + "valid_targets_mean": 3477.9, + "valid_targets_min": 937 + }, + { + "epoch": 3.440126050420168, + "grad_norm": 0.7183856650514495, + "learning_rate": 2.4073134204342014e-05, + "loss": 0.254, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25091075897216797, + "step": 3275, + "valid_targets_mean": 3096.8, + "valid_targets_min": 1239 + }, + { + "epoch": 3.4453781512605044, + "grad_norm": 0.6435718093662096, + "learning_rate": 2.4021832108383837e-05, + "loss": 0.2332, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23243436217308044, + "step": 3280, + "valid_targets_mean": 3552.1, + "valid_targets_min": 1457 + }, + { + "epoch": 3.4506302521008405, + "grad_norm": 0.6794408128931803, + "learning_rate": 2.3970502419652854e-05, + "loss": 0.2358, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24406090378761292, + "step": 3285, + "valid_targets_mean": 3231.3, + "valid_targets_min": 1307 + }, + { + "epoch": 3.4558823529411766, + "grad_norm": 0.6369525387600705, + "learning_rate": 2.3919145490309076e-05, + "loss": 0.2397, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24544468522071838, + "step": 3290, + "valid_targets_mean": 3674.0, + "valid_targets_min": 1773 + }, + { + "epoch": 3.4611344537815127, + "grad_norm": 0.6864257084128846, + "learning_rate": 2.38677616726994e-05, + "loss": 0.2314, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23525570333003998, + "step": 3295, + "valid_targets_mean": 3274.8, + "valid_targets_min": 1035 + }, + { + "epoch": 3.466386554621849, + "grad_norm": 0.6249370596202156, + "learning_rate": 2.381635131935521e-05, + "loss": 0.2307, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23440296947956085, + "step": 3300, + "valid_targets_mean": 3696.1, + "valid_targets_min": 1333 + }, + { + "epoch": 3.471638655462185, + "grad_norm": 0.609366608375307, + "learning_rate": 2.3764914782989926e-05, + "loss": 0.235, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2386169135570526, + "step": 3305, + "valid_targets_mean": 3717.7, + "valid_targets_min": 1062 + }, + { + "epoch": 3.476890756302521, + "grad_norm": 0.6957649137605235, + "learning_rate": 2.3713452416496625e-05, + "loss": 0.2263, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2374548614025116, + "step": 3310, + "valid_targets_mean": 2991.9, + "valid_targets_min": 993 + }, + { + "epoch": 3.482142857142857, + "grad_norm": 0.6360187725166639, + "learning_rate": 2.366196457294558e-05, + "loss": 0.2258, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23413576185703278, + "step": 3315, + "valid_targets_mean": 3540.1, + "valid_targets_min": 873 + }, + { + "epoch": 3.4873949579831933, + "grad_norm": 0.6151473063134504, + "learning_rate": 2.3610451605581858e-05, + "loss": 0.2278, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21768996119499207, + "step": 3320, + "valid_targets_mean": 3565.8, + "valid_targets_min": 1152 + }, + { + "epoch": 3.4926470588235294, + "grad_norm": 0.6627058497672066, + "learning_rate": 2.3558913867822905e-05, + "loss": 0.238, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24642956256866455, + "step": 3325, + "valid_targets_mean": 3437.2, + "valid_targets_min": 1128 + }, + { + "epoch": 3.4978991596638656, + "grad_norm": 0.6487038665095798, + "learning_rate": 2.3507351713256105e-05, + "loss": 0.2494, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22559967637062073, + "step": 3330, + "valid_targets_mean": 3062.5, + "valid_targets_min": 1123 + }, + { + "epoch": 3.5031512605042017, + "grad_norm": 0.7141894926568165, + "learning_rate": 2.3455765495636353e-05, + "loss": 0.2404, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2572299838066101, + "step": 3335, + "valid_targets_mean": 2870.6, + "valid_targets_min": 1278 + }, + { + "epoch": 3.508403361344538, + "grad_norm": 0.7021679105572891, + "learning_rate": 2.3404155568883643e-05, + "loss": 0.224, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23877769708633423, + "step": 3340, + "valid_targets_mean": 3168.8, + "valid_targets_min": 1834 + }, + { + "epoch": 3.513655462184874, + "grad_norm": 0.597320613139139, + "learning_rate": 2.3352522287080625e-05, + "loss": 0.2369, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21225066483020782, + "step": 3345, + "valid_targets_mean": 3446.2, + "valid_targets_min": 420 + }, + { + "epoch": 3.51890756302521, + "grad_norm": 0.6380276235544516, + "learning_rate": 2.3300866004470182e-05, + "loss": 0.2432, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24665868282318115, + "step": 3350, + "valid_targets_mean": 3379.9, + "valid_targets_min": 757 + }, + { + "epoch": 3.524159663865546, + "grad_norm": 0.7068358500231999, + "learning_rate": 2.324918707545302e-05, + "loss": 0.241, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24660983681678772, + "step": 3355, + "valid_targets_mean": 2930.9, + "valid_targets_min": 732 + }, + { + "epoch": 3.5294117647058822, + "grad_norm": 0.6415894870301354, + "learning_rate": 2.3197485854585183e-05, + "loss": 0.2365, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2307543158531189, + "step": 3360, + "valid_targets_mean": 3399.6, + "valid_targets_min": 929 + }, + { + "epoch": 3.5346638655462184, + "grad_norm": 0.6658926618185477, + "learning_rate": 2.3145762696575675e-05, + "loss": 0.2382, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25282666087150574, + "step": 3365, + "valid_targets_mean": 3603.7, + "valid_targets_min": 1217 + }, + { + "epoch": 3.5399159663865545, + "grad_norm": 0.9220749340704859, + "learning_rate": 2.3094017956283995e-05, + "loss": 0.223, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17968519032001495, + "step": 3370, + "valid_targets_mean": 1437.6, + "valid_targets_min": 544 + }, + { + "epoch": 3.5451680672268906, + "grad_norm": 0.8146754285295436, + "learning_rate": 2.3042251988717728e-05, + "loss": 0.1748, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1631278544664383, + "step": 3375, + "valid_targets_mean": 1329.9, + "valid_targets_min": 632 + }, + { + "epoch": 3.5504201680672267, + "grad_norm": 0.8079169271047991, + "learning_rate": 2.2990465149030077e-05, + "loss": 0.1602, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14737124741077423, + "step": 3380, + "valid_targets_mean": 1353.5, + "valid_targets_min": 514 + }, + { + "epoch": 3.5556722689075633, + "grad_norm": 0.8535871657760787, + "learning_rate": 2.2938657792517446e-05, + "loss": 0.164, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16740497946739197, + "step": 3385, + "valid_targets_mean": 1316.6, + "valid_targets_min": 701 + }, + { + "epoch": 3.560924369747899, + "grad_norm": 0.7719202998888485, + "learning_rate": 2.2886830274617017e-05, + "loss": 0.1537, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1611393243074417, + "step": 3390, + "valid_targets_mean": 1592.3, + "valid_targets_min": 754 + }, + { + "epoch": 3.5661764705882355, + "grad_norm": 0.7958529561306797, + "learning_rate": 2.2834982950904267e-05, + "loss": 0.1582, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14342686533927917, + "step": 3395, + "valid_targets_mean": 1302.9, + "valid_targets_min": 746 + }, + { + "epoch": 3.571428571428571, + "grad_norm": 0.8182753300383552, + "learning_rate": 2.2783116177090573e-05, + "loss": 0.1669, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16086168587207794, + "step": 3400, + "valid_targets_mean": 1477.3, + "valid_targets_min": 774 + }, + { + "epoch": 3.5766806722689077, + "grad_norm": 0.8440198093915002, + "learning_rate": 2.2731230309020762e-05, + "loss": 0.1445, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14826279878616333, + "step": 3405, + "valid_targets_mean": 1277.8, + "valid_targets_min": 648 + }, + { + "epoch": 3.581932773109244, + "grad_norm": 0.7376313701958287, + "learning_rate": 2.2679325702670642e-05, + "loss": 0.1665, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1509246826171875, + "step": 3410, + "valid_targets_mean": 1484.6, + "valid_targets_min": 708 + }, + { + "epoch": 3.58718487394958, + "grad_norm": 0.7318924656750266, + "learning_rate": 2.2627402714144586e-05, + "loss": 0.1481, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13782326877117157, + "step": 3415, + "valid_targets_mean": 1430.1, + "valid_targets_min": 770 + }, + { + "epoch": 3.592436974789916, + "grad_norm": 0.7765160826126889, + "learning_rate": 2.2575461699673085e-05, + "loss": 0.1547, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13097913563251495, + "step": 3420, + "valid_targets_mean": 1201.6, + "valid_targets_min": 572 + }, + { + "epoch": 3.597689075630252, + "grad_norm": 0.7638002189556976, + "learning_rate": 2.2523503015610303e-05, + "loss": 0.1527, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1455516219139099, + "step": 3425, + "valid_targets_mean": 1363.5, + "valid_targets_min": 627 + }, + { + "epoch": 3.6029411764705883, + "grad_norm": 1.2976616643941823, + "learning_rate": 2.2471527018431637e-05, + "loss": 0.1559, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16458860039710999, + "step": 3430, + "valid_targets_mean": 1451.6, + "valid_targets_min": 765 + }, + { + "epoch": 3.6081932773109244, + "grad_norm": 0.7946926976962566, + "learning_rate": 2.2419534064731238e-05, + "loss": 0.145, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15298821032047272, + "step": 3435, + "valid_targets_mean": 1393.4, + "valid_targets_min": 740 + }, + { + "epoch": 3.6134453781512605, + "grad_norm": 0.7749793995924292, + "learning_rate": 2.236752451121963e-05, + "loss": 0.1465, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1496553122997284, + "step": 3440, + "valid_targets_mean": 1498.2, + "valid_targets_min": 821 + }, + { + "epoch": 3.6186974789915967, + "grad_norm": 0.8079854962978418, + "learning_rate": 2.2315498714721198e-05, + "loss": 0.1432, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1507023572921753, + "step": 3445, + "valid_targets_mean": 1411.3, + "valid_targets_min": 691 + }, + { + "epoch": 3.6239495798319328, + "grad_norm": 0.7810771746182552, + "learning_rate": 2.2263457032171762e-05, + "loss": 0.1525, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1364845335483551, + "step": 3450, + "valid_targets_mean": 1252.6, + "valid_targets_min": 721 + }, + { + "epoch": 3.629201680672269, + "grad_norm": 0.7854800292698711, + "learning_rate": 2.2211399820616154e-05, + "loss": 0.1548, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15126636624336243, + "step": 3455, + "valid_targets_mean": 1422.4, + "valid_targets_min": 727 + }, + { + "epoch": 3.634453781512605, + "grad_norm": 0.7420584859304036, + "learning_rate": 2.2159327437205733e-05, + "loss": 0.1575, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14271925389766693, + "step": 3460, + "valid_targets_mean": 1345.2, + "valid_targets_min": 681 + }, + { + "epoch": 3.639705882352941, + "grad_norm": 0.7964739958712432, + "learning_rate": 2.210724023919595e-05, + "loss": 0.1527, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16524961590766907, + "step": 3465, + "valid_targets_mean": 1557.1, + "valid_targets_min": 814 + }, + { + "epoch": 3.6449579831932772, + "grad_norm": 0.737091402225577, + "learning_rate": 2.205513858394389e-05, + "loss": 0.1525, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16383059322834015, + "step": 3470, + "valid_targets_mean": 1626.4, + "valid_targets_min": 832 + }, + { + "epoch": 3.6502100840336134, + "grad_norm": 0.7022804917492798, + "learning_rate": 2.2003022828905832e-05, + "loss": 0.1504, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14327232539653778, + "step": 3475, + "valid_targets_mean": 1605.8, + "valid_targets_min": 891 + }, + { + "epoch": 3.6554621848739495, + "grad_norm": 0.9525205693478359, + "learning_rate": 2.19508933316348e-05, + "loss": 0.1504, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15683533251285553, + "step": 3480, + "valid_targets_mean": 1267.2, + "valid_targets_min": 621 + }, + { + "epoch": 3.6607142857142856, + "grad_norm": 0.76863394644955, + "learning_rate": 2.189875044977808e-05, + "loss": 0.1386, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12910358607769012, + "step": 3485, + "valid_targets_mean": 1270.9, + "valid_targets_min": 704 + }, + { + "epoch": 3.6659663865546217, + "grad_norm": 0.8107277676634275, + "learning_rate": 2.1846594541074796e-05, + "loss": 0.1515, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15735816955566406, + "step": 3490, + "valid_targets_mean": 1564.4, + "valid_targets_min": 872 + }, + { + "epoch": 3.671218487394958, + "grad_norm": 0.8063598539952364, + "learning_rate": 2.179442596335345e-05, + "loss": 0.1422, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13597534596920013, + "step": 3495, + "valid_targets_mean": 1323.2, + "valid_targets_min": 584 + }, + { + "epoch": 3.6764705882352944, + "grad_norm": 0.7114116421864716, + "learning_rate": 2.174224507452945e-05, + "loss": 0.149, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1412769854068756, + "step": 3500, + "valid_targets_mean": 1568.7, + "valid_targets_min": 999 + }, + { + "epoch": 3.68172268907563, + "grad_norm": 0.9027372835508958, + "learning_rate": 2.1690052232602677e-05, + "loss": 0.1554, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17291805148124695, + "step": 3505, + "valid_targets_mean": 1610.1, + "valid_targets_min": 750 + }, + { + "epoch": 3.6869747899159666, + "grad_norm": 0.7921785974495511, + "learning_rate": 2.1637847795655022e-05, + "loss": 0.1454, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13400542736053467, + "step": 3510, + "valid_targets_mean": 1269.1, + "valid_targets_min": 613 + }, + { + "epoch": 3.6922268907563023, + "grad_norm": 0.7595580625561714, + "learning_rate": 2.1585632121847925e-05, + "loss": 0.1481, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14459824562072754, + "step": 3515, + "valid_targets_mean": 1640.6, + "valid_targets_min": 768 + }, + { + "epoch": 3.697478991596639, + "grad_norm": 0.8461026963697874, + "learning_rate": 2.153340556941991e-05, + "loss": 0.1452, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13768309354782104, + "step": 3520, + "valid_targets_mean": 1270.5, + "valid_targets_min": 700 + }, + { + "epoch": 3.7027310924369745, + "grad_norm": 0.8139291786249493, + "learning_rate": 2.1481168496684145e-05, + "loss": 0.153, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13502518832683563, + "step": 3525, + "valid_targets_mean": 1266.8, + "valid_targets_min": 800 + }, + { + "epoch": 3.707983193277311, + "grad_norm": 0.7773733165903327, + "learning_rate": 2.142892126202597e-05, + "loss": 0.1434, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14710843563079834, + "step": 3530, + "valid_targets_mean": 1562.7, + "valid_targets_min": 843 + }, + { + "epoch": 3.713235294117647, + "grad_norm": 0.8540100911584824, + "learning_rate": 2.137666422390045e-05, + "loss": 0.143, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14058175683021545, + "step": 3535, + "valid_targets_mean": 1169.9, + "valid_targets_min": 746 + }, + { + "epoch": 3.7184873949579833, + "grad_norm": 0.8192520728614282, + "learning_rate": 2.132439774082991e-05, + "loss": 0.1351, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.136886328458786, + "step": 3540, + "valid_targets_mean": 1270.4, + "valid_targets_min": 772 + }, + { + "epoch": 3.7237394957983194, + "grad_norm": 0.7591394569870296, + "learning_rate": 2.1272122171401467e-05, + "loss": 0.1438, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12614212930202484, + "step": 3545, + "valid_targets_mean": 1218.7, + "valid_targets_min": 619 + }, + { + "epoch": 3.7289915966386555, + "grad_norm": 0.8033788971182879, + "learning_rate": 2.1219837874264573e-05, + "loss": 0.1497, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14868700504302979, + "step": 3550, + "valid_targets_mean": 1416.0, + "valid_targets_min": 734 + }, + { + "epoch": 3.7342436974789917, + "grad_norm": 0.7186280622481173, + "learning_rate": 2.116754520812857e-05, + "loss": 0.1436, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14419475197792053, + "step": 3555, + "valid_targets_mean": 1500.3, + "valid_targets_min": 831 + }, + { + "epoch": 3.7394957983193278, + "grad_norm": 0.8001515867898759, + "learning_rate": 2.111524453176022e-05, + "loss": 0.1483, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14432606101036072, + "step": 3560, + "valid_targets_mean": 1469.2, + "valid_targets_min": 722 + }, + { + "epoch": 3.744747899159664, + "grad_norm": 0.7937436890534154, + "learning_rate": 2.1062936203981227e-05, + "loss": 0.1449, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1394154131412506, + "step": 3565, + "valid_targets_mean": 1317.1, + "valid_targets_min": 711 + }, + { + "epoch": 3.75, + "grad_norm": 0.768116550112638, + "learning_rate": 2.10106205836658e-05, + "loss": 0.1398, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13312450051307678, + "step": 3570, + "valid_targets_mean": 1313.2, + "valid_targets_min": 733 + }, + { + "epoch": 3.755252100840336, + "grad_norm": 0.8277161948796012, + "learning_rate": 2.095829802973817e-05, + "loss": 0.1449, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15327024459838867, + "step": 3575, + "valid_targets_mean": 1500.1, + "valid_targets_min": 931 + }, + { + "epoch": 3.7605042016806722, + "grad_norm": 0.7538438394237286, + "learning_rate": 2.090596890117016e-05, + "loss": 0.1515, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14686134457588196, + "step": 3580, + "valid_targets_mean": 1631.1, + "valid_targets_min": 1011 + }, + { + "epoch": 3.7657563025210083, + "grad_norm": 0.8173261031285455, + "learning_rate": 2.0853633556978674e-05, + "loss": 0.1542, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14837123453617096, + "step": 3585, + "valid_targets_mean": 1393.4, + "valid_targets_min": 748 + }, + { + "epoch": 3.7710084033613445, + "grad_norm": 0.8094111718458211, + "learning_rate": 2.0801292356223265e-05, + "loss": 0.1419, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14551788568496704, + "step": 3590, + "valid_targets_mean": 1533.6, + "valid_targets_min": 699 + }, + { + "epoch": 3.7762605042016806, + "grad_norm": 0.9683838865909208, + "learning_rate": 2.0748945658003695e-05, + "loss": 0.1363, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13133487105369568, + "step": 3595, + "valid_targets_mean": 1311.3, + "valid_targets_min": 534 + }, + { + "epoch": 3.7815126050420167, + "grad_norm": 0.7858949321807766, + "learning_rate": 2.0696593821457392e-05, + "loss": 0.149, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13803954422473907, + "step": 3600, + "valid_targets_mean": 1410.7, + "valid_targets_min": 687 + }, + { + "epoch": 3.786764705882353, + "grad_norm": 0.7682170107004075, + "learning_rate": 2.064423720575709e-05, + "loss": 0.1444, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1322372555732727, + "step": 3605, + "valid_targets_mean": 1287.4, + "valid_targets_min": 549 + }, + { + "epoch": 3.792016806722689, + "grad_norm": 0.785944883857896, + "learning_rate": 2.0591876170108257e-05, + "loss": 0.1397, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13903062045574188, + "step": 3610, + "valid_targets_mean": 1356.6, + "valid_targets_min": 725 + }, + { + "epoch": 3.7972689075630255, + "grad_norm": 1.0766948059764874, + "learning_rate": 2.0539511073746743e-05, + "loss": 0.1395, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1596774160861969, + "step": 3615, + "valid_targets_mean": 1579.2, + "valid_targets_min": 852 + }, + { + "epoch": 3.802521008403361, + "grad_norm": 0.8802148487961788, + "learning_rate": 2.0487142275936213e-05, + "loss": 0.1496, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1571769416332245, + "step": 3620, + "valid_targets_mean": 1478.4, + "valid_targets_min": 978 + }, + { + "epoch": 3.8077731092436977, + "grad_norm": 0.9017272636806979, + "learning_rate": 2.0434770135965743e-05, + "loss": 0.1523, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1524774432182312, + "step": 3625, + "valid_targets_mean": 1463.6, + "valid_targets_min": 545 + }, + { + "epoch": 3.8130252100840334, + "grad_norm": 0.794244937697772, + "learning_rate": 2.0382395013147347e-05, + "loss": 0.1458, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15117822587490082, + "step": 3630, + "valid_targets_mean": 1314.1, + "valid_targets_min": 622 + }, + { + "epoch": 3.81827731092437, + "grad_norm": 0.683828437827683, + "learning_rate": 2.033001726681349e-05, + "loss": 0.1479, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17605149745941162, + "step": 3635, + "valid_targets_mean": 1785.9, + "valid_targets_min": 849 + }, + { + "epoch": 3.8235294117647056, + "grad_norm": 0.8701621923894823, + "learning_rate": 2.027763725631463e-05, + "loss": 0.1445, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1420620083808899, + "step": 3640, + "valid_targets_mean": 1337.8, + "valid_targets_min": 612 + }, + { + "epoch": 3.828781512605042, + "grad_norm": 0.8336992892361698, + "learning_rate": 2.0225255341016794e-05, + "loss": 0.1437, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13892850279808044, + "step": 3645, + "valid_targets_mean": 1443.2, + "valid_targets_min": 673 + }, + { + "epoch": 3.8340336134453783, + "grad_norm": 0.8497904024804793, + "learning_rate": 2.017287188029904e-05, + "loss": 0.14, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14770525693893433, + "step": 3650, + "valid_targets_mean": 1358.2, + "valid_targets_min": 746 + }, + { + "epoch": 3.8392857142857144, + "grad_norm": 0.7320787153441641, + "learning_rate": 2.0120487233551035e-05, + "loss": 0.1391, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13209758698940277, + "step": 3655, + "valid_targets_mean": 1293.9, + "valid_targets_min": 672 + }, + { + "epoch": 3.8445378151260505, + "grad_norm": 0.8025485910991912, + "learning_rate": 2.006810176017059e-05, + "loss": 0.1343, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1370171755552292, + "step": 3660, + "valid_targets_mean": 1362.8, + "valid_targets_min": 670 + }, + { + "epoch": 3.8497899159663866, + "grad_norm": 0.7870212464053592, + "learning_rate": 2.0015715819561205e-05, + "loss": 0.147, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1440301537513733, + "step": 3665, + "valid_targets_mean": 1569.8, + "valid_targets_min": 647 + }, + { + "epoch": 3.8550420168067228, + "grad_norm": 0.7590451152844765, + "learning_rate": 1.9963329771129558e-05, + "loss": 0.1425, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12877610325813293, + "step": 3670, + "valid_targets_mean": 1300.3, + "valid_targets_min": 613 + }, + { + "epoch": 3.860294117647059, + "grad_norm": 0.8086227373232483, + "learning_rate": 1.9910943974283066e-05, + "loss": 0.1416, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13503482937812805, + "step": 3675, + "valid_targets_mean": 1306.6, + "valid_targets_min": 746 + }, + { + "epoch": 3.865546218487395, + "grad_norm": 0.7360884641253568, + "learning_rate": 1.9858558788427447e-05, + "loss": 0.1456, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1362096667289734, + "step": 3680, + "valid_targets_mean": 1580.3, + "valid_targets_min": 892 + }, + { + "epoch": 3.870798319327731, + "grad_norm": 0.8447821850921354, + "learning_rate": 1.9806174572964205e-05, + "loss": 0.1497, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15582120418548584, + "step": 3685, + "valid_targets_mean": 1388.9, + "valid_targets_min": 635 + }, + { + "epoch": 3.8760504201680672, + "grad_norm": 0.7698208399307699, + "learning_rate": 1.975379168728819e-05, + "loss": 0.1404, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1433495581150055, + "step": 3690, + "valid_targets_mean": 1522.7, + "valid_targets_min": 636 + }, + { + "epoch": 3.8813025210084033, + "grad_norm": 0.8559947536872534, + "learning_rate": 1.9701410490785128e-05, + "loss": 0.1434, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15050233900547028, + "step": 3695, + "valid_targets_mean": 1404.7, + "valid_targets_min": 641 + }, + { + "epoch": 3.8865546218487395, + "grad_norm": 0.8384924745171093, + "learning_rate": 1.9649031342829178e-05, + "loss": 0.1449, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14834997057914734, + "step": 3700, + "valid_targets_mean": 1505.6, + "valid_targets_min": 818 + }, + { + "epoch": 3.8918067226890756, + "grad_norm": 0.904316575159625, + "learning_rate": 1.9596654602780398e-05, + "loss": 0.1418, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14717188477516174, + "step": 3705, + "valid_targets_mean": 1389.2, + "valid_targets_min": 625 + }, + { + "epoch": 3.8970588235294117, + "grad_norm": 0.8089593091562093, + "learning_rate": 1.9544280629982364e-05, + "loss": 0.1507, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16768889129161835, + "step": 3710, + "valid_targets_mean": 1636.1, + "valid_targets_min": 888 + }, + { + "epoch": 3.902310924369748, + "grad_norm": 1.1385386317837363, + "learning_rate": 1.949190978375966e-05, + "loss": 0.151, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1377800554037094, + "step": 3715, + "valid_targets_mean": 1567.6, + "valid_targets_min": 908 + }, + { + "epoch": 3.907563025210084, + "grad_norm": 0.7625175757891974, + "learning_rate": 1.9439542423415413e-05, + "loss": 0.1456, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1343471109867096, + "step": 3720, + "valid_targets_mean": 1259.7, + "valid_targets_min": 522 + }, + { + "epoch": 3.91281512605042, + "grad_norm": 0.7881066764674685, + "learning_rate": 1.9387178908228838e-05, + "loss": 0.1505, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1399286389350891, + "step": 3725, + "valid_targets_mean": 1342.3, + "valid_targets_min": 730 + }, + { + "epoch": 3.918067226890756, + "grad_norm": 0.7975143538194005, + "learning_rate": 1.933481959745276e-05, + "loss": 0.1378, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13079893589019775, + "step": 3730, + "valid_targets_mean": 1350.1, + "valid_targets_min": 869 + }, + { + "epoch": 3.9233193277310923, + "grad_norm": 0.7958077340565655, + "learning_rate": 1.9282464850311184e-05, + "loss": 0.1418, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14043010771274567, + "step": 3735, + "valid_targets_mean": 1477.9, + "valid_targets_min": 769 + }, + { + "epoch": 3.928571428571429, + "grad_norm": 0.8357581182064178, + "learning_rate": 1.9230115025996764e-05, + "loss": 0.1489, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13817790150642395, + "step": 3740, + "valid_targets_mean": 1340.2, + "valid_targets_min": 716 + }, + { + "epoch": 3.9338235294117645, + "grad_norm": 0.7898072090831375, + "learning_rate": 1.9177770483668416e-05, + "loss": 0.1404, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13853862881660461, + "step": 3745, + "valid_targets_mean": 1375.1, + "valid_targets_min": 707 + }, + { + "epoch": 3.939075630252101, + "grad_norm": 0.8156265634718887, + "learning_rate": 1.912543158244881e-05, + "loss": 0.1368, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13628491759300232, + "step": 3750, + "valid_targets_mean": 1429.2, + "valid_targets_min": 964 + }, + { + "epoch": 3.9443277310924367, + "grad_norm": 0.8498119635524579, + "learning_rate": 1.9073098681421895e-05, + "loss": 0.1494, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17182615399360657, + "step": 3755, + "valid_targets_mean": 1610.7, + "valid_targets_min": 793 + }, + { + "epoch": 3.9495798319327733, + "grad_norm": 0.7982935292914652, + "learning_rate": 1.902077213963048e-05, + "loss": 0.1466, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1300593912601471, + "step": 3760, + "valid_targets_mean": 1399.4, + "valid_targets_min": 727 + }, + { + "epoch": 3.9548319327731094, + "grad_norm": 0.7854022510245628, + "learning_rate": 1.896845231607372e-05, + "loss": 0.1389, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13969582319259644, + "step": 3765, + "valid_targets_mean": 1396.2, + "valid_targets_min": 734 + }, + { + "epoch": 3.9600840336134455, + "grad_norm": 0.5894392686560074, + "learning_rate": 1.8916139569704704e-05, + "loss": 0.1356, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10743817687034607, + "step": 3770, + "valid_targets_mean": 2173.6, + "valid_targets_min": 917 + }, + { + "epoch": 3.9653361344537816, + "grad_norm": 0.7395136244392762, + "learning_rate": 1.886383425942795e-05, + "loss": 0.1304, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1325417160987854, + "step": 3775, + "valid_targets_mean": 1583.9, + "valid_targets_min": 930 + }, + { + "epoch": 3.9705882352941178, + "grad_norm": 0.7865246777578737, + "learning_rate": 1.8811536744096956e-05, + "loss": 0.1425, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13856448233127594, + "step": 3780, + "valid_targets_mean": 1454.1, + "valid_targets_min": 570 + }, + { + "epoch": 3.975840336134454, + "grad_norm": 0.7942309792805228, + "learning_rate": 1.8759247382511748e-05, + "loss": 0.1395, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14219339191913605, + "step": 3785, + "valid_targets_mean": 1557.5, + "valid_targets_min": 870 + }, + { + "epoch": 3.98109243697479, + "grad_norm": 0.8125974018026644, + "learning_rate": 1.8706966533416413e-05, + "loss": 0.1386, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14180970191955566, + "step": 3790, + "valid_targets_mean": 1599.9, + "valid_targets_min": 1070 + }, + { + "epoch": 3.986344537815126, + "grad_norm": 0.7872308732821972, + "learning_rate": 1.8654694555496624e-05, + "loss": 0.138, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15511301159858704, + "step": 3795, + "valid_targets_mean": 1596.4, + "valid_targets_min": 626 + }, + { + "epoch": 3.991596638655462, + "grad_norm": 0.8264202266884269, + "learning_rate": 1.860243180737721e-05, + "loss": 0.1378, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13887375593185425, + "step": 3800, + "valid_targets_mean": 1423.5, + "valid_targets_min": 718 + }, + { + "epoch": 3.9968487394957983, + "grad_norm": 0.8547785642731142, + "learning_rate": 1.8550178647619664e-05, + "loss": 0.1445, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14218434691429138, + "step": 3805, + "valid_targets_mean": 1343.2, + "valid_targets_min": 646 + }, + { + "epoch": 4.0021008403361344, + "grad_norm": 0.9794746439498689, + "learning_rate": 1.84979354347197e-05, + "loss": 0.1849, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2445564717054367, + "step": 3810, + "valid_targets_mean": 3945.9, + "valid_targets_min": 1698 + }, + { + "epoch": 4.007352941176471, + "grad_norm": 0.6295029416310093, + "learning_rate": 1.8445702527104782e-05, + "loss": 0.2336, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21728411316871643, + "step": 3815, + "valid_targets_mean": 3601.0, + "valid_targets_min": 981 + }, + { + "epoch": 4.012605042016807, + "grad_norm": 0.6261229756084788, + "learning_rate": 1.8393480283131677e-05, + "loss": 0.2318, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2355230748653412, + "step": 3820, + "valid_targets_mean": 3562.5, + "valid_targets_min": 835 + }, + { + "epoch": 4.017857142857143, + "grad_norm": 0.5498474690761935, + "learning_rate": 1.8341269061083996e-05, + "loss": 0.2298, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23167270421981812, + "step": 3825, + "valid_targets_mean": 4304.1, + "valid_targets_min": 1201 + }, + { + "epoch": 4.023109243697479, + "grad_norm": 0.593694354846493, + "learning_rate": 1.8289069219169717e-05, + "loss": 0.216, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22287964820861816, + "step": 3830, + "valid_targets_mean": 3669.4, + "valid_targets_min": 980 + }, + { + "epoch": 4.0283613445378155, + "grad_norm": 0.6618298739900584, + "learning_rate": 1.8236881115518766e-05, + "loss": 0.2384, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2557893693447113, + "step": 3835, + "valid_targets_mean": 4120.9, + "valid_targets_min": 1512 + }, + { + "epoch": 4.033613445378151, + "grad_norm": 0.6142046700506524, + "learning_rate": 1.8184705108180516e-05, + "loss": 0.2077, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2090051770210266, + "step": 3840, + "valid_targets_mean": 3758.4, + "valid_targets_min": 1734 + }, + { + "epoch": 4.038865546218488, + "grad_norm": 0.5794721395589425, + "learning_rate": 1.8132541555121353e-05, + "loss": 0.2284, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2171669602394104, + "step": 3845, + "valid_targets_mean": 4416.4, + "valid_targets_min": 1381 + }, + { + "epoch": 4.044117647058823, + "grad_norm": 0.5873970760320343, + "learning_rate": 1.808039081422223e-05, + "loss": 0.2267, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23693841695785522, + "step": 3850, + "valid_targets_mean": 3650.9, + "valid_targets_min": 1024 + }, + { + "epoch": 4.04936974789916, + "grad_norm": 0.6544469337267305, + "learning_rate": 1.802825324327618e-05, + "loss": 0.2364, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22341692447662354, + "step": 3855, + "valid_targets_mean": 3792.1, + "valid_targets_min": 2107 + }, + { + "epoch": 4.054621848739496, + "grad_norm": 0.6368703549214123, + "learning_rate": 1.7976129199985886e-05, + "loss": 0.2273, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.216568723320961, + "step": 3860, + "valid_targets_mean": 3349.4, + "valid_targets_min": 802 + }, + { + "epoch": 4.059873949579832, + "grad_norm": 0.6024180533305669, + "learning_rate": 1.7924019041961228e-05, + "loss": 0.2282, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22188133001327515, + "step": 3865, + "valid_targets_mean": 3829.7, + "valid_targets_min": 1597 + }, + { + "epoch": 4.065126050420168, + "grad_norm": 0.6323374001658106, + "learning_rate": 1.7871923126716827e-05, + "loss": 0.2319, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21390947699546814, + "step": 3870, + "valid_targets_mean": 2841.6, + "valid_targets_min": 1535 + }, + { + "epoch": 4.070378151260504, + "grad_norm": 0.5926408570492498, + "learning_rate": 1.7819841811669573e-05, + "loss": 0.2226, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23295366764068604, + "step": 3875, + "valid_targets_mean": 4229.0, + "valid_targets_min": 1385 + }, + { + "epoch": 4.07563025210084, + "grad_norm": 0.6456267570500575, + "learning_rate": 1.7767775454136194e-05, + "loss": 0.2314, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24474671483039856, + "step": 3880, + "valid_targets_mean": 3543.5, + "valid_targets_min": 1451 + }, + { + "epoch": 4.080882352941177, + "grad_norm": 0.7628071822726314, + "learning_rate": 1.7715724411330806e-05, + "loss": 0.2372, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2485944777727127, + "step": 3885, + "valid_targets_mean": 2809.7, + "valid_targets_min": 1269 + }, + { + "epoch": 4.086134453781512, + "grad_norm": 0.6699354098606171, + "learning_rate": 1.7663689040362446e-05, + "loss": 0.2262, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23240669071674347, + "step": 3890, + "valid_targets_mean": 2924.8, + "valid_targets_min": 935 + }, + { + "epoch": 4.091386554621849, + "grad_norm": 0.6582143455705185, + "learning_rate": 1.761166969823262e-05, + "loss": 0.2376, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2368423342704773, + "step": 3895, + "valid_targets_mean": 3029.1, + "valid_targets_min": 1695 + }, + { + "epoch": 4.0966386554621845, + "grad_norm": 0.7189637917203952, + "learning_rate": 1.7559666741832896e-05, + "loss": 0.2321, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2396736443042755, + "step": 3900, + "valid_targets_mean": 3217.1, + "valid_targets_min": 671 + }, + { + "epoch": 4.101890756302521, + "grad_norm": 0.651225210749888, + "learning_rate": 1.750768052794239e-05, + "loss": 0.2289, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23836606740951538, + "step": 3905, + "valid_targets_mean": 3716.9, + "valid_targets_min": 1020 + }, + { + "epoch": 4.107142857142857, + "grad_norm": 0.6518633827861082, + "learning_rate": 1.7455711413225372e-05, + "loss": 0.2251, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.233098566532135, + "step": 3910, + "valid_targets_mean": 3237.8, + "valid_targets_min": 1889 + }, + { + "epoch": 4.112394957983193, + "grad_norm": 0.6876543636905016, + "learning_rate": 1.7403759754228794e-05, + "loss": 0.2211, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22473348677158356, + "step": 3915, + "valid_targets_mean": 2959.4, + "valid_targets_min": 1385 + }, + { + "epoch": 4.117647058823529, + "grad_norm": 0.7187642767454995, + "learning_rate": 1.7351825907379837e-05, + "loss": 0.2268, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25105470418930054, + "step": 3920, + "valid_targets_mean": 3390.4, + "valid_targets_min": 1588 + }, + { + "epoch": 4.1228991596638656, + "grad_norm": 0.6768076603434932, + "learning_rate": 1.7299910228983513e-05, + "loss": 0.2292, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23110558092594147, + "step": 3925, + "valid_targets_mean": 3135.2, + "valid_targets_min": 699 + }, + { + "epoch": 4.128151260504202, + "grad_norm": 0.6753396109242978, + "learning_rate": 1.7248013075220128e-05, + "loss": 0.2302, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22585970163345337, + "step": 3930, + "valid_targets_mean": 2970.0, + "valid_targets_min": 648 + }, + { + "epoch": 4.133403361344538, + "grad_norm": 0.6444337615377012, + "learning_rate": 1.7196134802142945e-05, + "loss": 0.225, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2224642038345337, + "step": 3935, + "valid_targets_mean": 3744.2, + "valid_targets_min": 1934 + }, + { + "epoch": 4.138655462184874, + "grad_norm": 0.6792362480524322, + "learning_rate": 1.7144275765675673e-05, + "loss": 0.2255, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23104789853096008, + "step": 3940, + "valid_targets_mean": 3753.4, + "valid_targets_min": 863 + }, + { + "epoch": 4.14390756302521, + "grad_norm": 0.6240116424894049, + "learning_rate": 1.7092436321610042e-05, + "loss": 0.2203, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2116166055202484, + "step": 3945, + "valid_targets_mean": 3309.5, + "valid_targets_min": 1410 + }, + { + "epoch": 4.149159663865547, + "grad_norm": 0.6706279698577615, + "learning_rate": 1.704061682560336e-05, + "loss": 0.23, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25118085741996765, + "step": 3950, + "valid_targets_mean": 4311.5, + "valid_targets_min": 2040 + }, + { + "epoch": 4.154411764705882, + "grad_norm": 0.7103731685784668, + "learning_rate": 1.698881763317609e-05, + "loss": 0.2221, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23094293475151062, + "step": 3955, + "valid_targets_mean": 2688.4, + "valid_targets_min": 1458 + }, + { + "epoch": 4.159663865546219, + "grad_norm": 0.6553558995778831, + "learning_rate": 1.69370390997094e-05, + "loss": 0.2234, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2209138721227646, + "step": 3960, + "valid_targets_mean": 3155.8, + "valid_targets_min": 1110 + }, + { + "epoch": 4.1649159663865545, + "grad_norm": 0.6997001621889637, + "learning_rate": 1.6885281580442677e-05, + "loss": 0.2202, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22238752245903015, + "step": 3965, + "valid_targets_mean": 2572.8, + "valid_targets_min": 513 + }, + { + "epoch": 4.170168067226891, + "grad_norm": 2.385982583274398, + "learning_rate": 1.6833545430471194e-05, + "loss": 0.225, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2642630636692047, + "step": 3970, + "valid_targets_mean": 2760.3, + "valid_targets_min": 1636 + }, + { + "epoch": 4.175420168067227, + "grad_norm": 0.6281184165319054, + "learning_rate": 1.678183100474359e-05, + "loss": 0.226, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23373137414455414, + "step": 3975, + "valid_targets_mean": 3912.6, + "valid_targets_min": 1801 + }, + { + "epoch": 4.180672268907563, + "grad_norm": 0.7646111653644774, + "learning_rate": 1.6730138658059448e-05, + "loss": 0.2232, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2311634123325348, + "step": 3980, + "valid_targets_mean": 3197.1, + "valid_targets_min": 924 + }, + { + "epoch": 4.185924369747899, + "grad_norm": 0.7085277743946552, + "learning_rate": 1.667846874506689e-05, + "loss": 0.2264, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2161899358034134, + "step": 3985, + "valid_targets_mean": 2886.2, + "valid_targets_min": 1401 + }, + { + "epoch": 4.1911764705882355, + "grad_norm": 0.7229719956908336, + "learning_rate": 1.662682162026012e-05, + "loss": 0.2322, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24561478197574615, + "step": 3990, + "valid_targets_mean": 3041.9, + "valid_targets_min": 1265 + }, + { + "epoch": 4.196428571428571, + "grad_norm": 0.6233236849228904, + "learning_rate": 1.6575197637976995e-05, + "loss": 0.2102, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20357422530651093, + "step": 3995, + "valid_targets_mean": 3318.8, + "valid_targets_min": 1648 + }, + { + "epoch": 4.201680672268908, + "grad_norm": 0.684658245418384, + "learning_rate": 1.652359715239661e-05, + "loss": 0.2252, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21792471408843994, + "step": 4000, + "valid_targets_mean": 3989.8, + "valid_targets_min": 1844 + }, + { + "epoch": 4.206932773109243, + "grad_norm": 0.6398769831531746, + "learning_rate": 1.6472020517536828e-05, + "loss": 0.2161, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2144005000591278, + "step": 4005, + "valid_targets_mean": 3636.7, + "valid_targets_min": 1261 + }, + { + "epoch": 4.21218487394958, + "grad_norm": 0.7341420848535544, + "learning_rate": 1.6420468087251907e-05, + "loss": 0.2205, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20942559838294983, + "step": 4010, + "valid_targets_mean": 3165.4, + "valid_targets_min": 1294 + }, + { + "epoch": 4.217436974789916, + "grad_norm": 0.7202011687730974, + "learning_rate": 1.6368940215230026e-05, + "loss": 0.2235, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24036064743995667, + "step": 4015, + "valid_targets_mean": 3169.3, + "valid_targets_min": 1432 + }, + { + "epoch": 4.222689075630252, + "grad_norm": 0.6828224156387892, + "learning_rate": 1.6317437254990875e-05, + "loss": 0.218, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23701542615890503, + "step": 4020, + "valid_targets_mean": 3107.8, + "valid_targets_min": 742 + }, + { + "epoch": 4.227941176470588, + "grad_norm": 0.6787140516821543, + "learning_rate": 1.626595955988325e-05, + "loss": 0.2258, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21809794008731842, + "step": 4025, + "valid_targets_mean": 3005.8, + "valid_targets_min": 988 + }, + { + "epoch": 4.233193277310924, + "grad_norm": 0.7166611868537497, + "learning_rate": 1.6214507483082593e-05, + "loss": 0.2252, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.233636736869812, + "step": 4030, + "valid_targets_mean": 3192.8, + "valid_targets_min": 654 + }, + { + "epoch": 4.23844537815126, + "grad_norm": 0.6756135280787572, + "learning_rate": 1.6163081377588588e-05, + "loss": 0.209, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22536295652389526, + "step": 4035, + "valid_targets_mean": 3349.0, + "valid_targets_min": 1328 + }, + { + "epoch": 4.243697478991597, + "grad_norm": 0.6733677254055387, + "learning_rate": 1.6111681596222732e-05, + "loss": 0.2174, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2062094807624817, + "step": 4040, + "valid_targets_mean": 3037.0, + "valid_targets_min": 1302 + }, + { + "epoch": 4.248949579831933, + "grad_norm": 0.7009721818052325, + "learning_rate": 1.606030849162593e-05, + "loss": 0.2173, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2229950726032257, + "step": 4045, + "valid_targets_mean": 3635.6, + "valid_targets_min": 1701 + }, + { + "epoch": 4.254201680672269, + "grad_norm": 0.6661284889755613, + "learning_rate": 1.600896241625605e-05, + "loss": 0.2136, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22747060656547546, + "step": 4050, + "valid_targets_mean": 3422.1, + "valid_targets_min": 1319 + }, + { + "epoch": 4.2594537815126055, + "grad_norm": 0.6094686088609381, + "learning_rate": 1.5957643722385532e-05, + "loss": 0.2019, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21023216843605042, + "step": 4055, + "valid_targets_mean": 3806.1, + "valid_targets_min": 1194 + }, + { + "epoch": 4.264705882352941, + "grad_norm": 0.6259994730524294, + "learning_rate": 1.590635276209896e-05, + "loss": 0.2292, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20072561502456665, + "step": 4060, + "valid_targets_mean": 3004.6, + "valid_targets_min": 1453 + }, + { + "epoch": 4.269957983193278, + "grad_norm": 0.5928071676270973, + "learning_rate": 1.5855089887290634e-05, + "loss": 0.2154, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2144814431667328, + "step": 4065, + "valid_targets_mean": 3975.1, + "valid_targets_min": 1743 + }, + { + "epoch": 4.275210084033613, + "grad_norm": 0.7034766602053386, + "learning_rate": 1.5803855449662175e-05, + "loss": 0.2244, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23000982403755188, + "step": 4070, + "valid_targets_mean": 3192.5, + "valid_targets_min": 1234 + }, + { + "epoch": 4.28046218487395, + "grad_norm": 0.6797161663877974, + "learning_rate": 1.5752649800720096e-05, + "loss": 0.232, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2336946427822113, + "step": 4075, + "valid_targets_mean": 3073.8, + "valid_targets_min": 1188 + }, + { + "epoch": 4.285714285714286, + "grad_norm": 0.5845573966663017, + "learning_rate": 1.5701473291773395e-05, + "loss": 0.2252, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2029433399438858, + "step": 4080, + "valid_targets_mean": 3894.5, + "valid_targets_min": 618 + }, + { + "epoch": 4.290966386554622, + "grad_norm": 0.9566677599879087, + "learning_rate": 1.5650326273931166e-05, + "loss": 0.2134, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21042492985725403, + "step": 4085, + "valid_targets_mean": 3189.6, + "valid_targets_min": 1364 + }, + { + "epoch": 4.296218487394958, + "grad_norm": 0.6929467596600297, + "learning_rate": 1.559920909810016e-05, + "loss": 0.2129, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22422900795936584, + "step": 4090, + "valid_targets_mean": 3735.1, + "valid_targets_min": 1514 + }, + { + "epoch": 4.301470588235294, + "grad_norm": 0.7889834685287505, + "learning_rate": 1.5548122114982393e-05, + "loss": 0.2079, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22729304432868958, + "step": 4095, + "valid_targets_mean": 2972.1, + "valid_targets_min": 1073 + }, + { + "epoch": 4.30672268907563, + "grad_norm": 0.7145190034824895, + "learning_rate": 1.5497065675072728e-05, + "loss": 0.2131, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22352570295333862, + "step": 4100, + "valid_targets_mean": 2926.5, + "valid_targets_min": 1026 + }, + { + "epoch": 4.311974789915967, + "grad_norm": 0.6561593136868893, + "learning_rate": 1.5446040128656485e-05, + "loss": 0.2064, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19251301884651184, + "step": 4105, + "valid_targets_mean": 2859.4, + "valid_targets_min": 857 + }, + { + "epoch": 4.317226890756302, + "grad_norm": 0.6862200086122758, + "learning_rate": 1.539504582580704e-05, + "loss": 0.204, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21139201521873474, + "step": 4110, + "valid_targets_mean": 3083.8, + "valid_targets_min": 720 + }, + { + "epoch": 4.322478991596639, + "grad_norm": 0.776255577609975, + "learning_rate": 1.5344083116383395e-05, + "loss": 0.2201, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24367398023605347, + "step": 4115, + "valid_targets_mean": 3220.5, + "valid_targets_min": 1175 + }, + { + "epoch": 4.3277310924369745, + "grad_norm": 0.6825477266343268, + "learning_rate": 1.529315235002781e-05, + "loss": 0.2168, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20516598224639893, + "step": 4120, + "valid_targets_mean": 3000.1, + "valid_targets_min": 1411 + }, + { + "epoch": 4.332983193277311, + "grad_norm": 0.6569828485036016, + "learning_rate": 1.5242253876163399e-05, + "loss": 0.2167, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2060314565896988, + "step": 4125, + "valid_targets_mean": 3553.2, + "valid_targets_min": 1743 + }, + { + "epoch": 4.338235294117647, + "grad_norm": 0.7319933985960059, + "learning_rate": 1.5191388043991712e-05, + "loss": 0.2178, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2330959588289261, + "step": 4130, + "valid_targets_mean": 3180.8, + "valid_targets_min": 1398 + }, + { + "epoch": 4.343487394957983, + "grad_norm": 0.6718430936496146, + "learning_rate": 1.5140555202490359e-05, + "loss": 0.2108, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20311537384986877, + "step": 4135, + "valid_targets_mean": 3596.6, + "valid_targets_min": 1767 + }, + { + "epoch": 4.348739495798319, + "grad_norm": 0.6541737718826137, + "learning_rate": 1.5089755700410602e-05, + "loss": 0.218, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20354878902435303, + "step": 4140, + "valid_targets_mean": 3805.3, + "valid_targets_min": 1145 + }, + { + "epoch": 4.3539915966386555, + "grad_norm": 0.6642189302688583, + "learning_rate": 1.5038989886274992e-05, + "loss": 0.2104, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2232103943824768, + "step": 4145, + "valid_targets_mean": 3490.6, + "valid_targets_min": 1722 + }, + { + "epoch": 4.359243697478991, + "grad_norm": 0.6521008246137644, + "learning_rate": 1.498825810837492e-05, + "loss": 0.2014, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19541659951210022, + "step": 4150, + "valid_targets_mean": 3157.6, + "valid_targets_min": 1423 + }, + { + "epoch": 4.364495798319328, + "grad_norm": 0.6924321128175812, + "learning_rate": 1.4937560714768283e-05, + "loss": 0.2236, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22630862891674042, + "step": 4155, + "valid_targets_mean": 3276.0, + "valid_targets_min": 1426 + }, + { + "epoch": 4.369747899159664, + "grad_norm": 0.7066936740974944, + "learning_rate": 1.4886898053277086e-05, + "loss": 0.225, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2139957845211029, + "step": 4160, + "valid_targets_mean": 3190.3, + "valid_targets_min": 538 + }, + { + "epoch": 4.375, + "grad_norm": 0.7759687498686932, + "learning_rate": 1.4836270471485029e-05, + "loss": 0.2155, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2279035598039627, + "step": 4165, + "valid_targets_mean": 2498.0, + "valid_targets_min": 537 + }, + { + "epoch": 4.380252100840336, + "grad_norm": 0.6772887664667172, + "learning_rate": 1.4785678316735144e-05, + "loss": 0.2255, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21676117181777954, + "step": 4170, + "valid_targets_mean": 3068.9, + "valid_targets_min": 721 + }, + { + "epoch": 4.385504201680672, + "grad_norm": 0.8980937779941081, + "learning_rate": 1.4735121936127406e-05, + "loss": 0.2121, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24256817996501923, + "step": 4175, + "valid_targets_mean": 3478.7, + "valid_targets_min": 1625 + }, + { + "epoch": 4.390756302521009, + "grad_norm": 0.7329255290185969, + "learning_rate": 1.4684601676516366e-05, + "loss": 0.2311, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2386029064655304, + "step": 4180, + "valid_targets_mean": 3130.2, + "valid_targets_min": 1400 + }, + { + "epoch": 4.3960084033613445, + "grad_norm": 0.7786336588807071, + "learning_rate": 1.4634117884508738e-05, + "loss": 0.214, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19800731539726257, + "step": 4185, + "valid_targets_mean": 3135.8, + "valid_targets_min": 1648 + }, + { + "epoch": 4.401260504201681, + "grad_norm": 0.7631967058787871, + "learning_rate": 1.458367090646105e-05, + "loss": 0.2248, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2008107602596283, + "step": 4190, + "valid_targets_mean": 2437.4, + "valid_targets_min": 648 + }, + { + "epoch": 4.406512605042017, + "grad_norm": 0.7191244352959169, + "learning_rate": 1.4533261088477257e-05, + "loss": 0.2154, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20372244715690613, + "step": 4195, + "valid_targets_mean": 2783.8, + "valid_targets_min": 885 + }, + { + "epoch": 4.411764705882353, + "grad_norm": 0.7150862191687413, + "learning_rate": 1.448288877640637e-05, + "loss": 0.222, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20869606733322144, + "step": 4200, + "valid_targets_mean": 3689.0, + "valid_targets_min": 1325 + }, + { + "epoch": 4.417016806722689, + "grad_norm": 0.716489559808733, + "learning_rate": 1.4432554315840082e-05, + "loss": 0.219, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20727670192718506, + "step": 4205, + "valid_targets_mean": 3362.6, + "valid_targets_min": 953 + }, + { + "epoch": 4.4222689075630255, + "grad_norm": 0.7087446848068543, + "learning_rate": 1.438225805211039e-05, + "loss": 0.2114, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.224325031042099, + "step": 4210, + "valid_targets_mean": 3481.2, + "valid_targets_min": 1592 + }, + { + "epoch": 4.427521008403361, + "grad_norm": 0.6500807963798068, + "learning_rate": 1.4332000330287248e-05, + "loss": 0.2204, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20948271453380585, + "step": 4215, + "valid_targets_mean": 3169.1, + "valid_targets_min": 530 + }, + { + "epoch": 4.432773109243698, + "grad_norm": 0.6730778830395577, + "learning_rate": 1.428178149517617e-05, + "loss": 0.2244, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2134353220462799, + "step": 4220, + "valid_targets_mean": 3418.1, + "valid_targets_min": 1066 + }, + { + "epoch": 4.438025210084033, + "grad_norm": 0.6727213761188319, + "learning_rate": 1.4231601891315876e-05, + "loss": 0.2218, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2243449091911316, + "step": 4225, + "valid_targets_mean": 4071.0, + "valid_targets_min": 1885 + }, + { + "epoch": 4.44327731092437, + "grad_norm": 0.7011377195102847, + "learning_rate": 1.418146186297594e-05, + "loss": 0.2064, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19244351983070374, + "step": 4230, + "valid_targets_mean": 3914.1, + "valid_targets_min": 852 + }, + { + "epoch": 4.448529411764706, + "grad_norm": 0.6685868237134905, + "learning_rate": 1.413136175415441e-05, + "loss": 0.2199, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22170649468898773, + "step": 4235, + "valid_targets_mean": 2790.1, + "valid_targets_min": 1025 + }, + { + "epoch": 4.453781512605042, + "grad_norm": 0.6475753723469297, + "learning_rate": 1.4081301908575457e-05, + "loss": 0.2077, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2239975482225418, + "step": 4240, + "valid_targets_mean": 4196.2, + "valid_targets_min": 1397 + }, + { + "epoch": 4.459033613445378, + "grad_norm": 0.8141488892094502, + "learning_rate": 1.4031282669687035e-05, + "loss": 0.207, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19613388180732727, + "step": 4245, + "valid_targets_mean": 3816.1, + "valid_targets_min": 1920 + }, + { + "epoch": 4.464285714285714, + "grad_norm": 0.6806187299183513, + "learning_rate": 1.3981304380658474e-05, + "loss": 0.2048, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20587432384490967, + "step": 4250, + "valid_targets_mean": 3625.5, + "valid_targets_min": 1687 + }, + { + "epoch": 4.46953781512605, + "grad_norm": 0.7502387892882345, + "learning_rate": 1.3931367384378183e-05, + "loss": 0.2101, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2327464073896408, + "step": 4255, + "valid_targets_mean": 3404.2, + "valid_targets_min": 1210 + }, + { + "epoch": 4.474789915966387, + "grad_norm": 0.6570388636908775, + "learning_rate": 1.3881472023451262e-05, + "loss": 0.201, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1919768750667572, + "step": 4260, + "valid_targets_mean": 3334.3, + "valid_targets_min": 1360 + }, + { + "epoch": 4.480042016806722, + "grad_norm": 0.6969625105218161, + "learning_rate": 1.3831618640197153e-05, + "loss": 0.2051, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21205592155456543, + "step": 4265, + "valid_targets_mean": 3091.5, + "valid_targets_min": 1447 + }, + { + "epoch": 4.485294117647059, + "grad_norm": 0.7307640724228113, + "learning_rate": 1.3781807576647315e-05, + "loss": 0.1982, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.204860657453537, + "step": 4270, + "valid_targets_mean": 2715.1, + "valid_targets_min": 1243 + }, + { + "epoch": 4.4905462184873945, + "grad_norm": 0.7293687135782331, + "learning_rate": 1.373203917454285e-05, + "loss": 0.207, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21605542302131653, + "step": 4275, + "valid_targets_mean": 2944.4, + "valid_targets_min": 897 + }, + { + "epoch": 4.495798319327731, + "grad_norm": 0.7287294839891085, + "learning_rate": 1.3682313775332186e-05, + "loss": 0.2254, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2306896150112152, + "step": 4280, + "valid_targets_mean": 3085.3, + "valid_targets_min": 1312 + }, + { + "epoch": 4.501050420168067, + "grad_norm": 0.6982921140070419, + "learning_rate": 1.3632631720168705e-05, + "loss": 0.2065, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20665548741817474, + "step": 4285, + "valid_targets_mean": 3413.9, + "valid_targets_min": 1469 + }, + { + "epoch": 4.506302521008403, + "grad_norm": 0.7131094152829368, + "learning_rate": 1.358299334990842e-05, + "loss": 0.2055, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2063906341791153, + "step": 4290, + "valid_targets_mean": 2992.4, + "valid_targets_min": 1593 + }, + { + "epoch": 4.51155462184874, + "grad_norm": 0.7372869299957252, + "learning_rate": 1.3533399005107635e-05, + "loss": 0.2104, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22824421525001526, + "step": 4295, + "valid_targets_mean": 3131.6, + "valid_targets_min": 1664 + }, + { + "epoch": 4.516806722689076, + "grad_norm": 0.6346433949828432, + "learning_rate": 1.3483849026020603e-05, + "loss": 0.1992, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19013050198554993, + "step": 4300, + "valid_targets_mean": 3709.5, + "valid_targets_min": 1605 + }, + { + "epoch": 4.522058823529412, + "grad_norm": 0.6754439443280119, + "learning_rate": 1.3434343752597199e-05, + "loss": 0.2258, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22575265169143677, + "step": 4305, + "valid_targets_mean": 3649.6, + "valid_targets_min": 1737 + }, + { + "epoch": 4.527310924369748, + "grad_norm": 0.6967616700028672, + "learning_rate": 1.3384883524480576e-05, + "loss": 0.2156, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22875870764255524, + "step": 4310, + "valid_targets_mean": 3512.8, + "valid_targets_min": 1817 + }, + { + "epoch": 4.532563025210084, + "grad_norm": 0.6886827979081415, + "learning_rate": 1.333546868100486e-05, + "loss": 0.2043, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20903798937797546, + "step": 4315, + "valid_targets_mean": 3413.6, + "valid_targets_min": 2026 + }, + { + "epoch": 4.53781512605042, + "grad_norm": 0.660189404042565, + "learning_rate": 1.3286099561192784e-05, + "loss": 0.207, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21688057482242584, + "step": 4320, + "valid_targets_mean": 3905.8, + "valid_targets_min": 1214 + }, + { + "epoch": 4.543067226890757, + "grad_norm": 0.8043966125939357, + "learning_rate": 1.3236776503753397e-05, + "loss": 0.1721, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14316143095493317, + "step": 4325, + "valid_targets_mean": 1467.6, + "valid_targets_min": 715 + }, + { + "epoch": 4.548319327731092, + "grad_norm": 0.7841054688198438, + "learning_rate": 1.3187499847079713e-05, + "loss": 0.1451, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14375540614128113, + "step": 4330, + "valid_targets_mean": 1573.2, + "valid_targets_min": 725 + }, + { + "epoch": 4.553571428571429, + "grad_norm": 0.8186335723421362, + "learning_rate": 1.3138269929246427e-05, + "loss": 0.1396, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15070709586143494, + "step": 4335, + "valid_targets_mean": 1469.3, + "valid_targets_min": 714 + }, + { + "epoch": 4.5588235294117645, + "grad_norm": 0.8679170015389952, + "learning_rate": 1.308908708800753e-05, + "loss": 0.1393, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14169779419898987, + "step": 4340, + "valid_targets_mean": 1390.9, + "valid_targets_min": 615 + }, + { + "epoch": 4.564075630252101, + "grad_norm": 0.9114994147726516, + "learning_rate": 1.3039951660794063e-05, + "loss": 0.1401, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14317017793655396, + "step": 4345, + "valid_targets_mean": 1436.4, + "valid_targets_min": 715 + }, + { + "epoch": 4.569327731092437, + "grad_norm": 0.8898038163908437, + "learning_rate": 1.2990863984711773e-05, + "loss": 0.1421, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17335724830627441, + "step": 4350, + "valid_targets_mean": 1576.6, + "valid_targets_min": 625 + }, + { + "epoch": 4.574579831932773, + "grad_norm": 0.785064729278413, + "learning_rate": 1.294182439653878e-05, + "loss": 0.1329, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12577390670776367, + "step": 4355, + "valid_targets_mean": 1400.9, + "valid_targets_min": 761 + }, + { + "epoch": 4.579831932773109, + "grad_norm": 0.7745818948625097, + "learning_rate": 1.2892833232723297e-05, + "loss": 0.1444, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21761628985404968, + "step": 4360, + "valid_targets_mean": 1609.2, + "valid_targets_min": 703 + }, + { + "epoch": 4.5850840336134455, + "grad_norm": 0.9711741060616659, + "learning_rate": 1.2843890829381303e-05, + "loss": 0.1307, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14271649718284607, + "step": 4365, + "valid_targets_mean": 1564.4, + "valid_targets_min": 733 + }, + { + "epoch": 4.590336134453781, + "grad_norm": 0.8866160542903732, + "learning_rate": 1.2794997522294263e-05, + "loss": 0.1366, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13775603473186493, + "step": 4370, + "valid_targets_mean": 1521.2, + "valid_targets_min": 835 + }, + { + "epoch": 4.595588235294118, + "grad_norm": 0.8231923650364629, + "learning_rate": 1.2746153646906766e-05, + "loss": 0.1282, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13401484489440918, + "step": 4375, + "valid_targets_mean": 1525.2, + "valid_targets_min": 815 + }, + { + "epoch": 4.600840336134453, + "grad_norm": 0.8550257487811143, + "learning_rate": 1.2697359538324303e-05, + "loss": 0.1316, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13395115733146667, + "step": 4380, + "valid_targets_mean": 1584.4, + "valid_targets_min": 797 + }, + { + "epoch": 4.60609243697479, + "grad_norm": 0.8426859205924878, + "learning_rate": 1.2648615531310907e-05, + "loss": 0.1317, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12041187286376953, + "step": 4385, + "valid_targets_mean": 1384.5, + "valid_targets_min": 570 + }, + { + "epoch": 4.6113445378151265, + "grad_norm": 0.786905654669723, + "learning_rate": 1.259992196028688e-05, + "loss": 0.1232, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11873074620962143, + "step": 4390, + "valid_targets_mean": 1481.8, + "valid_targets_min": 548 + }, + { + "epoch": 4.616596638655462, + "grad_norm": 0.8303948199867104, + "learning_rate": 1.2551279159326495e-05, + "loss": 0.1208, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11647927761077881, + "step": 4395, + "valid_targets_mean": 1247.1, + "valid_targets_min": 682 + }, + { + "epoch": 4.621848739495798, + "grad_norm": 0.8753106179981709, + "learning_rate": 1.2502687462155709e-05, + "loss": 0.1312, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1494443118572235, + "step": 4400, + "valid_targets_mean": 1686.6, + "valid_targets_min": 896 + }, + { + "epoch": 4.6271008403361344, + "grad_norm": 0.8050150714693087, + "learning_rate": 1.2454147202149865e-05, + "loss": 0.1312, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12719589471817017, + "step": 4405, + "valid_targets_mean": 1415.3, + "valid_targets_min": 597 + }, + { + "epoch": 4.632352941176471, + "grad_norm": 0.8009830063907718, + "learning_rate": 1.2405658712331409e-05, + "loss": 0.1342, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12356242537498474, + "step": 4410, + "valid_targets_mean": 1527.1, + "valid_targets_min": 706 + }, + { + "epoch": 4.637605042016807, + "grad_norm": 0.7347334443196466, + "learning_rate": 1.2357222325367604e-05, + "loss": 0.1311, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11749774217605591, + "step": 4415, + "valid_targets_mean": 1439.2, + "valid_targets_min": 754 + }, + { + "epoch": 4.642857142857143, + "grad_norm": 0.8064940468859054, + "learning_rate": 1.2308838373568249e-05, + "loss": 0.1308, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12089011818170547, + "step": 4420, + "valid_targets_mean": 1403.5, + "valid_targets_min": 785 + }, + { + "epoch": 4.648109243697479, + "grad_norm": 0.7972098191885254, + "learning_rate": 1.2260507188883395e-05, + "loss": 0.1317, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12170597910881042, + "step": 4425, + "valid_targets_mean": 1499.6, + "valid_targets_min": 617 + }, + { + "epoch": 4.6533613445378155, + "grad_norm": 0.975037389066893, + "learning_rate": 1.2212229102901077e-05, + "loss": 0.1311, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13412654399871826, + "step": 4430, + "valid_targets_mean": 1218.8, + "valid_targets_min": 648 + }, + { + "epoch": 4.658613445378151, + "grad_norm": 0.8641754817962347, + "learning_rate": 1.2164004446845037e-05, + "loss": 0.1226, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13030359148979187, + "step": 4435, + "valid_targets_mean": 1603.4, + "valid_targets_min": 1184 + }, + { + "epoch": 4.663865546218488, + "grad_norm": 0.9180121006760533, + "learning_rate": 1.2115833551572438e-05, + "loss": 0.1216, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12268111109733582, + "step": 4440, + "valid_targets_mean": 1407.5, + "valid_targets_min": 774 + }, + { + "epoch": 4.669117647058823, + "grad_norm": 0.8547903927275693, + "learning_rate": 1.2067716747571616e-05, + "loss": 0.1261, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13655883073806763, + "step": 4445, + "valid_targets_mean": 1627.1, + "valid_targets_min": 734 + }, + { + "epoch": 4.67436974789916, + "grad_norm": 0.881631394330736, + "learning_rate": 1.201965436495978e-05, + "loss": 0.1273, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12907208502292633, + "step": 4450, + "valid_targets_mean": 1424.6, + "valid_targets_min": 1004 + }, + { + "epoch": 4.679621848739496, + "grad_norm": 0.8063717130180919, + "learning_rate": 1.1971646733480784e-05, + "loss": 0.1288, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13420622050762177, + "step": 4455, + "valid_targets_mean": 1478.4, + "valid_targets_min": 803 + }, + { + "epoch": 4.684873949579832, + "grad_norm": 0.8260967863457012, + "learning_rate": 1.1923694182502848e-05, + "loss": 0.1348, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11544696986675262, + "step": 4460, + "valid_targets_mean": 1341.6, + "valid_targets_min": 782 + }, + { + "epoch": 4.690126050420168, + "grad_norm": 0.8029075297918149, + "learning_rate": 1.1875797041016286e-05, + "loss": 0.1247, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12873606383800507, + "step": 4465, + "valid_targets_mean": 1627.8, + "valid_targets_min": 646 + }, + { + "epoch": 4.695378151260504, + "grad_norm": 0.8998520655105815, + "learning_rate": 1.1827955637631283e-05, + "loss": 0.1311, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14146029949188232, + "step": 4470, + "valid_targets_mean": 1465.2, + "valid_targets_min": 591 + }, + { + "epoch": 4.70063025210084, + "grad_norm": 0.9673884965286654, + "learning_rate": 1.1780170300575602e-05, + "loss": 0.1295, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15864944458007812, + "step": 4475, + "valid_targets_mean": 1623.8, + "valid_targets_min": 796 + }, + { + "epoch": 4.705882352941177, + "grad_norm": 0.8028753858678307, + "learning_rate": 1.1732441357692353e-05, + "loss": 0.1197, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11006323993206024, + "step": 4480, + "valid_targets_mean": 1318.8, + "valid_targets_min": 848 + }, + { + "epoch": 4.711134453781512, + "grad_norm": 0.7757517539215945, + "learning_rate": 1.1684769136437742e-05, + "loss": 0.1238, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1143508329987526, + "step": 4485, + "valid_targets_mean": 1281.6, + "valid_targets_min": 665 + }, + { + "epoch": 4.716386554621849, + "grad_norm": 0.8198556072030991, + "learning_rate": 1.1637153963878815e-05, + "loss": 0.1189, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10272709280252457, + "step": 4490, + "valid_targets_mean": 1267.4, + "valid_targets_min": 640 + }, + { + "epoch": 4.7216386554621845, + "grad_norm": 0.993622221837871, + "learning_rate": 1.1589596166691231e-05, + "loss": 0.1259, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14048606157302856, + "step": 4495, + "valid_targets_mean": 1505.4, + "valid_targets_min": 662 + }, + { + "epoch": 4.726890756302521, + "grad_norm": 0.9175391246008294, + "learning_rate": 1.1542096071157012e-05, + "loss": 0.1224, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12400451302528381, + "step": 4500, + "valid_targets_mean": 1243.3, + "valid_targets_min": 724 + }, + { + "epoch": 4.732142857142857, + "grad_norm": 0.8780528943864113, + "learning_rate": 1.1494654003162285e-05, + "loss": 0.1243, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12478488683700562, + "step": 4505, + "valid_targets_mean": 1371.4, + "valid_targets_min": 924 + }, + { + "epoch": 4.737394957983193, + "grad_norm": 1.0957377833225224, + "learning_rate": 1.1447270288195089e-05, + "loss": 0.1287, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1323080062866211, + "step": 4510, + "valid_targets_mean": 1497.8, + "valid_targets_min": 773 + }, + { + "epoch": 4.742647058823529, + "grad_norm": 0.9093558038524169, + "learning_rate": 1.1399945251343114e-05, + "loss": 0.1237, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14012199640274048, + "step": 4515, + "valid_targets_mean": 1446.2, + "valid_targets_min": 692 + }, + { + "epoch": 4.7478991596638656, + "grad_norm": 0.8399340996586211, + "learning_rate": 1.1352679217291457e-05, + "loss": 0.1251, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10750658810138702, + "step": 4520, + "valid_targets_mean": 1165.6, + "valid_targets_min": 776 + }, + { + "epoch": 4.753151260504202, + "grad_norm": 0.8065610789721998, + "learning_rate": 1.1305472510320419e-05, + "loss": 0.1192, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12666700780391693, + "step": 4525, + "valid_targets_mean": 1593.9, + "valid_targets_min": 634 + }, + { + "epoch": 4.758403361344538, + "grad_norm": 0.825002414616717, + "learning_rate": 1.1258325454303286e-05, + "loss": 0.13, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13277189433574677, + "step": 4530, + "valid_targets_mean": 1652.5, + "valid_targets_min": 573 + }, + { + "epoch": 4.7636554621848735, + "grad_norm": 0.8052034847245988, + "learning_rate": 1.1211238372704073e-05, + "loss": 0.1265, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12504729628562927, + "step": 4535, + "valid_targets_mean": 1694.2, + "valid_targets_min": 754 + }, + { + "epoch": 4.76890756302521, + "grad_norm": 0.7944186688073329, + "learning_rate": 1.1164211588575339e-05, + "loss": 0.1295, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11452824622392654, + "step": 4540, + "valid_targets_mean": 1335.4, + "valid_targets_min": 763 + }, + { + "epoch": 4.774159663865547, + "grad_norm": 0.9867441295496705, + "learning_rate": 1.1117245424555967e-05, + "loss": 0.1213, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12596900761127472, + "step": 4545, + "valid_targets_mean": 1470.9, + "valid_targets_min": 956 + }, + { + "epoch": 4.779411764705882, + "grad_norm": 0.9111318412419092, + "learning_rate": 1.1070340202868915e-05, + "loss": 0.1244, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12238766252994537, + "step": 4550, + "valid_targets_mean": 1322.6, + "valid_targets_min": 676 + }, + { + "epoch": 4.784663865546219, + "grad_norm": 0.9026375196081591, + "learning_rate": 1.1023496245319056e-05, + "loss": 0.1254, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12969665229320526, + "step": 4555, + "valid_targets_mean": 1267.3, + "valid_targets_min": 780 + }, + { + "epoch": 4.7899159663865545, + "grad_norm": 0.8044017655815434, + "learning_rate": 1.0976713873290925e-05, + "loss": 0.1178, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11323502659797668, + "step": 4560, + "valid_targets_mean": 1303.4, + "valid_targets_min": 677 + }, + { + "epoch": 4.795168067226891, + "grad_norm": 0.8200442636224358, + "learning_rate": 1.0929993407746543e-05, + "loss": 0.1178, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10392217338085175, + "step": 4565, + "valid_targets_mean": 1200.9, + "valid_targets_min": 727 + }, + { + "epoch": 4.800420168067227, + "grad_norm": 0.839175470474291, + "learning_rate": 1.0883335169223212e-05, + "loss": 0.1287, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13048666715621948, + "step": 4570, + "valid_targets_mean": 1514.3, + "valid_targets_min": 726 + }, + { + "epoch": 4.805672268907563, + "grad_norm": 0.8992567495172576, + "learning_rate": 1.0836739477831297e-05, + "loss": 0.1282, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13388502597808838, + "step": 4575, + "valid_targets_mean": 1504.9, + "valid_targets_min": 669 + }, + { + "epoch": 4.810924369747899, + "grad_norm": 0.8667203247346105, + "learning_rate": 1.0790206653252055e-05, + "loss": 0.1295, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12979502975940704, + "step": 4580, + "valid_targets_mean": 1499.6, + "valid_targets_min": 750 + }, + { + "epoch": 4.8161764705882355, + "grad_norm": 0.8236209984599626, + "learning_rate": 1.0743737014735434e-05, + "loss": 0.1251, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11989112198352814, + "step": 4585, + "valid_targets_mean": 1397.2, + "valid_targets_min": 736 + }, + { + "epoch": 4.821428571428571, + "grad_norm": 0.8603157391015415, + "learning_rate": 1.0697330881097857e-05, + "loss": 0.1304, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1339968591928482, + "step": 4590, + "valid_targets_mean": 1373.4, + "valid_targets_min": 694 + }, + { + "epoch": 4.826680672268908, + "grad_norm": 0.8846127818913729, + "learning_rate": 1.0650988570720077e-05, + "loss": 0.1246, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13660481572151184, + "step": 4595, + "valid_targets_mean": 1546.9, + "valid_targets_min": 727 + }, + { + "epoch": 4.831932773109243, + "grad_norm": 0.8465612563420826, + "learning_rate": 1.0604710401544963e-05, + "loss": 0.1193, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11273416876792908, + "step": 4600, + "valid_targets_mean": 1265.4, + "valid_targets_min": 809 + }, + { + "epoch": 4.83718487394958, + "grad_norm": 0.8108208139117962, + "learning_rate": 1.0558496691075318e-05, + "loss": 0.123, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11026652157306671, + "step": 4605, + "valid_targets_mean": 1368.5, + "valid_targets_min": 684 + }, + { + "epoch": 4.842436974789916, + "grad_norm": 0.8597461483981371, + "learning_rate": 1.0512347756371726e-05, + "loss": 0.1148, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12328451871871948, + "step": 4610, + "valid_targets_mean": 1360.0, + "valid_targets_min": 750 + }, + { + "epoch": 4.847689075630252, + "grad_norm": 0.8960809913992954, + "learning_rate": 1.0466263914050362e-05, + "loss": 0.1252, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1297706663608551, + "step": 4615, + "valid_targets_mean": 1508.2, + "valid_targets_min": 818 + }, + { + "epoch": 4.852941176470588, + "grad_norm": 0.8624681465534092, + "learning_rate": 1.0420245480280804e-05, + "loss": 0.124, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13054832816123962, + "step": 4620, + "valid_targets_mean": 1582.8, + "valid_targets_min": 665 + }, + { + "epoch": 4.858193277310924, + "grad_norm": 0.9437920037528255, + "learning_rate": 1.0374292770783891e-05, + "loss": 0.1205, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14127075672149658, + "step": 4625, + "valid_targets_mean": 1475.8, + "valid_targets_min": 1093 + }, + { + "epoch": 4.86344537815126, + "grad_norm": 0.8557418798703278, + "learning_rate": 1.0328406100829542e-05, + "loss": 0.126, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1389474719762802, + "step": 4630, + "valid_targets_mean": 1493.8, + "valid_targets_min": 632 + }, + { + "epoch": 4.868697478991597, + "grad_norm": 0.87445714339707, + "learning_rate": 1.0282585785234578e-05, + "loss": 0.1263, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13523709774017334, + "step": 4635, + "valid_targets_mean": 1507.4, + "valid_targets_min": 700 + }, + { + "epoch": 4.873949579831933, + "grad_norm": 0.8287344010980091, + "learning_rate": 1.023683213836061e-05, + "loss": 0.122, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11704841256141663, + "step": 4640, + "valid_targets_mean": 1353.1, + "valid_targets_min": 810 + }, + { + "epoch": 4.879201680672269, + "grad_norm": 0.8509384511271177, + "learning_rate": 1.0191145474111823e-05, + "loss": 0.1225, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11140401661396027, + "step": 4645, + "valid_targets_mean": 1293.3, + "valid_targets_min": 589 + }, + { + "epoch": 4.884453781512605, + "grad_norm": 0.9759630950705781, + "learning_rate": 1.0145526105932872e-05, + "loss": 0.1235, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13949152827262878, + "step": 4650, + "valid_targets_mean": 1433.0, + "valid_targets_min": 750 + }, + { + "epoch": 4.889705882352941, + "grad_norm": 0.9316341415558835, + "learning_rate": 1.0099974346806714e-05, + "loss": 0.1242, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12794744968414307, + "step": 4655, + "valid_targets_mean": 1385.1, + "valid_targets_min": 641 + }, + { + "epoch": 4.894957983193278, + "grad_norm": 0.8801743318163907, + "learning_rate": 1.0054490509252423e-05, + "loss": 0.1221, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1252344250679016, + "step": 4660, + "valid_targets_mean": 1543.5, + "valid_targets_min": 701 + }, + { + "epoch": 4.900210084033613, + "grad_norm": 0.8895967821752813, + "learning_rate": 1.0009074905323118e-05, + "loss": 0.1364, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12817296385765076, + "step": 4665, + "valid_targets_mean": 1708.4, + "valid_targets_min": 1202 + }, + { + "epoch": 4.90546218487395, + "grad_norm": 0.803668498672539, + "learning_rate": 9.963727846603784e-06, + "loss": 0.1265, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12417686730623245, + "step": 4670, + "valid_targets_mean": 1497.2, + "valid_targets_min": 770 + }, + { + "epoch": 4.910714285714286, + "grad_norm": 0.8209572965038717, + "learning_rate": 9.918449644209087e-06, + "loss": 0.125, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11642634868621826, + "step": 4675, + "valid_targets_mean": 1333.4, + "valid_targets_min": 646 + }, + { + "epoch": 4.915966386554622, + "grad_norm": 0.9106589305140345, + "learning_rate": 9.873240608781341e-06, + "loss": 0.1266, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.126824289560318, + "step": 4680, + "valid_targets_mean": 1260.1, + "valid_targets_min": 723 + }, + { + "epoch": 4.921218487394958, + "grad_norm": 0.8246969179034082, + "learning_rate": 9.828101050488308e-06, + "loss": 0.1202, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11583910137414932, + "step": 4685, + "valid_targets_mean": 1421.8, + "valid_targets_min": 808 + }, + { + "epoch": 4.926470588235294, + "grad_norm": 0.9467345871410094, + "learning_rate": 9.783031279021063e-06, + "loss": 0.1272, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.121206134557724, + "step": 4690, + "valid_targets_mean": 1255.4, + "valid_targets_min": 634 + }, + { + "epoch": 4.93172268907563, + "grad_norm": 0.8946786916723871, + "learning_rate": 9.738031603591926e-06, + "loss": 0.1217, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12146471440792084, + "step": 4695, + "valid_targets_mean": 1334.6, + "valid_targets_min": 821 + }, + { + "epoch": 4.936974789915967, + "grad_norm": 0.8415482635056759, + "learning_rate": 9.69310233293227e-06, + "loss": 0.1194, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12440873682498932, + "step": 4700, + "valid_targets_mean": 1562.7, + "valid_targets_min": 849 + }, + { + "epoch": 4.942226890756302, + "grad_norm": 0.8253084558385871, + "learning_rate": 9.648243775290476e-06, + "loss": 0.1203, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12124086171388626, + "step": 4705, + "valid_targets_mean": 1435.9, + "valid_targets_min": 781 + }, + { + "epoch": 4.947478991596639, + "grad_norm": 0.8212423721287204, + "learning_rate": 9.60345623842974e-06, + "loss": 0.1296, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10891197621822357, + "step": 4710, + "valid_targets_mean": 1341.2, + "valid_targets_min": 567 + }, + { + "epoch": 4.9527310924369745, + "grad_norm": 0.7441257737363668, + "learning_rate": 9.558740029626046e-06, + "loss": 0.12, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10063184797763824, + "step": 4715, + "valid_targets_mean": 1319.9, + "valid_targets_min": 810 + }, + { + "epoch": 4.957983193277311, + "grad_norm": 0.8222604138587376, + "learning_rate": 9.51409545566597e-06, + "loss": 0.1236, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12508775293827057, + "step": 4720, + "valid_targets_mean": 1657.6, + "valid_targets_min": 868 + }, + { + "epoch": 4.963235294117647, + "grad_norm": 0.8441572887401301, + "learning_rate": 9.469522822844663e-06, + "loss": 0.1134, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12001735717058182, + "step": 4725, + "valid_targets_mean": 1566.1, + "valid_targets_min": 682 + }, + { + "epoch": 4.968487394957983, + "grad_norm": 0.8622442317465762, + "learning_rate": 9.425022436963664e-06, + "loss": 0.1153, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13704422116279602, + "step": 4730, + "valid_targets_mean": 1575.5, + "valid_targets_min": 797 + }, + { + "epoch": 4.973739495798319, + "grad_norm": 0.8300300731222955, + "learning_rate": 9.380594603328875e-06, + "loss": 0.1228, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11850959062576294, + "step": 4735, + "valid_targets_mean": 1568.6, + "valid_targets_min": 639 + }, + { + "epoch": 4.9789915966386555, + "grad_norm": 0.8820976325913817, + "learning_rate": 9.336239626748432e-06, + "loss": 0.1199, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12084612995386124, + "step": 4740, + "valid_targets_mean": 1482.9, + "valid_targets_min": 920 + }, + { + "epoch": 4.984243697478991, + "grad_norm": 0.8235056111823619, + "learning_rate": 9.291957811530602e-06, + "loss": 0.1149, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11309683322906494, + "step": 4745, + "valid_targets_mean": 1354.8, + "valid_targets_min": 847 + }, + { + "epoch": 4.989495798319328, + "grad_norm": 0.8380994731336534, + "learning_rate": 9.247749461481712e-06, + "loss": 0.1207, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12259923666715622, + "step": 4750, + "valid_targets_mean": 1451.1, + "valid_targets_min": 557 + }, + { + "epoch": 4.994747899159664, + "grad_norm": 0.9271264619980075, + "learning_rate": 9.203614879904083e-06, + "loss": 0.1212, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12632964551448822, + "step": 4755, + "valid_targets_mean": 1332.4, + "valid_targets_min": 645 + }, + { + "epoch": 5.0, + "grad_norm": 0.7766606123712497, + "learning_rate": 9.159554369593901e-06, + "loss": 0.1228, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11304584890604019, + "step": 4760, + "valid_targets_mean": 1721.1, + "valid_targets_min": 760 + }, + { + "epoch": 5.005252100840337, + "grad_norm": 1.0368311360471962, + "learning_rate": 9.115568232839193e-06, + "loss": 0.2281, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2315981090068817, + "step": 4765, + "valid_targets_mean": 3398.8, + "valid_targets_min": 746 + }, + { + "epoch": 5.010504201680672, + "grad_norm": 0.6460571203150131, + "learning_rate": 9.071656771417721e-06, + "loss": 0.207, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17781823873519897, + "step": 4770, + "valid_targets_mean": 4347.4, + "valid_targets_min": 1651 + }, + { + "epoch": 5.015756302521009, + "grad_norm": 0.542133417895063, + "learning_rate": 9.027820286594902e-06, + "loss": 0.2101, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1896631270647049, + "step": 4775, + "valid_targets_mean": 4633.2, + "valid_targets_min": 1560 + }, + { + "epoch": 5.0210084033613445, + "grad_norm": 0.6608510247217927, + "learning_rate": 8.984059079121785e-06, + "loss": 0.2035, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19018647074699402, + "step": 4780, + "valid_targets_mean": 3938.1, + "valid_targets_min": 1841 + }, + { + "epoch": 5.026260504201681, + "grad_norm": 0.6358924043276708, + "learning_rate": 8.940373449232935e-06, + "loss": 0.2111, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22464792430400848, + "step": 4785, + "valid_targets_mean": 3724.8, + "valid_targets_min": 1374 + }, + { + "epoch": 5.031512605042017, + "grad_norm": 0.6599880706584261, + "learning_rate": 8.896763696644405e-06, + "loss": 0.2016, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18435746431350708, + "step": 4790, + "valid_targets_mean": 3264.8, + "valid_targets_min": 1089 + }, + { + "epoch": 5.036764705882353, + "grad_norm": 0.7096826802832755, + "learning_rate": 8.853230120551693e-06, + "loss": 0.2038, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21627312898635864, + "step": 4795, + "valid_targets_mean": 3374.9, + "valid_targets_min": 627 + }, + { + "epoch": 5.042016806722689, + "grad_norm": 0.6612340433792787, + "learning_rate": 8.809773019627635e-06, + "loss": 0.2061, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21441474556922913, + "step": 4800, + "valid_targets_mean": 3514.9, + "valid_targets_min": 1574 + }, + { + "epoch": 5.0472689075630255, + "grad_norm": 0.6216659402671705, + "learning_rate": 8.766392692020413e-06, + "loss": 0.2138, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21736544370651245, + "step": 4805, + "valid_targets_mean": 3956.7, + "valid_targets_min": 1899 + }, + { + "epoch": 5.052521008403361, + "grad_norm": 0.6397951889136652, + "learning_rate": 8.723089435351497e-06, + "loss": 0.2059, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.213152214884758, + "step": 4810, + "valid_targets_mean": 4397.6, + "valid_targets_min": 2261 + }, + { + "epoch": 5.057773109243698, + "grad_norm": 0.6827468645370026, + "learning_rate": 8.679863546713559e-06, + "loss": 0.2105, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19350934028625488, + "step": 4815, + "valid_targets_mean": 3263.8, + "valid_targets_min": 1873 + }, + { + "epoch": 5.063025210084033, + "grad_norm": 0.6432078260343645, + "learning_rate": 8.636715322668498e-06, + "loss": 0.212, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2112460732460022, + "step": 4820, + "valid_targets_mean": 3430.2, + "valid_targets_min": 1013 + }, + { + "epoch": 5.06827731092437, + "grad_norm": 0.5998462380114775, + "learning_rate": 8.593645059245365e-06, + "loss": 0.1989, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1965964436531067, + "step": 4825, + "valid_targets_mean": 4041.6, + "valid_targets_min": 1366 + }, + { + "epoch": 5.073529411764706, + "grad_norm": 0.6552876974701827, + "learning_rate": 8.550653051938333e-06, + "loss": 0.2088, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2239168882369995, + "step": 4830, + "valid_targets_mean": 3515.2, + "valid_targets_min": 2050 + }, + { + "epoch": 5.078781512605042, + "grad_norm": 0.7164022528196604, + "learning_rate": 8.507739595704695e-06, + "loss": 0.2149, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21687167882919312, + "step": 4835, + "valid_targets_mean": 3048.9, + "valid_targets_min": 746 + }, + { + "epoch": 5.084033613445378, + "grad_norm": 0.7024986732808598, + "learning_rate": 8.464904984962832e-06, + "loss": 0.2057, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2093815803527832, + "step": 4840, + "valid_targets_mean": 2982.6, + "valid_targets_min": 855 + }, + { + "epoch": 5.089285714285714, + "grad_norm": 0.6486210855345914, + "learning_rate": 8.422149513590151e-06, + "loss": 0.2096, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22854307293891907, + "step": 4845, + "valid_targets_mean": 3753.4, + "valid_targets_min": 2125 + }, + { + "epoch": 5.09453781512605, + "grad_norm": 0.7106124392970365, + "learning_rate": 8.37947347492115e-06, + "loss": 0.2146, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20508921146392822, + "step": 4850, + "valid_targets_mean": 2946.8, + "valid_targets_min": 1173 + }, + { + "epoch": 5.099789915966387, + "grad_norm": 0.7291320506136616, + "learning_rate": 8.33687716174532e-06, + "loss": 0.2051, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20715506374835968, + "step": 4855, + "valid_targets_mean": 3284.2, + "valid_targets_min": 1438 + }, + { + "epoch": 5.105042016806722, + "grad_norm": 0.667621729812997, + "learning_rate": 8.294360866305192e-06, + "loss": 0.2038, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18001650273799896, + "step": 4860, + "valid_targets_mean": 3818.4, + "valid_targets_min": 1133 + }, + { + "epoch": 5.110294117647059, + "grad_norm": 0.6904135635931854, + "learning_rate": 8.251924880294317e-06, + "loss": 0.2068, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1863369643688202, + "step": 4865, + "valid_targets_mean": 3339.8, + "valid_targets_min": 1051 + }, + { + "epoch": 5.1155462184873945, + "grad_norm": 0.708134359007726, + "learning_rate": 8.20956949485527e-06, + "loss": 0.202, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2200697362422943, + "step": 4870, + "valid_targets_mean": 3285.1, + "valid_targets_min": 1642 + }, + { + "epoch": 5.120798319327731, + "grad_norm": 0.6714863526693571, + "learning_rate": 8.167295000577622e-06, + "loss": 0.2061, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19819751381874084, + "step": 4875, + "valid_targets_mean": 3340.8, + "valid_targets_min": 1747 + }, + { + "epoch": 5.126050420168067, + "grad_norm": 0.6991162613090433, + "learning_rate": 8.125101687496e-06, + "loss": 0.2163, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2069099098443985, + "step": 4880, + "valid_targets_mean": 3218.2, + "valid_targets_min": 1765 + }, + { + "epoch": 5.131302521008403, + "grad_norm": 0.6933394799250305, + "learning_rate": 8.082989845088038e-06, + "loss": 0.2094, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20274317264556885, + "step": 4885, + "valid_targets_mean": 3182.9, + "valid_targets_min": 1233 + }, + { + "epoch": 5.13655462184874, + "grad_norm": 0.7022583842802075, + "learning_rate": 8.040959762272441e-06, + "loss": 0.195, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19732248783111572, + "step": 4890, + "valid_targets_mean": 3020.8, + "valid_targets_min": 869 + }, + { + "epoch": 5.141806722689076, + "grad_norm": 0.6578222367990266, + "learning_rate": 7.999011727406995e-06, + "loss": 0.2022, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1947716623544693, + "step": 4895, + "valid_targets_mean": 3269.2, + "valid_targets_min": 926 + }, + { + "epoch": 5.147058823529412, + "grad_norm": 0.6729734257141221, + "learning_rate": 7.957146028286524e-06, + "loss": 0.2027, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1842532753944397, + "step": 4900, + "valid_targets_mean": 3256.4, + "valid_targets_min": 1016 + }, + { + "epoch": 5.152310924369748, + "grad_norm": 0.6998982376570767, + "learning_rate": 7.915362952141017e-06, + "loss": 0.2048, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19443146884441376, + "step": 4905, + "valid_targets_mean": 3058.4, + "valid_targets_min": 1367 + }, + { + "epoch": 5.157563025210084, + "grad_norm": 0.6159690568204116, + "learning_rate": 7.873662785633594e-06, + "loss": 0.2023, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1794825792312622, + "step": 4910, + "valid_targets_mean": 3513.8, + "valid_targets_min": 761 + }, + { + "epoch": 5.16281512605042, + "grad_norm": 0.718929827088859, + "learning_rate": 7.832045814858538e-06, + "loss": 0.1975, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19105938076972961, + "step": 4915, + "valid_targets_mean": 2834.2, + "valid_targets_min": 1480 + }, + { + "epoch": 5.168067226890757, + "grad_norm": 0.6775963512647579, + "learning_rate": 7.790512325339367e-06, + "loss": 0.1982, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18776269257068634, + "step": 4920, + "valid_targets_mean": 2854.1, + "valid_targets_min": 1229 + }, + { + "epoch": 5.173319327731092, + "grad_norm": 0.7289317859752761, + "learning_rate": 7.74906260202685e-06, + "loss": 0.209, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19116216897964478, + "step": 4925, + "valid_targets_mean": 3215.8, + "valid_targets_min": 1727 + }, + { + "epoch": 5.178571428571429, + "grad_norm": 0.6500227003936777, + "learning_rate": 7.707696929297053e-06, + "loss": 0.204, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1965217888355255, + "step": 4930, + "valid_targets_mean": 3578.9, + "valid_targets_min": 1860 + }, + { + "epoch": 5.1838235294117645, + "grad_norm": 0.7034986881633343, + "learning_rate": 7.666415590949382e-06, + "loss": 0.2052, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20505331456661224, + "step": 4935, + "valid_targets_mean": 3121.1, + "valid_targets_min": 1145 + }, + { + "epoch": 5.189075630252101, + "grad_norm": 0.8145007649387389, + "learning_rate": 7.625218870204676e-06, + "loss": 0.2074, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20866146683692932, + "step": 4940, + "valid_targets_mean": 2910.1, + "valid_targets_min": 1195 + }, + { + "epoch": 5.194327731092437, + "grad_norm": 0.6372684720958994, + "learning_rate": 7.584107049703195e-06, + "loss": 0.1956, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17585617303848267, + "step": 4945, + "valid_targets_mean": 3215.2, + "valid_targets_min": 1087 + }, + { + "epoch": 5.199579831932773, + "grad_norm": 0.6712839739955457, + "learning_rate": 7.5430804115027615e-06, + "loss": 0.2045, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19442957639694214, + "step": 4950, + "valid_targets_mean": 3842.3, + "valid_targets_min": 730 + }, + { + "epoch": 5.204831932773109, + "grad_norm": 0.7139371019585867, + "learning_rate": 7.502139237076744e-06, + "loss": 0.1986, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18818247318267822, + "step": 4955, + "valid_targets_mean": 3112.6, + "valid_targets_min": 1097 + }, + { + "epoch": 5.2100840336134455, + "grad_norm": 0.6441054449323667, + "learning_rate": 7.461283807312194e-06, + "loss": 0.1961, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20336642861366272, + "step": 4960, + "valid_targets_mean": 3587.6, + "valid_targets_min": 1833 + }, + { + "epoch": 5.215336134453781, + "grad_norm": 0.7139397353122559, + "learning_rate": 7.420514402507886e-06, + "loss": 0.2008, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21995452046394348, + "step": 4965, + "valid_targets_mean": 3660.6, + "valid_targets_min": 1182 + }, + { + "epoch": 5.220588235294118, + "grad_norm": 0.6921935226344126, + "learning_rate": 7.379831302372389e-06, + "loss": 0.2009, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2377263605594635, + "step": 4970, + "valid_targets_mean": 3839.4, + "valid_targets_min": 1586 + }, + { + "epoch": 5.225840336134453, + "grad_norm": 0.78550496353629, + "learning_rate": 7.3392347860221556e-06, + "loss": 0.2021, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2115703821182251, + "step": 4975, + "valid_targets_mean": 3062.7, + "valid_targets_min": 1714 + }, + { + "epoch": 5.23109243697479, + "grad_norm": 0.717261721079846, + "learning_rate": 7.298725131979629e-06, + "loss": 0.1999, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2131146639585495, + "step": 4980, + "valid_targets_mean": 3611.1, + "valid_targets_min": 1504 + }, + { + "epoch": 5.236344537815126, + "grad_norm": 0.6319115820709261, + "learning_rate": 7.258302618171287e-06, + "loss": 0.1956, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1644587367773056, + "step": 4985, + "valid_targets_mean": 3457.1, + "valid_targets_min": 1170 + }, + { + "epoch": 5.241596638655462, + "grad_norm": 0.760031676694523, + "learning_rate": 7.217967521925775e-06, + "loss": 0.1937, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20226861536502838, + "step": 4990, + "valid_targets_mean": 3089.3, + "valid_targets_min": 1436 + }, + { + "epoch": 5.246848739495798, + "grad_norm": 0.9470898190916125, + "learning_rate": 7.177720119971998e-06, + "loss": 0.1967, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19645410776138306, + "step": 4995, + "valid_targets_mean": 3257.2, + "valid_targets_min": 1302 + }, + { + "epoch": 5.2521008403361344, + "grad_norm": 0.706018495456836, + "learning_rate": 7.137560688437184e-06, + "loss": 0.1976, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21298207342624664, + "step": 5000, + "valid_targets_mean": 3425.1, + "valid_targets_min": 2023 + }, + { + "epoch": 5.257352941176471, + "grad_norm": 0.6165263612026762, + "learning_rate": 7.097489502845047e-06, + "loss": 0.1802, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1659245491027832, + "step": 5005, + "valid_targets_mean": 3196.4, + "valid_targets_min": 809 + }, + { + "epoch": 5.262605042016807, + "grad_norm": 0.7663728544419008, + "learning_rate": 7.0575068381138525e-06, + "loss": 0.211, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19875086843967438, + "step": 5010, + "valid_targets_mean": 3197.8, + "valid_targets_min": 1059 + }, + { + "epoch": 5.267857142857143, + "grad_norm": 0.6844105981294532, + "learning_rate": 7.0176129685545414e-06, + "loss": 0.1926, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16719815135002136, + "step": 5015, + "valid_targets_mean": 3301.7, + "valid_targets_min": 964 + }, + { + "epoch": 5.273109243697479, + "grad_norm": 0.6796898164555453, + "learning_rate": 6.977808167868867e-06, + "loss": 0.2043, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1949189305305481, + "step": 5020, + "valid_targets_mean": 3694.2, + "valid_targets_min": 1105 + }, + { + "epoch": 5.2783613445378155, + "grad_norm": 0.8023813457851872, + "learning_rate": 6.9380927091475085e-06, + "loss": 0.2102, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20866572856903076, + "step": 5025, + "valid_targets_mean": 2612.6, + "valid_targets_min": 1491 + }, + { + "epoch": 5.283613445378151, + "grad_norm": 0.762817989942347, + "learning_rate": 6.898466864868165e-06, + "loss": 0.2144, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20279455184936523, + "step": 5030, + "valid_targets_mean": 3110.5, + "valid_targets_min": 1091 + }, + { + "epoch": 5.288865546218488, + "grad_norm": 0.7866878344731686, + "learning_rate": 6.858930906893751e-06, + "loss": 0.1934, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19141477346420288, + "step": 5035, + "valid_targets_mean": 3259.2, + "valid_targets_min": 1822 + }, + { + "epoch": 5.294117647058823, + "grad_norm": 0.7702679497523474, + "learning_rate": 6.819485106470454e-06, + "loss": 0.1944, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1862347275018692, + "step": 5040, + "valid_targets_mean": 3547.6, + "valid_targets_min": 1625 + }, + { + "epoch": 5.29936974789916, + "grad_norm": 0.6629392322076868, + "learning_rate": 6.780129734225949e-06, + "loss": 0.1864, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17328760027885437, + "step": 5045, + "valid_targets_mean": 3628.2, + "valid_targets_min": 1415 + }, + { + "epoch": 5.304621848739496, + "grad_norm": 0.7042102260307026, + "learning_rate": 6.740865060167483e-06, + "loss": 0.1917, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19156163930892944, + "step": 5050, + "valid_targets_mean": 3398.9, + "valid_targets_min": 1460 + }, + { + "epoch": 5.309873949579832, + "grad_norm": 0.7519060990832099, + "learning_rate": 6.701691353680049e-06, + "loss": 0.1975, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19511482119560242, + "step": 5055, + "valid_targets_mean": 2947.4, + "valid_targets_min": 1079 + }, + { + "epoch": 5.315126050420168, + "grad_norm": 0.727969914435581, + "learning_rate": 6.662608883524542e-06, + "loss": 0.1769, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18351078033447266, + "step": 5060, + "valid_targets_mean": 3003.0, + "valid_targets_min": 1274 + }, + { + "epoch": 5.320378151260504, + "grad_norm": 0.8817302867844496, + "learning_rate": 6.6236179178359115e-06, + "loss": 0.1928, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21124529838562012, + "step": 5065, + "valid_targets_mean": 3306.3, + "valid_targets_min": 914 + }, + { + "epoch": 5.32563025210084, + "grad_norm": 0.713024621019574, + "learning_rate": 6.5847187241213e-06, + "loss": 0.2055, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19047285616397858, + "step": 5070, + "valid_targets_mean": 3332.2, + "valid_targets_min": 1312 + }, + { + "epoch": 5.330882352941177, + "grad_norm": 0.752933122434432, + "learning_rate": 6.5459115692582386e-06, + "loss": 0.1924, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1971365213394165, + "step": 5075, + "valid_targets_mean": 2601.3, + "valid_targets_min": 987 + }, + { + "epoch": 5.336134453781512, + "grad_norm": 0.624699265138433, + "learning_rate": 6.507196719492819e-06, + "loss": 0.1949, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1911473274230957, + "step": 5080, + "valid_targets_mean": 4341.5, + "valid_targets_min": 1856 + }, + { + "epoch": 5.341386554621849, + "grad_norm": 0.7283950240407708, + "learning_rate": 6.468574440437801e-06, + "loss": 0.1966, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19926682114601135, + "step": 5085, + "valid_targets_mean": 3290.9, + "valid_targets_min": 1601 + }, + { + "epoch": 5.3466386554621845, + "grad_norm": 0.7710715895807497, + "learning_rate": 6.43004499707089e-06, + "loss": 0.204, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20834487676620483, + "step": 5090, + "valid_targets_mean": 3119.4, + "valid_targets_min": 1986 + }, + { + "epoch": 5.351890756302521, + "grad_norm": 0.7170439306426001, + "learning_rate": 6.3916086537328545e-06, + "loss": 0.1858, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21489310264587402, + "step": 5095, + "valid_targets_mean": 3777.1, + "valid_targets_min": 974 + }, + { + "epoch": 5.357142857142857, + "grad_norm": 0.6744006460741591, + "learning_rate": 6.3532656741257145e-06, + "loss": 0.1852, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16385085880756378, + "step": 5100, + "valid_targets_mean": 2878.0, + "valid_targets_min": 512 + }, + { + "epoch": 5.362394957983193, + "grad_norm": 0.673275766985947, + "learning_rate": 6.315016321310965e-06, + "loss": 0.1902, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1753840446472168, + "step": 5105, + "valid_targets_mean": 3215.4, + "valid_targets_min": 1202 + }, + { + "epoch": 5.367647058823529, + "grad_norm": 0.7266719247932443, + "learning_rate": 6.276860857707727e-06, + "loss": 0.2117, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20921765267848969, + "step": 5110, + "valid_targets_mean": 3693.1, + "valid_targets_min": 1455 + }, + { + "epoch": 5.3728991596638656, + "grad_norm": 0.6960543396247455, + "learning_rate": 6.238799545090994e-06, + "loss": 0.1953, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18564675748348236, + "step": 5115, + "valid_targets_mean": 3477.5, + "valid_targets_min": 1571 + }, + { + "epoch": 5.378151260504202, + "grad_norm": 0.789570094298452, + "learning_rate": 6.20083264458981e-06, + "loss": 0.2082, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22905242443084717, + "step": 5120, + "valid_targets_mean": 2912.1, + "valid_targets_min": 1450 + }, + { + "epoch": 5.383403361344538, + "grad_norm": 0.687911349078074, + "learning_rate": 6.162960416685469e-06, + "loss": 0.1928, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18090611696243286, + "step": 5125, + "valid_targets_mean": 3323.0, + "valid_targets_min": 1431 + }, + { + "epoch": 5.388655462184874, + "grad_norm": 0.8129192543706223, + "learning_rate": 6.125183121209741e-06, + "loss": 0.2089, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2075553834438324, + "step": 5130, + "valid_targets_mean": 3461.4, + "valid_targets_min": 1147 + }, + { + "epoch": 5.39390756302521, + "grad_norm": 0.7873625003498075, + "learning_rate": 6.087501017343107e-06, + "loss": 0.2065, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2097611427307129, + "step": 5135, + "valid_targets_mean": 2641.6, + "valid_targets_min": 998 + }, + { + "epoch": 5.399159663865547, + "grad_norm": 0.7237167630580533, + "learning_rate": 6.0499143636129384e-06, + "loss": 0.199, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20370076596736908, + "step": 5140, + "valid_targets_mean": 3260.9, + "valid_targets_min": 614 + }, + { + "epoch": 5.404411764705882, + "grad_norm": 0.85938348372471, + "learning_rate": 6.012423417891766e-06, + "loss": 0.1987, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20711749792099, + "step": 5145, + "valid_targets_mean": 2796.2, + "valid_targets_min": 1005 + }, + { + "epoch": 5.409663865546219, + "grad_norm": 0.6968015629432648, + "learning_rate": 5.975028437395493e-06, + "loss": 0.1985, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2024056762456894, + "step": 5150, + "valid_targets_mean": 3183.6, + "valid_targets_min": 2298 + }, + { + "epoch": 5.4149159663865545, + "grad_norm": 0.7775633759987758, + "learning_rate": 5.937729678681612e-06, + "loss": 0.207, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20395274460315704, + "step": 5155, + "valid_targets_mean": 2821.2, + "valid_targets_min": 617 + }, + { + "epoch": 5.420168067226891, + "grad_norm": 0.7494510775854252, + "learning_rate": 5.9005273976474684e-06, + "loss": 0.1891, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18208947777748108, + "step": 5160, + "valid_targets_mean": 3265.2, + "valid_targets_min": 1665 + }, + { + "epoch": 5.425420168067227, + "grad_norm": 0.824725420965561, + "learning_rate": 5.8634218495285126e-06, + "loss": 0.2046, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20658603310585022, + "step": 5165, + "valid_targets_mean": 3019.3, + "valid_targets_min": 1076 + }, + { + "epoch": 5.430672268907563, + "grad_norm": 0.706863386587082, + "learning_rate": 5.8264132888965155e-06, + "loss": 0.193, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19833385944366455, + "step": 5170, + "valid_targets_mean": 3610.8, + "valid_targets_min": 790 + }, + { + "epoch": 5.435924369747899, + "grad_norm": 0.7103390006031945, + "learning_rate": 5.789501969657853e-06, + "loss": 0.2088, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1992931365966797, + "step": 5175, + "valid_targets_mean": 3255.8, + "valid_targets_min": 1728 + }, + { + "epoch": 5.4411764705882355, + "grad_norm": 0.6848028235034054, + "learning_rate": 5.752688145051761e-06, + "loss": 0.2018, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18287193775177002, + "step": 5180, + "valid_targets_mean": 3377.2, + "valid_targets_min": 981 + }, + { + "epoch": 5.446428571428571, + "grad_norm": 0.6806365974211747, + "learning_rate": 5.715972067648561e-06, + "loss": 0.1865, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1667267084121704, + "step": 5185, + "valid_targets_mean": 2839.1, + "valid_targets_min": 1351 + }, + { + "epoch": 5.451680672268908, + "grad_norm": 0.6810171841346309, + "learning_rate": 5.679353989347989e-06, + "loss": 0.1968, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20622935891151428, + "step": 5190, + "valid_targets_mean": 4396.7, + "valid_targets_min": 2416 + }, + { + "epoch": 5.456932773109243, + "grad_norm": 0.6886243059430002, + "learning_rate": 5.642834161377408e-06, + "loss": 0.1913, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1882258951663971, + "step": 5195, + "valid_targets_mean": 4668.6, + "valid_targets_min": 1233 + }, + { + "epoch": 5.46218487394958, + "grad_norm": 0.660869505715319, + "learning_rate": 5.606412834290121e-06, + "loss": 0.1875, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1740989089012146, + "step": 5200, + "valid_targets_mean": 3936.4, + "valid_targets_min": 1524 + }, + { + "epoch": 5.467436974789916, + "grad_norm": 0.6389923753551053, + "learning_rate": 5.570090257963645e-06, + "loss": 0.1911, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18670515716075897, + "step": 5205, + "valid_targets_mean": 4389.3, + "valid_targets_min": 856 + }, + { + "epoch": 5.472689075630252, + "grad_norm": 0.7185606904022306, + "learning_rate": 5.533866681597981e-06, + "loss": 0.1893, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18405769765377045, + "step": 5210, + "valid_targets_mean": 3241.3, + "valid_targets_min": 906 + }, + { + "epoch": 5.477941176470588, + "grad_norm": 0.796159259324853, + "learning_rate": 5.497742353713928e-06, + "loss": 0.1852, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20212048292160034, + "step": 5215, + "valid_targets_mean": 3680.4, + "valid_targets_min": 832 + }, + { + "epoch": 5.483193277310924, + "grad_norm": 0.6843887461039875, + "learning_rate": 5.461717522151371e-06, + "loss": 0.1767, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1704184114933014, + "step": 5220, + "valid_targets_mean": 3168.9, + "valid_targets_min": 1484 + }, + { + "epoch": 5.48844537815126, + "grad_norm": 0.81830636371663, + "learning_rate": 5.4257924340675535e-06, + "loss": 0.188, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18880800902843475, + "step": 5225, + "valid_targets_mean": 3667.5, + "valid_targets_min": 1440 + }, + { + "epoch": 5.493697478991597, + "grad_norm": 0.761192266055787, + "learning_rate": 5.389967335935429e-06, + "loss": 0.2039, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2186485230922699, + "step": 5230, + "valid_targets_mean": 3025.6, + "valid_targets_min": 1349 + }, + { + "epoch": 5.498949579831933, + "grad_norm": 0.7532532316921411, + "learning_rate": 5.3542424735419306e-06, + "loss": 0.1948, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1849045306444168, + "step": 5235, + "valid_targets_mean": 2935.8, + "valid_targets_min": 1156 + }, + { + "epoch": 5.504201680672269, + "grad_norm": 0.7266362371210848, + "learning_rate": 5.318618091986294e-06, + "loss": 0.1904, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17571350932121277, + "step": 5240, + "valid_targets_mean": 3190.4, + "valid_targets_min": 993 + }, + { + "epoch": 5.509453781512605, + "grad_norm": 0.7883604048005873, + "learning_rate": 5.283094435678398e-06, + "loss": 0.1845, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20258891582489014, + "step": 5245, + "valid_targets_mean": 2785.6, + "valid_targets_min": 1275 + }, + { + "epoch": 5.514705882352941, + "grad_norm": 0.738824710435114, + "learning_rate": 5.2476717483370685e-06, + "loss": 0.1907, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1991308033466339, + "step": 5250, + "valid_targets_mean": 3266.8, + "valid_targets_min": 1669 + }, + { + "epoch": 5.519957983193278, + "grad_norm": 0.7925166684746748, + "learning_rate": 5.212350272988394e-06, + "loss": 0.1974, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1969340294599533, + "step": 5255, + "valid_targets_mean": 3357.5, + "valid_targets_min": 1710 + }, + { + "epoch": 5.525210084033613, + "grad_norm": 0.6825177393092328, + "learning_rate": 5.177130251964088e-06, + "loss": 0.1917, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18405650556087494, + "step": 5260, + "valid_targets_mean": 3468.1, + "valid_targets_min": 1685 + }, + { + "epoch": 5.53046218487395, + "grad_norm": 0.6591391403288339, + "learning_rate": 5.1420119268998085e-06, + "loss": 0.1951, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19749081134796143, + "step": 5265, + "valid_targets_mean": 3659.6, + "valid_targets_min": 1931 + }, + { + "epoch": 5.535714285714286, + "grad_norm": 0.6736986111232942, + "learning_rate": 5.106995538733488e-06, + "loss": 0.1919, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18770131468772888, + "step": 5270, + "valid_targets_mean": 3862.3, + "valid_targets_min": 2009 + }, + { + "epoch": 5.540966386554622, + "grad_norm": 0.8741377267243634, + "learning_rate": 5.07208132770372e-06, + "loss": 0.1753, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16808158159255981, + "step": 5275, + "valid_targets_mean": 1792.6, + "valid_targets_min": 777 + }, + { + "epoch": 5.546218487394958, + "grad_norm": 0.8019745661839314, + "learning_rate": 5.037269533348075e-06, + "loss": 0.1325, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12899786233901978, + "step": 5280, + "valid_targets_mean": 1354.7, + "valid_targets_min": 705 + }, + { + "epoch": 5.551470588235294, + "grad_norm": 0.9281156697299153, + "learning_rate": 5.002560394501463e-06, + "loss": 0.1286, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13236215710639954, + "step": 5285, + "valid_targets_mean": 1556.9, + "valid_targets_min": 914 + }, + { + "epoch": 5.55672268907563, + "grad_norm": 0.823501068446433, + "learning_rate": 4.9679541492945135e-06, + "loss": 0.1263, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11238055676221848, + "step": 5290, + "valid_targets_mean": 1397.1, + "valid_targets_min": 680 + }, + { + "epoch": 5.561974789915967, + "grad_norm": 0.8106452499925574, + "learning_rate": 4.933451035151913e-06, + "loss": 0.1248, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12909407913684845, + "step": 5295, + "valid_targets_mean": 1698.1, + "valid_targets_min": 819 + }, + { + "epoch": 5.567226890756302, + "grad_norm": 0.8991107502754927, + "learning_rate": 4.899051288790806e-06, + "loss": 0.1232, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12105128914117813, + "step": 5300, + "valid_targets_mean": 1393.1, + "valid_targets_min": 734 + }, + { + "epoch": 5.572478991596639, + "grad_norm": 0.8395119193730466, + "learning_rate": 4.86475514621916e-06, + "loss": 0.1317, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11696095764636993, + "step": 5305, + "valid_targets_mean": 1443.1, + "valid_targets_min": 655 + }, + { + "epoch": 5.5777310924369745, + "grad_norm": 1.0738907935762767, + "learning_rate": 4.830562842734112e-06, + "loss": 0.1115, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11815018951892853, + "step": 5310, + "valid_targets_mean": 1392.2, + "valid_targets_min": 737 + }, + { + "epoch": 5.582983193277311, + "grad_norm": 0.8292783339611027, + "learning_rate": 4.796474612920421e-06, + "loss": 0.1324, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11230309307575226, + "step": 5315, + "valid_targets_mean": 1386.6, + "valid_targets_min": 759 + }, + { + "epoch": 5.588235294117647, + "grad_norm": 0.9357218955051299, + "learning_rate": 4.762490690648813e-06, + "loss": 0.1191, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12718072533607483, + "step": 5320, + "valid_targets_mean": 1442.9, + "valid_targets_min": 750 + }, + { + "epoch": 5.593487394957983, + "grad_norm": 0.8519534800000159, + "learning_rate": 4.728611309074374e-06, + "loss": 0.119, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11761420965194702, + "step": 5325, + "valid_targets_mean": 1536.1, + "valid_targets_min": 780 + }, + { + "epoch": 5.598739495798319, + "grad_norm": 0.8547416140469031, + "learning_rate": 4.694836700634975e-06, + "loss": 0.1162, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1196620911359787, + "step": 5330, + "valid_targets_mean": 1463.1, + "valid_targets_min": 679 + }, + { + "epoch": 5.6039915966386555, + "grad_norm": 1.0901335325216264, + "learning_rate": 4.661167097049668e-06, + "loss": 0.1227, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12231962382793427, + "step": 5335, + "valid_targets_mean": 1292.8, + "valid_targets_min": 771 + }, + { + "epoch": 5.609243697478991, + "grad_norm": 0.9123241183930774, + "learning_rate": 4.62760272931708e-06, + "loss": 0.1098, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11801913380622864, + "step": 5340, + "valid_targets_mean": 1542.4, + "valid_targets_min": 878 + }, + { + "epoch": 5.614495798319328, + "grad_norm": 0.8570929790691967, + "learning_rate": 4.594143827713844e-06, + "loss": 0.1095, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10810776799917221, + "step": 5345, + "valid_targets_mean": 1506.8, + "valid_targets_min": 942 + }, + { + "epoch": 5.619747899159664, + "grad_norm": 0.9539604016186798, + "learning_rate": 4.56079062179303e-06, + "loss": 0.1107, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11601479351520538, + "step": 5350, + "valid_targets_mean": 1401.9, + "valid_targets_min": 675 + }, + { + "epoch": 5.625, + "grad_norm": 0.9114757769971337, + "learning_rate": 4.527543340382538e-06, + "loss": 0.1171, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11921755969524384, + "step": 5355, + "valid_targets_mean": 1483.8, + "valid_targets_min": 892 + }, + { + "epoch": 5.630252100840336, + "grad_norm": 0.9360433208438923, + "learning_rate": 4.494402211583569e-06, + "loss": 0.1168, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11960253119468689, + "step": 5360, + "valid_targets_mean": 1356.3, + "valid_targets_min": 656 + }, + { + "epoch": 5.635504201680672, + "grad_norm": 0.8687564177093906, + "learning_rate": 4.461367462769009e-06, + "loss": 0.1185, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10865601897239685, + "step": 5365, + "valid_targets_mean": 1340.6, + "valid_targets_min": 706 + }, + { + "epoch": 5.640756302521009, + "grad_norm": 0.8626601637005205, + "learning_rate": 4.428439320581923e-06, + "loss": 0.1201, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.119922935962677, + "step": 5370, + "valid_targets_mean": 1528.6, + "valid_targets_min": 548 + }, + { + "epoch": 5.6460084033613445, + "grad_norm": 1.2286926999590546, + "learning_rate": 4.3956180109339705e-06, + "loss": 0.1161, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10904563963413239, + "step": 5375, + "valid_targets_mean": 1268.9, + "valid_targets_min": 658 + }, + { + "epoch": 5.651260504201681, + "grad_norm": 0.8729368734062463, + "learning_rate": 4.362903759003849e-06, + "loss": 0.1132, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1106632798910141, + "step": 5380, + "valid_targets_mean": 1360.1, + "valid_targets_min": 650 + }, + { + "epoch": 5.656512605042017, + "grad_norm": 0.8066508995038737, + "learning_rate": 4.33029678923576e-06, + "loss": 0.1136, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11501973122358322, + "step": 5385, + "valid_targets_mean": 1452.3, + "valid_targets_min": 859 + }, + { + "epoch": 5.661764705882353, + "grad_norm": 0.8482374901140713, + "learning_rate": 4.297797325337889e-06, + "loss": 0.1051, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11828213930130005, + "step": 5390, + "valid_targets_mean": 1391.3, + "valid_targets_min": 728 + }, + { + "epoch": 5.667016806722689, + "grad_norm": 0.826557032894644, + "learning_rate": 4.265405590280822e-06, + "loss": 0.1104, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09589506685733795, + "step": 5395, + "valid_targets_mean": 1344.4, + "valid_targets_min": 686 + }, + { + "epoch": 5.6722689075630255, + "grad_norm": 0.941561782597229, + "learning_rate": 4.233121806296072e-06, + "loss": 0.1139, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12858964502811432, + "step": 5400, + "valid_targets_mean": 1545.2, + "valid_targets_min": 697 + }, + { + "epoch": 5.677521008403361, + "grad_norm": 0.912093405528764, + "learning_rate": 4.200946194874514e-06, + "loss": 0.1109, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10562796890735626, + "step": 5405, + "valid_targets_mean": 1354.6, + "valid_targets_min": 779 + }, + { + "epoch": 5.682773109243698, + "grad_norm": 0.9260849926734132, + "learning_rate": 4.168878976764872e-06, + "loss": 0.125, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11829014122486115, + "step": 5410, + "valid_targets_mean": 1434.1, + "valid_targets_min": 729 + }, + { + "epoch": 5.688025210084033, + "grad_norm": 0.826771685553631, + "learning_rate": 4.136920371972228e-06, + "loss": 0.1094, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1030585840344429, + "step": 5415, + "valid_targets_mean": 1388.2, + "valid_targets_min": 868 + }, + { + "epoch": 5.69327731092437, + "grad_norm": 1.6999684647726199, + "learning_rate": 4.105070599756482e-06, + "loss": 0.1163, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10433146357536316, + "step": 5420, + "valid_targets_mean": 1282.3, + "valid_targets_min": 765 + }, + { + "epoch": 5.698529411764706, + "grad_norm": 0.8817697258847107, + "learning_rate": 4.073329878630856e-06, + "loss": 0.1127, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11964145302772522, + "step": 5425, + "valid_targets_mean": 1457.2, + "valid_targets_min": 793 + }, + { + "epoch": 5.703781512605042, + "grad_norm": 0.8518914261076463, + "learning_rate": 4.041698426360425e-06, + "loss": 0.1157, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11360062658786774, + "step": 5430, + "valid_targets_mean": 1448.5, + "valid_targets_min": 806 + }, + { + "epoch": 5.709033613445378, + "grad_norm": 0.8301646651006851, + "learning_rate": 4.010176459960569e-06, + "loss": 0.1063, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09808893501758575, + "step": 5435, + "valid_targets_mean": 1380.7, + "valid_targets_min": 803 + }, + { + "epoch": 5.714285714285714, + "grad_norm": 0.8473401775683042, + "learning_rate": 3.978764195695528e-06, + "loss": 0.1111, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11080893129110336, + "step": 5440, + "valid_targets_mean": 1515.7, + "valid_targets_min": 660 + }, + { + "epoch": 5.71953781512605, + "grad_norm": 0.9100300218409771, + "learning_rate": 3.947461849076912e-06, + "loss": 0.1007, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1048063337802887, + "step": 5445, + "valid_targets_mean": 1402.0, + "valid_targets_min": 837 + }, + { + "epoch": 5.724789915966387, + "grad_norm": 0.8889294607662074, + "learning_rate": 3.916269634862193e-06, + "loss": 0.1113, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10396813601255417, + "step": 5450, + "valid_targets_mean": 1574.1, + "valid_targets_min": 719 + }, + { + "epoch": 5.730042016806722, + "grad_norm": 0.8903144486882467, + "learning_rate": 3.885187767053269e-06, + "loss": 0.1153, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10951384902000427, + "step": 5455, + "valid_targets_mean": 1430.1, + "valid_targets_min": 765 + }, + { + "epoch": 5.735294117647059, + "grad_norm": 0.9031317882555354, + "learning_rate": 3.854216458894973e-06, + "loss": 0.1117, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12100645154714584, + "step": 5460, + "valid_targets_mean": 1372.3, + "valid_targets_min": 727 + }, + { + "epoch": 5.740546218487395, + "grad_norm": 0.8606806374553407, + "learning_rate": 3.823355922873606e-06, + "loss": 0.1084, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09598094969987869, + "step": 5465, + "valid_targets_mean": 1192.8, + "valid_targets_min": 655 + }, + { + "epoch": 5.745798319327731, + "grad_norm": 0.9625073380564342, + "learning_rate": 3.792606370715508e-06, + "loss": 0.1138, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10911808162927628, + "step": 5470, + "valid_targets_mean": 1508.0, + "valid_targets_min": 669 + }, + { + "epoch": 5.751050420168067, + "grad_norm": 0.8921081945325963, + "learning_rate": 3.761968013385584e-06, + "loss": 0.1069, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10961748659610748, + "step": 5475, + "valid_targets_mean": 1430.2, + "valid_targets_min": 1046 + }, + { + "epoch": 5.756302521008403, + "grad_norm": 0.9534472437981408, + "learning_rate": 3.731441061085843e-06, + "loss": 0.114, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12638525664806366, + "step": 5480, + "valid_targets_mean": 1651.8, + "valid_targets_min": 692 + }, + { + "epoch": 5.76155462184874, + "grad_norm": 0.8796809522933133, + "learning_rate": 3.701025723253988e-06, + "loss": 0.1137, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11247321218252182, + "step": 5485, + "valid_targets_mean": 1540.4, + "valid_targets_min": 846 + }, + { + "epoch": 5.766806722689076, + "grad_norm": 0.845414134902536, + "learning_rate": 3.67072220856197e-06, + "loss": 0.1172, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10926534980535507, + "step": 5490, + "valid_targets_mean": 1455.1, + "valid_targets_min": 764 + }, + { + "epoch": 5.772058823529412, + "grad_norm": 0.8126469766696464, + "learning_rate": 3.640530724914517e-06, + "loss": 0.1056, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10028908401727676, + "step": 5495, + "valid_targets_mean": 1497.4, + "valid_targets_min": 822 + }, + { + "epoch": 5.777310924369748, + "grad_norm": 0.8406164976266153, + "learning_rate": 3.61045147944777e-06, + "loss": 0.1071, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11252301931381226, + "step": 5500, + "valid_targets_mean": 1543.8, + "valid_targets_min": 982 + }, + { + "epoch": 5.782563025210084, + "grad_norm": 0.9415916945254411, + "learning_rate": 3.5804846785278315e-06, + "loss": 0.1119, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10923096537590027, + "step": 5505, + "valid_targets_mean": 1346.3, + "valid_targets_min": 713 + }, + { + "epoch": 5.78781512605042, + "grad_norm": 0.9260499456205905, + "learning_rate": 3.5506305277493326e-06, + "loss": 0.1071, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10536296665668488, + "step": 5510, + "valid_targets_mean": 1395.7, + "valid_targets_min": 721 + }, + { + "epoch": 5.793067226890757, + "grad_norm": 0.8774386593252896, + "learning_rate": 3.520889231934057e-06, + "loss": 0.1056, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10436506569385529, + "step": 5515, + "valid_targets_mean": 1290.6, + "valid_targets_min": 741 + }, + { + "epoch": 5.798319327731092, + "grad_norm": 0.8896778034184114, + "learning_rate": 3.4912609951295084e-06, + "loss": 0.1088, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1191120520234108, + "step": 5520, + "valid_targets_mean": 1568.1, + "valid_targets_min": 734 + }, + { + "epoch": 5.803571428571429, + "grad_norm": 0.9421881494917845, + "learning_rate": 3.461746020607526e-06, + "loss": 0.1162, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13356809318065643, + "step": 5525, + "valid_targets_mean": 1703.1, + "valid_targets_min": 744 + }, + { + "epoch": 5.8088235294117645, + "grad_norm": 0.9745264130361654, + "learning_rate": 3.432344510862895e-06, + "loss": 0.1158, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12390495836734772, + "step": 5530, + "valid_targets_mean": 1652.8, + "valid_targets_min": 620 + }, + { + "epoch": 5.814075630252101, + "grad_norm": 0.8607153880999272, + "learning_rate": 3.403056667611917e-06, + "loss": 0.1093, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10633715987205505, + "step": 5535, + "valid_targets_mean": 1481.8, + "valid_targets_min": 723 + }, + { + "epoch": 5.819327731092437, + "grad_norm": 0.9758519266902133, + "learning_rate": 3.373882691791088e-06, + "loss": 0.1153, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10976162552833557, + "step": 5540, + "valid_targets_mean": 1686.5, + "valid_targets_min": 740 + }, + { + "epoch": 5.824579831932773, + "grad_norm": 0.8967263497321722, + "learning_rate": 3.344822783555679e-06, + "loss": 0.1078, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10004294663667679, + "step": 5545, + "valid_targets_mean": 1345.1, + "valid_targets_min": 711 + }, + { + "epoch": 5.829831932773109, + "grad_norm": 1.0391240197314284, + "learning_rate": 3.315877142278363e-06, + "loss": 0.1144, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11110391467809677, + "step": 5550, + "valid_targets_mean": 1619.1, + "valid_targets_min": 804 + }, + { + "epoch": 5.8350840336134455, + "grad_norm": 0.8413197113632568, + "learning_rate": 3.287045966547866e-06, + "loss": 0.1064, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11233742535114288, + "step": 5555, + "valid_targets_mean": 1423.2, + "valid_targets_min": 674 + }, + { + "epoch": 5.840336134453781, + "grad_norm": 0.8505366043709849, + "learning_rate": 3.258329454167599e-06, + "loss": 0.1055, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10158196091651917, + "step": 5560, + "valid_targets_mean": 1207.4, + "valid_targets_min": 567 + }, + { + "epoch": 5.845588235294118, + "grad_norm": 0.8995630860603766, + "learning_rate": 3.2297278021542833e-06, + "loss": 0.1047, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11643253266811371, + "step": 5565, + "valid_targets_mean": 1542.4, + "valid_targets_min": 912 + }, + { + "epoch": 5.850840336134453, + "grad_norm": 0.8887960162735108, + "learning_rate": 3.201241206736614e-06, + "loss": 0.1131, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11594435572624207, + "step": 5570, + "valid_targets_mean": 1591.0, + "valid_targets_min": 897 + }, + { + "epoch": 5.85609243697479, + "grad_norm": 1.1842033013727196, + "learning_rate": 3.1728698633539266e-06, + "loss": 0.1073, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1004495844244957, + "step": 5575, + "valid_targets_mean": 1290.1, + "valid_targets_min": 773 + }, + { + "epoch": 5.8613445378151265, + "grad_norm": 0.8528216924870448, + "learning_rate": 3.1446139666548212e-06, + "loss": 0.1097, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09786748886108398, + "step": 5580, + "valid_targets_mean": 1407.2, + "valid_targets_min": 679 + }, + { + "epoch": 5.866596638655462, + "grad_norm": 0.9063160104966684, + "learning_rate": 3.1164737104958707e-06, + "loss": 0.1159, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11985988914966583, + "step": 5585, + "valid_targets_mean": 1600.2, + "valid_targets_min": 818 + }, + { + "epoch": 5.871848739495798, + "grad_norm": 0.8331809940510251, + "learning_rate": 3.0884492879402452e-06, + "loss": 0.1122, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10528066009283066, + "step": 5590, + "valid_targets_mean": 1442.4, + "valid_targets_min": 790 + }, + { + "epoch": 5.8771008403361344, + "grad_norm": 0.8662258381631335, + "learning_rate": 3.0605408912564184e-06, + "loss": 0.1078, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11069589108228683, + "step": 5595, + "valid_targets_mean": 1426.6, + "valid_targets_min": 592 + }, + { + "epoch": 5.882352941176471, + "grad_norm": 0.8059447911663884, + "learning_rate": 3.032748711916851e-06, + "loss": 0.1073, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1017690896987915, + "step": 5600, + "valid_targets_mean": 1430.9, + "valid_targets_min": 662 + }, + { + "epoch": 5.887605042016807, + "grad_norm": 0.8787623158989677, + "learning_rate": 3.0050729405966495e-06, + "loss": 0.1123, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11519140005111694, + "step": 5605, + "valid_targets_mean": 1412.6, + "valid_targets_min": 622 + }, + { + "epoch": 5.892857142857143, + "grad_norm": 1.0058669337260462, + "learning_rate": 2.9775137671722754e-06, + "loss": 0.1074, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12139453738927841, + "step": 5610, + "valid_targets_mean": 1372.1, + "valid_targets_min": 667 + }, + { + "epoch": 5.898109243697479, + "grad_norm": 0.9818342504773482, + "learning_rate": 2.9500713807202565e-06, + "loss": 0.1165, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1251143366098404, + "step": 5615, + "valid_targets_mean": 1628.1, + "valid_targets_min": 1012 + }, + { + "epoch": 5.9033613445378155, + "grad_norm": 1.0048701808002658, + "learning_rate": 2.9227459695158543e-06, + "loss": 0.1195, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12856556475162506, + "step": 5620, + "valid_targets_mean": 1464.7, + "valid_targets_min": 635 + }, + { + "epoch": 5.908613445378151, + "grad_norm": 0.9524777797952462, + "learning_rate": 2.895537721031809e-06, + "loss": 0.1112, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13392376899719238, + "step": 5625, + "valid_targets_mean": 1745.9, + "valid_targets_min": 689 + }, + { + "epoch": 5.913865546218488, + "grad_norm": 0.8360052998799868, + "learning_rate": 2.8684468219370364e-06, + "loss": 0.1099, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09906312078237534, + "step": 5630, + "valid_targets_mean": 1129.1, + "valid_targets_min": 697 + }, + { + "epoch": 5.919117647058823, + "grad_norm": 0.9259328855340732, + "learning_rate": 2.841473458095334e-06, + "loss": 0.1092, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12108924984931946, + "step": 5635, + "valid_targets_mean": 1624.6, + "valid_targets_min": 656 + }, + { + "epoch": 5.92436974789916, + "grad_norm": 0.9476207176974106, + "learning_rate": 2.8146178145641355e-06, + "loss": 0.1111, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1358291506767273, + "step": 5640, + "valid_targets_mean": 1755.8, + "valid_targets_min": 697 + }, + { + "epoch": 5.929621848739496, + "grad_norm": 0.8733881430652086, + "learning_rate": 2.787880075593217e-06, + "loss": 0.1096, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11107189953327179, + "step": 5645, + "valid_targets_mean": 1516.4, + "valid_targets_min": 820 + }, + { + "epoch": 5.934873949579832, + "grad_norm": 0.8803395218820865, + "learning_rate": 2.7612604246234355e-06, + "loss": 0.1058, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10555368661880493, + "step": 5650, + "valid_targets_mean": 1391.4, + "valid_targets_min": 680 + }, + { + "epoch": 5.940126050420168, + "grad_norm": 0.8940529152418495, + "learning_rate": 2.7347590442854867e-06, + "loss": 0.1075, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11712536960840225, + "step": 5655, + "valid_targets_mean": 1412.4, + "valid_targets_min": 778 + }, + { + "epoch": 5.945378151260504, + "grad_norm": 0.9009479204017542, + "learning_rate": 2.7083761163986433e-06, + "loss": 0.1185, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12473637610673904, + "step": 5660, + "valid_targets_mean": 1599.6, + "valid_targets_min": 851 + }, + { + "epoch": 5.95063025210084, + "grad_norm": 0.8299195293692447, + "learning_rate": 2.682111821969493e-06, + "loss": 0.1072, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10053186863660812, + "step": 5665, + "valid_targets_mean": 1398.4, + "valid_targets_min": 692 + }, + { + "epoch": 5.955882352941177, + "grad_norm": 0.8224894370809741, + "learning_rate": 2.6559663411907233e-06, + "loss": 0.1068, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09880638122558594, + "step": 5670, + "valid_targets_mean": 1477.9, + "valid_targets_min": 741 + }, + { + "epoch": 5.961134453781512, + "grad_norm": 0.8446943544157789, + "learning_rate": 2.629939853439856e-06, + "loss": 0.1043, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09644494950771332, + "step": 5675, + "valid_targets_mean": 1299.4, + "valid_targets_min": 639 + }, + { + "epoch": 5.966386554621849, + "grad_norm": 0.8887196740407839, + "learning_rate": 2.604032537278052e-06, + "loss": 0.1009, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10244621336460114, + "step": 5680, + "valid_targets_mean": 1277.9, + "valid_targets_min": 743 + }, + { + "epoch": 5.9716386554621845, + "grad_norm": 0.8494276928184287, + "learning_rate": 2.5782445704488447e-06, + "loss": 0.1103, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10847003012895584, + "step": 5685, + "valid_targets_mean": 1529.9, + "valid_targets_min": 610 + }, + { + "epoch": 5.976890756302521, + "grad_norm": 0.8658895151511194, + "learning_rate": 2.5525761298769515e-06, + "loss": 0.1061, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10970406234264374, + "step": 5690, + "valid_targets_mean": 1331.6, + "valid_targets_min": 695 + }, + { + "epoch": 5.982142857142857, + "grad_norm": 0.9065356041104413, + "learning_rate": 2.527027391667054e-06, + "loss": 0.1048, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10520265996456146, + "step": 5695, + "valid_targets_mean": 1581.9, + "valid_targets_min": 807 + }, + { + "epoch": 5.987394957983193, + "grad_norm": 0.9469535446284602, + "learning_rate": 2.501598531102587e-06, + "loss": 0.1059, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10947225987911224, + "step": 5700, + "valid_targets_mean": 1327.6, + "valid_targets_min": 765 + }, + { + "epoch": 5.992647058823529, + "grad_norm": 0.9476175324156466, + "learning_rate": 2.47628972264452e-06, + "loss": 0.1063, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11112868785858154, + "step": 5705, + "valid_targets_mean": 1346.4, + "valid_targets_min": 591 + }, + { + "epoch": 5.9978991596638656, + "grad_norm": 0.9233409415833587, + "learning_rate": 2.4511011399301944e-06, + "loss": 0.1098, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10038024187088013, + "step": 5710, + "valid_targets_mean": 1483.2, + "valid_targets_min": 692 + }, + { + "epoch": 6.003151260504202, + "grad_norm": 1.1538573337023281, + "learning_rate": 2.4260329557721107e-06, + "loss": 0.1738, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20704257488250732, + "step": 5715, + "valid_targets_mean": 4404.5, + "valid_targets_min": 1323 + }, + { + "epoch": 6.008403361344538, + "grad_norm": 1.1897027864306338, + "learning_rate": 2.4010853421567237e-06, + "loss": 0.2143, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22920134663581848, + "step": 5720, + "valid_targets_mean": 4483.4, + "valid_targets_min": 1005 + }, + { + "epoch": 6.013655462184874, + "grad_norm": 0.8684521464937454, + "learning_rate": 2.376258470243309e-06, + "loss": 0.2006, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19509011507034302, + "step": 5725, + "valid_targets_mean": 4502.1, + "valid_targets_min": 1509 + }, + { + "epoch": 6.01890756302521, + "grad_norm": 0.8037614431305709, + "learning_rate": 2.351552510362758e-06, + "loss": 0.2021, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1814684271812439, + "step": 5730, + "valid_targets_mean": 3430.2, + "valid_targets_min": 1561 + }, + { + "epoch": 6.024159663865547, + "grad_norm": 0.7816962283075021, + "learning_rate": 2.326967632016406e-06, + "loss": 0.1892, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18898342549800873, + "step": 5735, + "valid_targets_mean": 3385.4, + "valid_targets_min": 1184 + }, + { + "epoch": 6.029411764705882, + "grad_norm": 0.6426902354697276, + "learning_rate": 2.302504003874888e-06, + "loss": 0.204, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1760241985321045, + "step": 5740, + "valid_targets_mean": 3982.6, + "valid_targets_min": 1413 + }, + { + "epoch": 6.034663865546219, + "grad_norm": 0.632043071580013, + "learning_rate": 2.2781617937769675e-06, + "loss": 0.1805, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19574542343616486, + "step": 5745, + "valid_targets_mean": 4911.7, + "valid_targets_min": 2160 + }, + { + "epoch": 6.0399159663865545, + "grad_norm": 0.7493769564211563, + "learning_rate": 2.2539411687283907e-06, + "loss": 0.2004, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19801229238510132, + "step": 5750, + "valid_targets_mean": 3782.6, + "valid_targets_min": 1511 + }, + { + "epoch": 6.045168067226891, + "grad_norm": 0.7505509884796049, + "learning_rate": 2.229842294900744e-06, + "loss": 0.1974, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20454156398773193, + "step": 5755, + "valid_targets_mean": 3030.0, + "valid_targets_min": 1462 + }, + { + "epoch": 6.050420168067227, + "grad_norm": 0.6430262170455331, + "learning_rate": 2.205865337630302e-06, + "loss": 0.2006, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18196547031402588, + "step": 5760, + "valid_targets_mean": 3772.4, + "valid_targets_min": 874 + }, + { + "epoch": 6.055672268907563, + "grad_norm": 0.7098617069387976, + "learning_rate": 2.182010461416899e-06, + "loss": 0.1983, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19023019075393677, + "step": 5765, + "valid_targets_mean": 3337.1, + "valid_targets_min": 953 + }, + { + "epoch": 6.060924369747899, + "grad_norm": 0.6552026128807007, + "learning_rate": 2.158277829922817e-06, + "loss": 0.2004, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2095913290977478, + "step": 5770, + "valid_targets_mean": 4284.9, + "valid_targets_min": 1265 + }, + { + "epoch": 6.0661764705882355, + "grad_norm": 0.5640222204672125, + "learning_rate": 2.1346676059716253e-06, + "loss": 0.1961, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19262853264808655, + "step": 5775, + "valid_targets_mean": 5010.6, + "valid_targets_min": 1596 + }, + { + "epoch": 6.071428571428571, + "grad_norm": 0.6700501160751591, + "learning_rate": 2.1111799515471066e-06, + "loss": 0.1951, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2048107534646988, + "step": 5780, + "valid_targets_mean": 3490.4, + "valid_targets_min": 1759 + }, + { + "epoch": 6.076680672268908, + "grad_norm": 1.192594245087854, + "learning_rate": 2.0878150277921195e-06, + "loss": 0.1997, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20699971914291382, + "step": 5785, + "valid_targets_mean": 3264.3, + "valid_targets_min": 1353 + }, + { + "epoch": 6.081932773109243, + "grad_norm": 0.6402893347468779, + "learning_rate": 2.064572995007492e-06, + "loss": 0.1987, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17887401580810547, + "step": 5790, + "valid_targets_mean": 3814.6, + "valid_targets_min": 1643 + }, + { + "epoch": 6.08718487394958, + "grad_norm": 0.6836188652244888, + "learning_rate": 2.0414540126509274e-06, + "loss": 0.1928, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17512783408164978, + "step": 5795, + "valid_targets_mean": 3166.1, + "valid_targets_min": 1269 + }, + { + "epoch": 6.092436974789916, + "grad_norm": 0.6778220747996802, + "learning_rate": 2.0184582393359253e-06, + "loss": 0.209, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20338422060012817, + "step": 5800, + "valid_targets_mean": 3617.4, + "valid_targets_min": 1681 + }, + { + "epoch": 6.097689075630252, + "grad_norm": 0.6622080466063627, + "learning_rate": 1.99558583283066e-06, + "loss": 0.1926, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17835170030593872, + "step": 5805, + "valid_targets_mean": 3919.8, + "valid_targets_min": 1477 + }, + { + "epoch": 6.102941176470588, + "grad_norm": 0.7482662124846838, + "learning_rate": 1.9728369500569333e-06, + "loss": 0.2007, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1978331208229065, + "step": 5810, + "valid_targets_mean": 3418.5, + "valid_targets_min": 662 + }, + { + "epoch": 6.108193277310924, + "grad_norm": 1.0158385440208195, + "learning_rate": 1.950211747089077e-06, + "loss": 0.1963, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2101389467716217, + "step": 5815, + "valid_targets_mean": 3706.7, + "valid_targets_min": 2077 + }, + { + "epoch": 6.11344537815126, + "grad_norm": 0.7058981750753525, + "learning_rate": 1.927710379152881e-06, + "loss": 0.1819, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1703696846961975, + "step": 5820, + "valid_targets_mean": 2878.1, + "valid_targets_min": 1505 + }, + { + "epoch": 6.118697478991597, + "grad_norm": 0.7508480855114319, + "learning_rate": 1.9053330006245452e-06, + "loss": 0.2016, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21035335958003998, + "step": 5825, + "valid_targets_mean": 3418.0, + "valid_targets_min": 1957 + }, + { + "epoch": 6.123949579831933, + "grad_norm": 0.8433194225905101, + "learning_rate": 1.8830797650296006e-06, + "loss": 0.2058, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25868695974349976, + "step": 5830, + "valid_targets_mean": 4106.4, + "valid_targets_min": 1704 + }, + { + "epoch": 6.129201680672269, + "grad_norm": 0.7590435573654869, + "learning_rate": 1.8609508250418628e-06, + "loss": 0.1922, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2122974842786789, + "step": 5835, + "valid_targets_mean": 3046.9, + "valid_targets_min": 1422 + }, + { + "epoch": 6.1344537815126055, + "grad_norm": 0.685478517649954, + "learning_rate": 1.8389463324823986e-06, + "loss": 0.186, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1737407147884369, + "step": 5840, + "valid_targets_mean": 3447.4, + "valid_targets_min": 1603 + }, + { + "epoch": 6.139705882352941, + "grad_norm": 0.8161452603910854, + "learning_rate": 1.81706643831846e-06, + "loss": 0.1991, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20304900407791138, + "step": 5845, + "valid_targets_mean": 2597.8, + "valid_targets_min": 1685 + }, + { + "epoch": 6.144957983193278, + "grad_norm": 0.7114292866383795, + "learning_rate": 1.7953112926624715e-06, + "loss": 0.1864, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19642803072929382, + "step": 5850, + "valid_targets_mean": 3290.6, + "valid_targets_min": 1208 + }, + { + "epoch": 6.150210084033613, + "grad_norm": 0.7279693187875432, + "learning_rate": 1.7736810447709852e-06, + "loss": 0.1954, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1854780614376068, + "step": 5855, + "valid_targets_mean": 2661.8, + "valid_targets_min": 1501 + }, + { + "epoch": 6.15546218487395, + "grad_norm": 0.7284805186121608, + "learning_rate": 1.7521758430436553e-06, + "loss": 0.1961, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22248005867004395, + "step": 5860, + "valid_targets_mean": 3849.0, + "valid_targets_min": 1866 + }, + { + "epoch": 6.160714285714286, + "grad_norm": 0.641586434100809, + "learning_rate": 1.7307958350222366e-06, + "loss": 0.1819, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1723538041114807, + "step": 5865, + "valid_targets_mean": 3397.9, + "valid_targets_min": 1239 + }, + { + "epoch": 6.165966386554622, + "grad_norm": 0.7494400065396022, + "learning_rate": 1.7095411673895545e-06, + "loss": 0.1915, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20020216703414917, + "step": 5870, + "valid_targets_mean": 3155.5, + "valid_targets_min": 1177 + }, + { + "epoch": 6.171218487394958, + "grad_norm": 0.7120710111731775, + "learning_rate": 1.6884119859685034e-06, + "loss": 0.1922, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18129676580429077, + "step": 5875, + "valid_targets_mean": 3594.5, + "valid_targets_min": 1270 + }, + { + "epoch": 6.176470588235294, + "grad_norm": 0.7012711548565949, + "learning_rate": 1.6674084357210562e-06, + "loss": 0.1943, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18761314451694489, + "step": 5880, + "valid_targets_mean": 3571.2, + "valid_targets_min": 1216 + }, + { + "epoch": 6.18172268907563, + "grad_norm": 0.6937981892604655, + "learning_rate": 1.6465306607472608e-06, + "loss": 0.1927, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18734653294086456, + "step": 5885, + "valid_targets_mean": 3290.8, + "valid_targets_min": 1184 + }, + { + "epoch": 6.186974789915967, + "grad_norm": 0.7223230217430263, + "learning_rate": 1.625778804284246e-06, + "loss": 0.1955, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18657483160495758, + "step": 5890, + "valid_targets_mean": 2986.1, + "valid_targets_min": 1292 + }, + { + "epoch": 6.192226890756302, + "grad_norm": 0.703895451312637, + "learning_rate": 1.6051530087052558e-06, + "loss": 0.1986, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18239927291870117, + "step": 5895, + "valid_targets_mean": 3485.4, + "valid_targets_min": 1639 + }, + { + "epoch": 6.197478991596639, + "grad_norm": 0.7220190947994646, + "learning_rate": 1.5846534155186511e-06, + "loss": 0.1811, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19022542238235474, + "step": 5900, + "valid_targets_mean": 2959.4, + "valid_targets_min": 1394 + }, + { + "epoch": 6.2027310924369745, + "grad_norm": 0.7192311642483811, + "learning_rate": 1.564280165366956e-06, + "loss": 0.1979, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20613990724086761, + "step": 5905, + "valid_targets_mean": 3428.9, + "valid_targets_min": 2280 + }, + { + "epoch": 6.207983193277311, + "grad_norm": 0.7691711026249906, + "learning_rate": 1.544033398025886e-06, + "loss": 0.1868, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21603600680828094, + "step": 5910, + "valid_targets_mean": 3233.9, + "valid_targets_min": 810 + }, + { + "epoch": 6.213235294117647, + "grad_norm": 0.8449315953755364, + "learning_rate": 1.5239132524033951e-06, + "loss": 0.1834, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18134553730487823, + "step": 5915, + "valid_targets_mean": 3211.6, + "valid_targets_min": 1654 + }, + { + "epoch": 6.218487394957983, + "grad_norm": 0.7395008703366813, + "learning_rate": 1.50391986653871e-06, + "loss": 0.1916, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18029049038887024, + "step": 5920, + "valid_targets_mean": 3057.8, + "valid_targets_min": 584 + }, + { + "epoch": 6.223739495798319, + "grad_norm": 0.7120133644780183, + "learning_rate": 1.4840533776013954e-06, + "loss": 0.1916, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20296408236026764, + "step": 5925, + "valid_targets_mean": 3572.6, + "valid_targets_min": 2498 + }, + { + "epoch": 6.2289915966386555, + "grad_norm": 0.752548834195417, + "learning_rate": 1.4643139218904035e-06, + "loss": 0.1897, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18757691979408264, + "step": 5930, + "valid_targets_mean": 3161.1, + "valid_targets_min": 1350 + }, + { + "epoch": 6.234243697478991, + "grad_norm": 0.7837418288101413, + "learning_rate": 1.4447016348331477e-06, + "loss": 0.1975, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19451862573623657, + "step": 5935, + "valid_targets_mean": 3486.1, + "valid_targets_min": 1624 + }, + { + "epoch": 6.239495798319328, + "grad_norm": 0.7679677373950752, + "learning_rate": 1.4252166509845777e-06, + "loss": 0.1762, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16891759634017944, + "step": 5940, + "valid_targets_mean": 2769.6, + "valid_targets_min": 916 + }, + { + "epoch": 6.244747899159663, + "grad_norm": 0.6545085160769695, + "learning_rate": 1.4058591040262259e-06, + "loss": 0.1878, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1811821609735489, + "step": 5945, + "valid_targets_mean": 3734.1, + "valid_targets_min": 2209 + }, + { + "epoch": 6.25, + "grad_norm": 0.7272522502400294, + "learning_rate": 1.3866291267653309e-06, + "loss": 0.1889, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18539613485336304, + "step": 5950, + "valid_targets_mean": 3107.0, + "valid_targets_min": 1259 + }, + { + "epoch": 6.255252100840336, + "grad_norm": 0.6965968942209451, + "learning_rate": 1.3675268511339067e-06, + "loss": 0.1829, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17434164881706238, + "step": 5955, + "valid_targets_mean": 3685.6, + "valid_targets_min": 1183 + }, + { + "epoch": 6.260504201680672, + "grad_norm": 0.7307769179047728, + "learning_rate": 1.3485524081878288e-06, + "loss": 0.1806, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20974670350551605, + "step": 5960, + "valid_targets_mean": 3891.3, + "valid_targets_min": 1101 + }, + { + "epoch": 6.265756302521009, + "grad_norm": 0.7157157431884991, + "learning_rate": 1.3297059281059533e-06, + "loss": 0.1975, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19651910662651062, + "step": 5965, + "valid_targets_mean": 3877.6, + "valid_targets_min": 1658 + }, + { + "epoch": 6.2710084033613445, + "grad_norm": 0.8654778291967979, + "learning_rate": 1.3109875401892146e-06, + "loss": 0.187, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19856885075569153, + "step": 5970, + "valid_targets_mean": 3050.1, + "valid_targets_min": 1423 + }, + { + "epoch": 6.276260504201681, + "grad_norm": 0.7591061487662136, + "learning_rate": 1.2923973728597373e-06, + "loss": 0.1957, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18958264589309692, + "step": 5975, + "valid_targets_mean": 3202.4, + "valid_targets_min": 1185 + }, + { + "epoch": 6.281512605042017, + "grad_norm": 0.7845162142528881, + "learning_rate": 1.2739355536599508e-06, + "loss": 0.2075, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2176717221736908, + "step": 5980, + "valid_targets_mean": 3779.1, + "valid_targets_min": 1091 + }, + { + "epoch": 6.286764705882353, + "grad_norm": 0.7274113285487317, + "learning_rate": 1.2556022092517362e-06, + "loss": 0.1891, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1754409372806549, + "step": 5985, + "valid_targets_mean": 3628.9, + "valid_targets_min": 1352 + }, + { + "epoch": 6.292016806722689, + "grad_norm": 0.6322394750569781, + "learning_rate": 1.237397465415524e-06, + "loss": 0.19, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19616565108299255, + "step": 5990, + "valid_targets_mean": 4061.2, + "valid_targets_min": 1535 + }, + { + "epoch": 6.2972689075630255, + "grad_norm": 0.7257557508034214, + "learning_rate": 1.2193214470494664e-06, + "loss": 0.18, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.167373925447464, + "step": 5995, + "valid_targets_mean": 2753.1, + "valid_targets_min": 854 + }, + { + "epoch": 6.302521008403361, + "grad_norm": 0.7431922528740501, + "learning_rate": 1.201374278168541e-06, + "loss": 0.1768, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16021127998828888, + "step": 6000, + "valid_targets_mean": 2942.5, + "valid_targets_min": 1179 + }, + { + "epoch": 6.307773109243698, + "grad_norm": 0.7197510596784839, + "learning_rate": 1.1835560819037429e-06, + "loss": 0.1872, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1804109513759613, + "step": 6005, + "valid_targets_mean": 3598.9, + "valid_targets_min": 1290 + }, + { + "epoch": 6.313025210084033, + "grad_norm": 0.8045418304005293, + "learning_rate": 1.1658669805012112e-06, + "loss": 0.1761, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1749718338251114, + "step": 6010, + "valid_targets_mean": 2332.6, + "valid_targets_min": 642 + }, + { + "epoch": 6.31827731092437, + "grad_norm": 0.7127205041558864, + "learning_rate": 1.1483070953213904e-06, + "loss": 0.1745, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18035557866096497, + "step": 6015, + "valid_targets_mean": 3670.2, + "valid_targets_min": 1764 + }, + { + "epoch": 6.323529411764706, + "grad_norm": 0.8051860130698884, + "learning_rate": 1.130876546838211e-06, + "loss": 0.2005, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2282528579235077, + "step": 6020, + "valid_targets_mean": 3528.6, + "valid_targets_min": 1410 + }, + { + "epoch": 6.328781512605042, + "grad_norm": 0.7625429310294065, + "learning_rate": 1.1135754546382627e-06, + "loss": 0.1813, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19633427262306213, + "step": 6025, + "valid_targets_mean": 3147.7, + "valid_targets_min": 1683 + }, + { + "epoch": 6.334033613445378, + "grad_norm": 0.7138024696131663, + "learning_rate": 1.0964039374199564e-06, + "loss": 0.1872, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19841980934143066, + "step": 6030, + "valid_targets_mean": 3632.5, + "valid_targets_min": 996 + }, + { + "epoch": 6.339285714285714, + "grad_norm": 0.7688382202900614, + "learning_rate": 1.07936211299273e-06, + "loss": 0.188, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18963909149169922, + "step": 6035, + "valid_targets_mean": 3135.3, + "valid_targets_min": 1349 + }, + { + "epoch": 6.34453781512605, + "grad_norm": 0.7341808809524797, + "learning_rate": 1.0624500982762376e-06, + "loss": 0.1859, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2044352889060974, + "step": 6040, + "valid_targets_mean": 3391.6, + "valid_targets_min": 1248 + }, + { + "epoch": 6.349789915966387, + "grad_norm": 0.7221599296550733, + "learning_rate": 1.045668009299523e-06, + "loss": 0.1844, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17875009775161743, + "step": 6045, + "valid_targets_mean": 3323.4, + "valid_targets_min": 1445 + }, + { + "epoch": 6.355042016806722, + "grad_norm": 0.7155618590130363, + "learning_rate": 1.029015961200266e-06, + "loss": 0.181, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17386895418167114, + "step": 6050, + "valid_targets_mean": 3134.3, + "valid_targets_min": 2000 + }, + { + "epoch": 6.360294117647059, + "grad_norm": 0.8696023819163883, + "learning_rate": 1.012494068223946e-06, + "loss": 0.1759, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18593569099903107, + "step": 6055, + "valid_targets_mean": 2828.3, + "valid_targets_min": 1197 + }, + { + "epoch": 6.3655462184873945, + "grad_norm": 0.7145375703144178, + "learning_rate": 9.961024437230948e-07, + "loss": 0.1948, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18828941881656647, + "step": 6060, + "valid_targets_mean": 3219.0, + "valid_targets_min": 1223 + }, + { + "epoch": 6.370798319327731, + "grad_norm": 0.7434045401240451, + "learning_rate": 9.798412001565038e-07, + "loss": 0.1947, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17213355004787445, + "step": 6065, + "valid_targets_mean": 3199.2, + "valid_targets_min": 869 + }, + { + "epoch": 6.376050420168067, + "grad_norm": 0.760275705548783, + "learning_rate": 9.63710449088453e-07, + "loss": 0.1912, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19253242015838623, + "step": 6070, + "valid_targets_mean": 2817.8, + "valid_targets_min": 1603 + }, + { + "epoch": 6.381302521008403, + "grad_norm": 0.729204870471661, + "learning_rate": 9.477103011879408e-07, + "loss": 0.1931, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17323127388954163, + "step": 6075, + "valid_targets_mean": 2942.2, + "valid_targets_min": 1135 + }, + { + "epoch": 6.38655462184874, + "grad_norm": 0.7069419195201837, + "learning_rate": 9.318408662279399e-07, + "loss": 0.1945, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21406994760036469, + "step": 6080, + "valid_targets_mean": 4077.0, + "valid_targets_min": 1994 + }, + { + "epoch": 6.391806722689076, + "grad_norm": 0.7466628023501196, + "learning_rate": 9.161022530846253e-07, + "loss": 0.1942, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16813525557518005, + "step": 6085, + "valid_targets_mean": 3060.1, + "valid_targets_min": 1066 + }, + { + "epoch": 6.397058823529412, + "grad_norm": 0.7366467317633626, + "learning_rate": 9.004945697366452e-07, + "loss": 0.1932, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20294198393821716, + "step": 6090, + "valid_targets_mean": 3687.4, + "valid_targets_min": 1211 + }, + { + "epoch": 6.402310924369748, + "grad_norm": 0.7660213872137742, + "learning_rate": 8.850179232643641e-07, + "loss": 0.1903, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1757078468799591, + "step": 6095, + "valid_targets_mean": 2972.2, + "valid_targets_min": 1195 + }, + { + "epoch": 6.407563025210084, + "grad_norm": 0.8448238623784213, + "learning_rate": 8.696724198491369e-07, + "loss": 0.1894, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18741391599178314, + "step": 6100, + "valid_targets_mean": 2429.5, + "valid_targets_min": 484 + }, + { + "epoch": 6.41281512605042, + "grad_norm": 0.7208665843891413, + "learning_rate": 8.544581647725825e-07, + "loss": 0.1976, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2011285126209259, + "step": 6105, + "valid_targets_mean": 3851.9, + "valid_targets_min": 1257 + }, + { + "epoch": 6.418067226890757, + "grad_norm": 0.7164569848209156, + "learning_rate": 8.393752624158603e-07, + "loss": 0.1867, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17893822491168976, + "step": 6110, + "valid_targets_mean": 3483.2, + "valid_targets_min": 1372 + }, + { + "epoch": 6.423319327731092, + "grad_norm": 0.7706889942916458, + "learning_rate": 8.244238162589435e-07, + "loss": 0.1886, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19799582660198212, + "step": 6115, + "valid_targets_mean": 3186.8, + "valid_targets_min": 1769 + }, + { + "epoch": 6.428571428571429, + "grad_norm": 0.7885866860059115, + "learning_rate": 8.096039288799251e-07, + "loss": 0.1906, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18775229156017303, + "step": 6120, + "valid_targets_mean": 3407.6, + "valid_targets_min": 1074 + }, + { + "epoch": 6.4338235294117645, + "grad_norm": 0.6919907540962501, + "learning_rate": 7.949157019543064e-07, + "loss": 0.1957, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1812029927968979, + "step": 6125, + "valid_targets_mean": 3796.4, + "valid_targets_min": 980 + }, + { + "epoch": 6.439075630252101, + "grad_norm": 0.7918341376555602, + "learning_rate": 7.803592362542911e-07, + "loss": 0.1995, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20236995816230774, + "step": 6130, + "valid_targets_mean": 2808.1, + "valid_targets_min": 793 + }, + { + "epoch": 6.444327731092437, + "grad_norm": 0.7965898165350053, + "learning_rate": 7.659346316481086e-07, + "loss": 0.1842, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22702500224113464, + "step": 6135, + "valid_targets_mean": 3677.5, + "valid_targets_min": 1471 + }, + { + "epoch": 6.449579831932773, + "grad_norm": 0.7266460626729361, + "learning_rate": 7.516419870993296e-07, + "loss": 0.1783, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16017696261405945, + "step": 6140, + "valid_targets_mean": 3032.6, + "valid_targets_min": 1353 + }, + { + "epoch": 6.454831932773109, + "grad_norm": 0.7762725308287282, + "learning_rate": 7.374814006661667e-07, + "loss": 0.1851, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17704874277114868, + "step": 6145, + "valid_targets_mean": 2601.9, + "valid_targets_min": 1084 + }, + { + "epoch": 6.4600840336134455, + "grad_norm": 0.6779697306222039, + "learning_rate": 7.234529695008241e-07, + "loss": 0.1838, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17760631442070007, + "step": 6150, + "valid_targets_mean": 3280.8, + "valid_targets_min": 1428 + }, + { + "epoch": 6.465336134453781, + "grad_norm": 0.8121257910719274, + "learning_rate": 7.095567898488175e-07, + "loss": 0.1811, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1856568455696106, + "step": 6155, + "valid_targets_mean": 3229.4, + "valid_targets_min": 1193 + }, + { + "epoch": 6.470588235294118, + "grad_norm": 0.7371997769488223, + "learning_rate": 6.957929570483224e-07, + "loss": 0.1817, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17043937742710114, + "step": 6160, + "valid_targets_mean": 3519.2, + "valid_targets_min": 1614 + }, + { + "epoch": 6.475840336134453, + "grad_norm": 0.6638062829293753, + "learning_rate": 6.821615655295155e-07, + "loss": 0.174, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16736310720443726, + "step": 6165, + "valid_targets_mean": 3699.1, + "valid_targets_min": 974 + }, + { + "epoch": 6.48109243697479, + "grad_norm": 0.7220475008819989, + "learning_rate": 6.686627088139253e-07, + "loss": 0.1747, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14820286631584167, + "step": 6170, + "valid_targets_mean": 2730.4, + "valid_targets_min": 1575 + }, + { + "epoch": 6.486344537815126, + "grad_norm": 0.6962914540227392, + "learning_rate": 6.552964795137895e-07, + "loss": 0.1796, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18003645539283752, + "step": 6175, + "valid_targets_mean": 3345.0, + "valid_targets_min": 1697 + }, + { + "epoch": 6.491596638655462, + "grad_norm": 0.7440882846707011, + "learning_rate": 6.420629693314317e-07, + "loss": 0.1846, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19298087060451508, + "step": 6180, + "valid_targets_mean": 3602.2, + "valid_targets_min": 1970 + }, + { + "epoch": 6.496848739495798, + "grad_norm": 0.7715353825685302, + "learning_rate": 6.289622690586151e-07, + "loss": 0.1967, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18994097411632538, + "step": 6185, + "valid_targets_mean": 3128.4, + "valid_targets_min": 887 + }, + { + "epoch": 6.5021008403361344, + "grad_norm": 0.8887946663567943, + "learning_rate": 6.159944685759289e-07, + "loss": 0.1788, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1865498125553131, + "step": 6190, + "valid_targets_mean": 2712.2, + "valid_targets_min": 1279 + }, + { + "epoch": 6.507352941176471, + "grad_norm": 0.6867564122848154, + "learning_rate": 6.031596568521792e-07, + "loss": 0.1742, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1672389805316925, + "step": 6195, + "valid_targets_mean": 3052.6, + "valid_targets_min": 1021 + }, + { + "epoch": 6.512605042016807, + "grad_norm": 0.8081151613494477, + "learning_rate": 5.904579219437567e-07, + "loss": 0.1874, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1853436529636383, + "step": 6200, + "valid_targets_mean": 3352.1, + "valid_targets_min": 654 + }, + { + "epoch": 6.517857142857143, + "grad_norm": 0.8297017876682581, + "learning_rate": 5.778893509940497e-07, + "loss": 0.1855, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2378537356853485, + "step": 6205, + "valid_targets_mean": 2860.6, + "valid_targets_min": 1039 + }, + { + "epoch": 6.523109243697479, + "grad_norm": 0.7037062721004519, + "learning_rate": 5.654540302328526e-07, + "loss": 0.1874, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17788448929786682, + "step": 6210, + "valid_targets_mean": 3742.9, + "valid_targets_min": 2459 + }, + { + "epoch": 6.5283613445378155, + "grad_norm": 0.6751043734055584, + "learning_rate": 5.531520449757465e-07, + "loss": 0.1865, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16557300090789795, + "step": 6215, + "valid_targets_mean": 3435.8, + "valid_targets_min": 1276 + }, + { + "epoch": 6.533613445378151, + "grad_norm": 0.6332717965969442, + "learning_rate": 5.409834796235447e-07, + "loss": 0.1827, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17843201756477356, + "step": 6220, + "valid_targets_mean": 4335.8, + "valid_targets_min": 1572 + }, + { + "epoch": 6.538865546218488, + "grad_norm": 0.7540653616743905, + "learning_rate": 5.28948417661701e-07, + "loss": 0.1847, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1931922882795334, + "step": 6225, + "valid_targets_mean": 2975.5, + "valid_targets_min": 791 + }, + { + "epoch": 6.544117647058823, + "grad_norm": 0.945825539132947, + "learning_rate": 5.170469416597223e-07, + "loss": 0.1348, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1272469162940979, + "step": 6230, + "valid_targets_mean": 1444.9, + "valid_targets_min": 740 + }, + { + "epoch": 6.54936974789916, + "grad_norm": 0.9201038959571372, + "learning_rate": 5.05279133270633e-07, + "loss": 0.1261, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12720605731010437, + "step": 6235, + "valid_targets_mean": 1456.5, + "valid_targets_min": 612 + }, + { + "epoch": 6.554621848739496, + "grad_norm": 0.9294548695403332, + "learning_rate": 4.936450732303866e-07, + "loss": 0.1212, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12623611092567444, + "step": 6240, + "valid_targets_mean": 1432.6, + "valid_targets_min": 826 + }, + { + "epoch": 6.559873949579832, + "grad_norm": 0.81095763836755, + "learning_rate": 4.821448413573237e-07, + "loss": 0.1169, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11129063367843628, + "step": 6245, + "valid_targets_mean": 1432.6, + "valid_targets_min": 742 + }, + { + "epoch": 6.565126050420168, + "grad_norm": 0.8336053499869773, + "learning_rate": 4.70778516551631e-07, + "loss": 0.123, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11743263155221939, + "step": 6250, + "valid_targets_mean": 1387.0, + "valid_targets_min": 718 + }, + { + "epoch": 6.570378151260504, + "grad_norm": 0.8189714574359003, + "learning_rate": 4.595461767947829e-07, + "loss": 0.1256, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12419360131025314, + "step": 6255, + "valid_targets_mean": 1527.4, + "valid_targets_min": 764 + }, + { + "epoch": 6.57563025210084, + "grad_norm": 0.8726128195536536, + "learning_rate": 4.484478991490249e-07, + "loss": 0.108, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10007977485656738, + "step": 6260, + "valid_targets_mean": 1353.6, + "valid_targets_min": 725 + }, + { + "epoch": 6.580882352941177, + "grad_norm": 0.9528237066239539, + "learning_rate": 4.374837597568338e-07, + "loss": 0.1271, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10588499903678894, + "step": 6265, + "valid_targets_mean": 1309.9, + "valid_targets_min": 610 + }, + { + "epoch": 6.586134453781512, + "grad_norm": 0.773375907639893, + "learning_rate": 4.266538338403936e-07, + "loss": 0.1134, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1066712811589241, + "step": 6270, + "valid_targets_mean": 1465.4, + "valid_targets_min": 720 + }, + { + "epoch": 6.591386554621849, + "grad_norm": 0.7447038454026255, + "learning_rate": 4.159581957010894e-07, + "loss": 0.1176, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10983015596866608, + "step": 6275, + "valid_targets_mean": 1379.4, + "valid_targets_min": 615 + }, + { + "epoch": 6.5966386554621845, + "grad_norm": 0.8705541079832045, + "learning_rate": 4.0539691871898545e-07, + "loss": 0.1092, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10850921273231506, + "step": 6280, + "valid_targets_mean": 1158.2, + "valid_targets_min": 593 + }, + { + "epoch": 6.601890756302521, + "grad_norm": 0.9416604661089228, + "learning_rate": 3.949700753523344e-07, + "loss": 0.1118, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1087367981672287, + "step": 6285, + "valid_targets_mean": 1543.1, + "valid_targets_min": 704 + }, + { + "epoch": 6.607142857142857, + "grad_norm": 0.7499389879872029, + "learning_rate": 3.8467773713707134e-07, + "loss": 0.1101, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0929175540804863, + "step": 6290, + "valid_targets_mean": 1300.1, + "valid_targets_min": 722 + }, + { + "epoch": 6.612394957983193, + "grad_norm": 0.7928586147639457, + "learning_rate": 3.7451997468632486e-07, + "loss": 0.1076, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10093091428279877, + "step": 6295, + "valid_targets_mean": 1401.3, + "valid_targets_min": 642 + }, + { + "epoch": 6.617647058823529, + "grad_norm": 0.9017571609664792, + "learning_rate": 3.6449685768993327e-07, + "loss": 0.1058, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11259915679693222, + "step": 6300, + "valid_targets_mean": 1436.8, + "valid_targets_min": 518 + }, + { + "epoch": 6.6228991596638656, + "grad_norm": 0.8365779847032611, + "learning_rate": 3.5460845491396944e-07, + "loss": 0.1145, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12376931309700012, + "step": 6305, + "valid_targets_mean": 1531.6, + "valid_targets_min": 728 + }, + { + "epoch": 6.628151260504202, + "grad_norm": 0.889104983252716, + "learning_rate": 3.448548342002589e-07, + "loss": 0.1106, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1163712590932846, + "step": 6310, + "valid_targets_mean": 1469.6, + "valid_targets_min": 764 + }, + { + "epoch": 6.633403361344538, + "grad_norm": 0.8740557078182234, + "learning_rate": 3.352360624659312e-07, + "loss": 0.1176, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12843522429466248, + "step": 6315, + "valid_targets_mean": 1437.8, + "valid_targets_min": 818 + }, + { + "epoch": 6.6386554621848735, + "grad_norm": 0.8792645901441288, + "learning_rate": 3.2575220570294276e-07, + "loss": 0.1102, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11173952370882034, + "step": 6320, + "valid_targets_mean": 1327.3, + "valid_targets_min": 625 + }, + { + "epoch": 6.64390756302521, + "grad_norm": 0.8115595326058354, + "learning_rate": 3.164033289776369e-07, + "loss": 0.1138, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12014767527580261, + "step": 6325, + "valid_targets_mean": 1685.2, + "valid_targets_min": 790 + }, + { + "epoch": 6.649159663865547, + "grad_norm": 0.9521276969718082, + "learning_rate": 3.071894964302935e-07, + "loss": 0.113, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12036529183387756, + "step": 6330, + "valid_targets_mean": 1595.3, + "valid_targets_min": 891 + }, + { + "epoch": 6.654411764705882, + "grad_norm": 0.7903280323515541, + "learning_rate": 2.981107712746867e-07, + "loss": 0.1071, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09706208854913712, + "step": 6335, + "valid_targets_mean": 1381.1, + "valid_targets_min": 719 + }, + { + "epoch": 6.659663865546219, + "grad_norm": 0.8355498112239595, + "learning_rate": 2.891672157976522e-07, + "loss": 0.1063, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10185357928276062, + "step": 6340, + "valid_targets_mean": 1345.7, + "valid_targets_min": 657 + }, + { + "epoch": 6.6649159663865545, + "grad_norm": 0.8948565870788178, + "learning_rate": 2.803588913586608e-07, + "loss": 0.1052, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10712474584579468, + "step": 6345, + "valid_targets_mean": 1342.1, + "valid_targets_min": 783 + }, + { + "epoch": 6.670168067226891, + "grad_norm": 0.8221625640757199, + "learning_rate": 2.716858583894033e-07, + "loss": 0.1075, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10669823735952377, + "step": 6350, + "valid_targets_mean": 1450.6, + "valid_targets_min": 629 + }, + { + "epoch": 6.675420168067227, + "grad_norm": 0.8413623877263701, + "learning_rate": 2.6314817639335964e-07, + "loss": 0.109, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11155045032501221, + "step": 6355, + "valid_targets_mean": 1461.3, + "valid_targets_min": 678 + }, + { + "epoch": 6.680672268907563, + "grad_norm": 0.8587976871867034, + "learning_rate": 2.547459039454103e-07, + "loss": 0.1128, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.120185486972332, + "step": 6360, + "valid_targets_mean": 1723.1, + "valid_targets_min": 1075 + }, + { + "epoch": 6.685924369747899, + "grad_norm": 0.92862789354394, + "learning_rate": 2.4647909869142117e-07, + "loss": 0.1139, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1129080206155777, + "step": 6365, + "valid_targets_mean": 1669.1, + "valid_targets_min": 816 + }, + { + "epoch": 6.6911764705882355, + "grad_norm": 0.8365500928151788, + "learning_rate": 2.3834781734784817e-07, + "loss": 0.1094, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11981870979070663, + "step": 6370, + "valid_targets_mean": 1521.4, + "valid_targets_min": 957 + }, + { + "epoch": 6.696428571428571, + "grad_norm": 0.8689676540452689, + "learning_rate": 2.3035211570135995e-07, + "loss": 0.1085, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09756392240524292, + "step": 6375, + "valid_targets_mean": 1282.1, + "valid_targets_min": 643 + }, + { + "epoch": 6.701680672268908, + "grad_norm": 0.9369896336428621, + "learning_rate": 2.224920486084403e-07, + "loss": 0.1135, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10868951678276062, + "step": 6380, + "valid_targets_mean": 1499.7, + "valid_targets_min": 726 + }, + { + "epoch": 6.706932773109243, + "grad_norm": 0.8236205446292434, + "learning_rate": 2.1476766999502408e-07, + "loss": 0.1034, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11456996202468872, + "step": 6385, + "valid_targets_mean": 1621.1, + "valid_targets_min": 705 + }, + { + "epoch": 6.71218487394958, + "grad_norm": 0.8914772064174625, + "learning_rate": 2.071790328561152e-07, + "loss": 0.1056, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11084552109241486, + "step": 6390, + "valid_targets_mean": 1390.9, + "valid_targets_min": 700 + }, + { + "epoch": 6.717436974789916, + "grad_norm": 0.847420104124652, + "learning_rate": 1.997261892554403e-07, + "loss": 0.0992, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09959986060857773, + "step": 6395, + "valid_targets_mean": 1254.4, + "valid_targets_min": 627 + }, + { + "epoch": 6.722689075630252, + "grad_norm": 0.874119271608596, + "learning_rate": 1.9240919032506688e-07, + "loss": 0.1089, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10325537621974945, + "step": 6400, + "valid_targets_mean": 1479.2, + "valid_targets_min": 817 + }, + { + "epoch": 6.727941176470588, + "grad_norm": 0.8485613033201405, + "learning_rate": 1.8522808626507683e-07, + "loss": 0.1064, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11246100813150406, + "step": 6405, + "valid_targets_mean": 1464.4, + "valid_targets_min": 974 + }, + { + "epoch": 6.733193277310924, + "grad_norm": 0.8500768031572533, + "learning_rate": 1.781829263432111e-07, + "loss": 0.1057, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10820727050304413, + "step": 6410, + "valid_targets_mean": 1381.2, + "valid_targets_min": 657 + }, + { + "epoch": 6.73844537815126, + "grad_norm": 1.0070862147853497, + "learning_rate": 1.7127375889452569e-07, + "loss": 0.1097, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10374858230352402, + "step": 6415, + "valid_targets_mean": 1486.0, + "valid_targets_min": 746 + }, + { + "epoch": 6.743697478991597, + "grad_norm": 0.9783876731250509, + "learning_rate": 1.6450063132107396e-07, + "loss": 0.1081, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11519736051559448, + "step": 6420, + "valid_targets_mean": 1459.7, + "valid_targets_min": 739 + }, + { + "epoch": 6.748949579831933, + "grad_norm": 0.8259991898073508, + "learning_rate": 1.5786359009156928e-07, + "loss": 0.1044, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09908154606819153, + "step": 6425, + "valid_targets_mean": 1397.0, + "valid_targets_min": 682 + }, + { + "epoch": 6.754201680672269, + "grad_norm": 0.8592177771547324, + "learning_rate": 1.5136268074107398e-07, + "loss": 0.1029, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10556816309690475, + "step": 6430, + "valid_targets_mean": 1288.8, + "valid_targets_min": 703 + }, + { + "epoch": 6.759453781512605, + "grad_norm": 0.876887343291053, + "learning_rate": 1.44997947870682e-07, + "loss": 0.1128, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11252713203430176, + "step": 6435, + "valid_targets_mean": 1446.1, + "valid_targets_min": 864 + }, + { + "epoch": 6.764705882352941, + "grad_norm": 0.9653593171457929, + "learning_rate": 1.3876943514721465e-07, + "loss": 0.1151, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14397484064102173, + "step": 6440, + "valid_targets_mean": 1673.2, + "valid_targets_min": 734 + }, + { + "epoch": 6.769957983193278, + "grad_norm": 0.8493841465052333, + "learning_rate": 1.3267718530292296e-07, + "loss": 0.1042, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10939159989356995, + "step": 6445, + "valid_targets_mean": 1598.7, + "valid_targets_min": 607 + }, + { + "epoch": 6.775210084033613, + "grad_norm": 0.821915166356728, + "learning_rate": 1.267212401351925e-07, + "loss": 0.1029, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10267669707536697, + "step": 6450, + "valid_targets_mean": 1445.2, + "valid_targets_min": 551 + }, + { + "epoch": 6.78046218487395, + "grad_norm": 0.9162688760398915, + "learning_rate": 1.2090164050625907e-07, + "loss": 0.1092, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11637894809246063, + "step": 6455, + "valid_targets_mean": 1552.2, + "valid_targets_min": 791 + }, + { + "epoch": 6.785714285714286, + "grad_norm": 0.8967489554798673, + "learning_rate": 1.1521842634292013e-07, + "loss": 0.1055, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10807375609874725, + "step": 6460, + "valid_targets_mean": 1511.6, + "valid_targets_min": 825 + }, + { + "epoch": 6.790966386554622, + "grad_norm": 0.8909809447006225, + "learning_rate": 1.0967163663627044e-07, + "loss": 0.1008, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10812873393297195, + "step": 6465, + "valid_targets_mean": 1489.3, + "valid_targets_min": 859 + }, + { + "epoch": 6.796218487394958, + "grad_norm": 0.8597923475845829, + "learning_rate": 1.0426130944143353e-07, + "loss": 0.0978, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09637298434972763, + "step": 6470, + "valid_targets_mean": 1356.9, + "valid_targets_min": 737 + }, + { + "epoch": 6.801470588235294, + "grad_norm": 0.8605974789325253, + "learning_rate": 9.898748187729513e-08, + "loss": 0.111, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09894619882106781, + "step": 6475, + "valid_targets_mean": 1359.9, + "valid_targets_min": 791 + }, + { + "epoch": 6.80672268907563, + "grad_norm": 0.9100875928994199, + "learning_rate": 9.385019012625007e-08, + "loss": 0.1135, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11625594645738602, + "step": 6480, + "valid_targets_mean": 1443.4, + "valid_targets_min": 724 + }, + { + "epoch": 6.811974789915967, + "grad_norm": 0.8583853259041662, + "learning_rate": 8.884946943395811e-08, + "loss": 0.1104, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11173100769519806, + "step": 6485, + "valid_targets_mean": 1376.3, + "valid_targets_min": 944 + }, + { + "epoch": 6.817226890756302, + "grad_norm": 0.7696906815936799, + "learning_rate": 8.398535410910402e-08, + "loss": 0.1038, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09793375432491302, + "step": 6490, + "valid_targets_mean": 1597.7, + "valid_targets_min": 802 + }, + { + "epoch": 6.822478991596639, + "grad_norm": 0.7990711794579531, + "learning_rate": 7.925787752314674e-08, + "loss": 0.1124, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09811538457870483, + "step": 6495, + "valid_targets_mean": 1419.2, + "valid_targets_min": 740 + }, + { + "epoch": 6.8277310924369745, + "grad_norm": 0.7717945193131686, + "learning_rate": 7.466707211010838e-08, + "loss": 0.108, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10290801525115967, + "step": 6500, + "valid_targets_mean": 1570.5, + "valid_targets_min": 881 + }, + { + "epoch": 6.832983193277311, + "grad_norm": 0.9330044417782807, + "learning_rate": 7.02129693663478e-08, + "loss": 0.102, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10135114192962646, + "step": 6505, + "valid_targets_mean": 1177.1, + "valid_targets_min": 636 + }, + { + "epoch": 6.838235294117647, + "grad_norm": 0.885799823289419, + "learning_rate": 6.589559985033189e-08, + "loss": 0.1051, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10052669793367386, + "step": 6510, + "valid_targets_mean": 1280.1, + "valid_targets_min": 814 + }, + { + "epoch": 6.843487394957983, + "grad_norm": 0.8895050648007775, + "learning_rate": 6.171499318244234e-08, + "loss": 0.0972, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0963287502527237, + "step": 6515, + "valid_targets_mean": 1253.6, + "valid_targets_min": 604 + }, + { + "epoch": 6.848739495798319, + "grad_norm": 0.8626286788780626, + "learning_rate": 5.767117804476696e-08, + "loss": 0.108, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0979156345129013, + "step": 6520, + "valid_targets_mean": 1232.8, + "valid_targets_min": 661 + }, + { + "epoch": 6.8539915966386555, + "grad_norm": 0.8311072710033767, + "learning_rate": 5.376418218089541e-08, + "loss": 0.109, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1046762764453888, + "step": 6525, + "valid_targets_mean": 1484.8, + "valid_targets_min": 728 + }, + { + "epoch": 6.859243697478991, + "grad_norm": 0.9079288548187959, + "learning_rate": 4.99940323957393e-08, + "loss": 0.1056, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11257081478834152, + "step": 6530, + "valid_targets_mean": 1383.6, + "valid_targets_min": 692 + }, + { + "epoch": 6.864495798319328, + "grad_norm": 0.8918440819640617, + "learning_rate": 4.63607545553435e-08, + "loss": 0.1065, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10769190639257431, + "step": 6535, + "valid_targets_mean": 1386.2, + "valid_targets_min": 840 + }, + { + "epoch": 6.869747899159664, + "grad_norm": 0.9081288698653714, + "learning_rate": 4.2864373586706254e-08, + "loss": 0.1084, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10562418401241302, + "step": 6540, + "valid_targets_mean": 1375.6, + "valid_targets_min": 772 + }, + { + "epoch": 6.875, + "grad_norm": 0.8331522601558252, + "learning_rate": 3.950491347761487e-08, + "loss": 0.1045, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10698384046554565, + "step": 6545, + "valid_targets_mean": 1612.4, + "valid_targets_min": 670 + }, + { + "epoch": 6.880252100840336, + "grad_norm": 0.8223352044912656, + "learning_rate": 3.628239727647254e-08, + "loss": 0.1039, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10564574599266052, + "step": 6550, + "valid_targets_mean": 1427.0, + "valid_targets_min": 750 + }, + { + "epoch": 6.885504201680672, + "grad_norm": 1.2026759527578401, + "learning_rate": 3.319684709215176e-08, + "loss": 0.1063, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10793040692806244, + "step": 6555, + "valid_targets_mean": 1479.3, + "valid_targets_min": 766 + }, + { + "epoch": 6.890756302521009, + "grad_norm": 0.8039951616902973, + "learning_rate": 3.024828409383007e-08, + "loss": 0.1018, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09126448631286621, + "step": 6560, + "valid_targets_mean": 1241.5, + "valid_targets_min": 729 + }, + { + "epoch": 6.8960084033613445, + "grad_norm": 0.8938242214668102, + "learning_rate": 2.743672851085233e-08, + "loss": 0.1082, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11531618982553482, + "step": 6565, + "valid_targets_mean": 1410.9, + "valid_targets_min": 682 + }, + { + "epoch": 6.901260504201681, + "grad_norm": 0.891140302112469, + "learning_rate": 2.4762199632588634e-08, + "loss": 0.1181, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11160510778427124, + "step": 6570, + "valid_targets_mean": 1569.1, + "valid_targets_min": 738 + }, + { + "epoch": 6.906512605042017, + "grad_norm": 0.8886137842875292, + "learning_rate": 2.2224715808309983e-08, + "loss": 0.1078, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10890690982341766, + "step": 6575, + "valid_targets_mean": 1378.0, + "valid_targets_min": 731 + }, + { + "epoch": 6.911764705882353, + "grad_norm": 0.9367326463088681, + "learning_rate": 1.9824294447043923e-08, + "loss": 0.1115, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13127145171165466, + "step": 6580, + "valid_targets_mean": 1620.0, + "valid_targets_min": 748 + }, + { + "epoch": 6.917016806722689, + "grad_norm": 0.838793196574803, + "learning_rate": 1.7560952017481313e-08, + "loss": 0.1025, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09811349958181381, + "step": 6585, + "valid_targets_mean": 1355.1, + "valid_targets_min": 564 + }, + { + "epoch": 6.9222689075630255, + "grad_norm": 0.8347467550105157, + "learning_rate": 1.5434704047836424e-08, + "loss": 0.1027, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09899817407131195, + "step": 6590, + "valid_targets_mean": 1419.1, + "valid_targets_min": 651 + }, + { + "epoch": 6.927521008403361, + "grad_norm": 0.8905919808272537, + "learning_rate": 1.344556512576256e-08, + "loss": 0.1108, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10358569025993347, + "step": 6595, + "valid_targets_mean": 1291.7, + "valid_targets_min": 687 + }, + { + "epoch": 6.932773109243698, + "grad_norm": 0.8193427692652885, + "learning_rate": 1.1593548898236606e-08, + "loss": 0.1027, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09667745232582092, + "step": 6600, + "valid_targets_mean": 1236.8, + "valid_targets_min": 703 + }, + { + "epoch": 6.938025210084033, + "grad_norm": 0.8054209308544474, + "learning_rate": 9.878668071474639e-09, + "loss": 0.101, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08912120014429092, + "step": 6605, + "valid_targets_mean": 1258.9, + "valid_targets_min": 522 + }, + { + "epoch": 6.94327731092437, + "grad_norm": 0.8379632670512256, + "learning_rate": 8.3009344108409e-09, + "loss": 0.1071, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10500848293304443, + "step": 6610, + "valid_targets_mean": 1495.5, + "valid_targets_min": 764 + }, + { + "epoch": 6.948529411764706, + "grad_norm": 0.9047510484875828, + "learning_rate": 6.860358740763406e-09, + "loss": 0.1143, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12173473089933395, + "step": 6615, + "valid_targets_mean": 1421.0, + "valid_targets_min": 548 + }, + { + "epoch": 6.953781512605042, + "grad_norm": 0.8386152042305247, + "learning_rate": 5.55695094467179e-09, + "loss": 0.1013, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11426173895597458, + "step": 6620, + "valid_targets_mean": 1487.2, + "valid_targets_min": 694 + }, + { + "epoch": 6.959033613445378, + "grad_norm": 0.8298195930802489, + "learning_rate": 4.3907199649151355e-09, + "loss": 0.105, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10774379968643188, + "step": 6625, + "valid_targets_mean": 1512.4, + "valid_targets_min": 823 + }, + { + "epoch": 6.964285714285714, + "grad_norm": 0.7758294188223108, + "learning_rate": 3.361673802708687e-09, + "loss": 0.0926, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08553959429264069, + "step": 6630, + "valid_targets_mean": 1375.4, + "valid_targets_min": 595 + }, + { + "epoch": 6.96953781512605, + "grad_norm": 0.9086042968946347, + "learning_rate": 2.469819518080563e-09, + "loss": 0.1032, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11077478528022766, + "step": 6635, + "valid_targets_mean": 1401.2, + "valid_targets_min": 693 + }, + { + "epoch": 6.974789915966387, + "grad_norm": 1.0872068857891495, + "learning_rate": 1.7151632298140209e-09, + "loss": 0.1005, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09122096002101898, + "step": 6640, + "valid_targets_mean": 1185.6, + "valid_targets_min": 720 + }, + { + "epoch": 6.980042016806722, + "grad_norm": 0.9264996959156637, + "learning_rate": 1.0977101154163727e-09, + "loss": 0.102, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08891530334949493, + "step": 6645, + "valid_targets_mean": 1364.2, + "valid_targets_min": 685 + }, + { + "epoch": 6.985294117647059, + "grad_norm": 0.8282065868459698, + "learning_rate": 6.174644110767958e-10, + "loss": 0.0982, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0922815352678299, + "step": 6650, + "valid_targets_mean": 1345.2, + "valid_targets_min": 658 + }, + { + "epoch": 6.990546218487395, + "grad_norm": 0.7963997364292627, + "learning_rate": 2.744294116419077e-10, + "loss": 0.1045, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09688857197761536, + "step": 6655, + "valid_targets_mean": 1431.4, + "valid_targets_min": 686 + }, + { + "epoch": 6.995798319327731, + "grad_norm": 0.8692235718392078, + "learning_rate": 6.860747058468064e-11, + "loss": 0.1056, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11209136247634888, + "step": 6660, + "valid_targets_mean": 1505.8, + "valid_targets_min": 713 + }, + { + "epoch": 7.0, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0974183976650238, + "step": 6664, + "total_flos": 1189064928198656.0, + "train_loss": 0.2180497848695996, + "train_runtime": 25724.8893, + "train_samples_per_second": 4.145, + "train_steps_per_second": 0.259, + "valid_targets_mean": 1721.1, + "valid_targets_min": 760 + } + ], + "logging_steps": 5, + "max_steps": 6664, + "num_input_tokens_seen": 0, + "num_train_epochs": 7, + "save_steps": 200, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": true, + "should_training_stop": true + }, + "attributes": {} + } + }, + "total_flos": 1189064928198656.0, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +}