diff --git "a/trainer_state.json" "b/trainer_state.json" new file mode 100644--- /dev/null +++ "b/trainer_state.json" @@ -0,0 +1,3654 @@ +{ + "best_metric": 0.3097, + "best_model_checkpoint": "ms-cond-detr-res-50-vehicles/checkpoint-131385", + "epoch": 60.0, + "eval_steps": 500, + "global_step": 138300, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.21691973969631237, + "grad_norm": 32948.171875, + "learning_rate": 9.999685192743662e-05, + "loss": 7.6906, + "step": 500 + }, + { + "epoch": 0.43383947939262474, + "grad_norm": 8056.21142578125, + "learning_rate": 9.998728034076959e-05, + "loss": 2.3313, + "step": 1000 + }, + { + "epoch": 0.6507592190889371, + "grad_norm": 17431.4765625, + "learning_rate": 9.997124764767083e-05, + "loss": 2.1856, + "step": 1500 + }, + { + "epoch": 0.8676789587852495, + "grad_norm": 17146.232421875, + "learning_rate": 9.994876864856252e-05, + "loss": 2.051, + "step": 2000 + }, + { + "epoch": 1.0, + "eval_loss": 1.895993709564209, + "eval_map": 0.0623, + "eval_map_50": 0.1484, + "eval_map_75": 0.0432, + "eval_map_bus": 0.0489, + "eval_map_car": 0.0878, + "eval_map_container": 0.0856, + "eval_map_large": 0.1451, + "eval_map_medium": 0.0546, + "eval_map_motorbike": 0.0269, + "eval_map_small": 0.0085, + "eval_mar_1": 0.0883, + "eval_mar_10": 0.2294, + "eval_mar_100": 0.2984, + "eval_mar_100_bus": 0.3264, + "eval_mar_100_car": 0.3206, + "eval_mar_100_container": 0.3323, + "eval_mar_100_motorbike": 0.2141, + "eval_mar_large": 0.4778, + "eval_mar_medium": 0.2854, + "eval_mar_small": 0.0421, + "eval_runtime": 114.5232, + "eval_samples_per_second": 20.109, + "eval_steps_per_second": 2.515, + "step": 2305 + }, + { + "epoch": 1.0845986984815619, + "grad_norm": 14355.5908203125, + "learning_rate": 9.991984624324235e-05, + "loss": 1.9627, + "step": 2500 + }, + { + "epoch": 1.3015184381778742, + "grad_norm": 5871.64599609375, + "learning_rate": 9.988456131077249e-05, + "loss": 1.9168, + "step": 3000 + }, + { + "epoch": 1.5184381778741867, + "grad_norm": 4061.07080078125, + "learning_rate": 9.984277698186814e-05, + "loss": 1.8332, + "step": 3500 + }, + { + "epoch": 1.735357917570499, + "grad_norm": 4107.30517578125, + "learning_rate": 9.979456291970887e-05, + "loss": 1.7907, + "step": 4000 + }, + { + "epoch": 1.9522776572668112, + "grad_norm": 6267.9453125, + "learning_rate": 9.973992534392322e-05, + "loss": 1.7617, + "step": 4500 + }, + { + "epoch": 2.0, + "eval_loss": 1.6729236841201782, + "eval_map": 0.1472, + "eval_map_50": 0.3286, + "eval_map_75": 0.1129, + "eval_map_bus": 0.1128, + "eval_map_car": 0.2083, + "eval_map_container": 0.1971, + "eval_map_large": 0.3455, + "eval_map_medium": 0.1211, + "eval_map_motorbike": 0.0705, + "eval_map_small": 0.0156, + "eval_mar_1": 0.1272, + "eval_mar_10": 0.3047, + "eval_mar_100": 0.3573, + "eval_mar_100_bus": 0.4427, + "eval_mar_100_car": 0.3575, + "eval_mar_100_container": 0.3994, + "eval_mar_100_motorbike": 0.2297, + "eval_mar_large": 0.6163, + "eval_mar_medium": 0.3404, + "eval_mar_small": 0.0626, + "eval_runtime": 111.0496, + "eval_samples_per_second": 20.738, + "eval_steps_per_second": 2.593, + "step": 4610 + }, + { + "epoch": 2.1691973969631237, + "grad_norm": 6151.71826171875, + "learning_rate": 9.967887130277497e-05, + "loss": 1.7034, + "step": 5000 + }, + { + "epoch": 2.3861171366594363, + "grad_norm": 13430.7021484375, + "learning_rate": 9.961140867225379e-05, + "loss": 1.6812, + "step": 5500 + }, + { + "epoch": 2.6030368763557483, + "grad_norm": 23429.322265625, + "learning_rate": 9.953754615505938e-05, + "loss": 1.6754, + "step": 6000 + }, + { + "epoch": 2.819956616052061, + "grad_norm": 5950.3984375, + "learning_rate": 9.94572932794787e-05, + "loss": 1.6489, + "step": 6500 + }, + { + "epoch": 3.0, + "eval_loss": 1.5874069929122925, + "eval_map": 0.1778, + "eval_map_50": 0.3853, + "eval_map_75": 0.1458, + "eval_map_bus": 0.1352, + "eval_map_car": 0.2354, + "eval_map_container": 0.2234, + "eval_map_large": 0.3729, + "eval_map_medium": 0.1542, + "eval_map_motorbike": 0.1172, + "eval_map_small": 0.0131, + "eval_mar_1": 0.1417, + "eval_mar_10": 0.3206, + "eval_mar_100": 0.365, + "eval_mar_100_bus": 0.4474, + "eval_mar_100_car": 0.3691, + "eval_mar_100_container": 0.3944, + "eval_mar_100_motorbike": 0.2491, + "eval_mar_large": 0.6265, + "eval_mar_medium": 0.343, + "eval_mar_small": 0.0747, + "eval_runtime": 111.1265, + "eval_samples_per_second": 20.724, + "eval_steps_per_second": 2.592, + "step": 6915 + }, + { + "epoch": 3.036876355748373, + "grad_norm": 8822.9736328125, + "learning_rate": 9.937084002387407e-05, + "loss": 1.6342, + "step": 7000 + }, + { + "epoch": 3.2537960954446854, + "grad_norm": 17186.669921875, + "learning_rate": 9.927785103843946e-05, + "loss": 1.6239, + "step": 7500 + }, + { + "epoch": 3.470715835140998, + "grad_norm": 7216.52880859375, + "learning_rate": 9.917850519536694e-05, + "loss": 1.632, + "step": 8000 + }, + { + "epoch": 3.6876355748373104, + "grad_norm": 15494.7607421875, + "learning_rate": 9.907281531030016e-05, + "loss": 1.6064, + "step": 8500 + }, + { + "epoch": 3.9045553145336225, + "grad_norm": 8969.22265625, + "learning_rate": 9.896102536613032e-05, + "loss": 1.5998, + "step": 9000 + }, + { + "epoch": 4.0, + "eval_loss": 1.552794337272644, + "eval_map": 0.1929, + "eval_map_50": 0.4053, + "eval_map_75": 0.1639, + "eval_map_bus": 0.1675, + "eval_map_car": 0.2425, + "eval_map_container": 0.2398, + "eval_map_large": 0.4082, + "eval_map_medium": 0.1638, + "eval_map_motorbike": 0.1219, + "eval_map_small": 0.0144, + "eval_mar_1": 0.1504, + "eval_mar_10": 0.3294, + "eval_mar_100": 0.3756, + "eval_mar_100_bus": 0.4699, + "eval_mar_100_car": 0.3745, + "eval_mar_100_container": 0.4104, + "eval_mar_100_motorbike": 0.2477, + "eval_mar_large": 0.6317, + "eval_mar_medium": 0.3567, + "eval_mar_small": 0.07, + "eval_runtime": 109.6617, + "eval_samples_per_second": 21.001, + "eval_steps_per_second": 2.626, + "step": 9220 + }, + { + "epoch": 4.1214750542299345, + "grad_norm": 15890.3359375, + "learning_rate": 9.884270173273174e-05, + "loss": 1.5972, + "step": 9500 + }, + { + "epoch": 4.3383947939262475, + "grad_norm": 26849.8046875, + "learning_rate": 9.871807737608682e-05, + "loss": 1.5947, + "step": 10000 + }, + { + "epoch": 4.55531453362256, + "grad_norm": 17527.794921875, + "learning_rate": 9.858716837277515e-05, + "loss": 1.5719, + "step": 10500 + }, + { + "epoch": 4.7722342733188725, + "grad_norm": 27437.568359375, + "learning_rate": 9.844999161009761e-05, + "loss": 1.5632, + "step": 11000 + }, + { + "epoch": 4.989154013015185, + "grad_norm": 8879.484375, + "learning_rate": 9.830685786294999e-05, + "loss": 1.552, + "step": 11500 + }, + { + "epoch": 5.0, + "eval_loss": 1.52571439743042, + "eval_map": 0.2026, + "eval_map_50": 0.4239, + "eval_map_75": 0.1723, + "eval_map_bus": 0.1926, + "eval_map_car": 0.2487, + "eval_map_container": 0.2421, + "eval_map_large": 0.4281, + "eval_map_medium": 0.1671, + "eval_map_motorbike": 0.1269, + "eval_map_small": 0.0163, + "eval_mar_1": 0.1528, + "eval_mar_10": 0.3307, + "eval_mar_100": 0.3791, + "eval_mar_100_bus": 0.4657, + "eval_mar_100_car": 0.3765, + "eval_mar_100_container": 0.4165, + "eval_mar_100_motorbike": 0.2577, + "eval_mar_large": 0.6259, + "eval_mar_medium": 0.3542, + "eval_mar_small": 0.0996, + "eval_runtime": 113.4379, + "eval_samples_per_second": 20.302, + "eval_steps_per_second": 2.539, + "step": 11525 + }, + { + "epoch": 5.206073752711497, + "grad_norm": 16417.5234375, + "learning_rate": 9.815721191945502e-05, + "loss": 1.5611, + "step": 12000 + }, + { + "epoch": 5.422993492407809, + "grad_norm": 5270.97802734375, + "learning_rate": 9.800135368110628e-05, + "loss": 1.551, + "step": 12500 + }, + { + "epoch": 5.639913232104122, + "grad_norm": 12491.1376953125, + "learning_rate": 9.783930325366346e-05, + "loss": 1.5441, + "step": 13000 + }, + { + "epoch": 5.856832971800434, + "grad_norm": 6461.4892578125, + "learning_rate": 9.767176669323077e-05, + "loss": 1.5478, + "step": 13500 + }, + { + "epoch": 6.0, + "eval_loss": 1.5407626628875732, + "eval_map": 0.1996, + "eval_map_50": 0.424, + "eval_map_75": 0.164, + "eval_map_bus": 0.1989, + "eval_map_car": 0.2419, + "eval_map_container": 0.2416, + "eval_map_large": 0.4241, + "eval_map_medium": 0.1588, + "eval_map_motorbike": 0.1162, + "eval_map_small": 0.0161, + "eval_mar_1": 0.1529, + "eval_mar_10": 0.3225, + "eval_mar_100": 0.37, + "eval_mar_100_bus": 0.4587, + "eval_mar_100_car": 0.3579, + "eval_mar_100_container": 0.4178, + "eval_mar_100_motorbike": 0.2455, + "eval_mar_large": 0.6196, + "eval_mar_medium": 0.3413, + "eval_mar_small": 0.0782, + "eval_runtime": 112.8265, + "eval_samples_per_second": 20.412, + "eval_steps_per_second": 2.553, + "step": 13830 + }, + { + "epoch": 6.073752711496746, + "grad_norm": 4583.74365234375, + "learning_rate": 9.749741995141488e-05, + "loss": 1.5571, + "step": 14000 + }, + { + "epoch": 6.290672451193059, + "grad_norm": 6658.3671875, + "learning_rate": 9.731694602810796e-05, + "loss": 1.5572, + "step": 14500 + }, + { + "epoch": 6.507592190889371, + "grad_norm": 7703.2578125, + "learning_rate": 9.713036820450053e-05, + "loss": 1.547, + "step": 15000 + }, + { + "epoch": 6.724511930585683, + "grad_norm": 16854.68359375, + "learning_rate": 9.693771054918806e-05, + "loss": 1.5371, + "step": 15500 + }, + { + "epoch": 6.941431670281996, + "grad_norm": 22233.17578125, + "learning_rate": 9.673899791506617e-05, + "loss": 1.5026, + "step": 16000 + }, + { + "epoch": 7.0, + "eval_loss": 1.473095178604126, + "eval_map": 0.2228, + "eval_map_50": 0.4631, + "eval_map_75": 0.1881, + "eval_map_bus": 0.2327, + "eval_map_car": 0.2595, + "eval_map_container": 0.2596, + "eval_map_large": 0.4556, + "eval_map_medium": 0.1862, + "eval_map_motorbike": 0.1395, + "eval_map_small": 0.0224, + "eval_mar_1": 0.1628, + "eval_mar_10": 0.3411, + "eval_mar_100": 0.3918, + "eval_mar_100_bus": 0.4761, + "eval_mar_100_car": 0.3906, + "eval_mar_100_container": 0.4347, + "eval_mar_100_motorbike": 0.266, + "eval_mar_large": 0.6375, + "eval_mar_medium": 0.3684, + "eval_mar_small": 0.1103, + "eval_runtime": 110.9297, + "eval_samples_per_second": 20.761, + "eval_steps_per_second": 2.596, + "step": 16135 + }, + { + "epoch": 7.158351409978308, + "grad_norm": 19154.3046875, + "learning_rate": 9.653425593612456e-05, + "loss": 1.5021, + "step": 16500 + }, + { + "epoch": 7.375271149674621, + "grad_norm": 9528.267578125, + "learning_rate": 9.63235110241402e-05, + "loss": 1.5002, + "step": 17000 + }, + { + "epoch": 7.592190889370933, + "grad_norm": 15413.521484375, + "learning_rate": 9.610679036527032e-05, + "loss": 1.4903, + "step": 17500 + }, + { + "epoch": 7.809110629067245, + "grad_norm": 8371.5927734375, + "learning_rate": 9.588457317037219e-05, + "loss": 1.4959, + "step": 18000 + }, + { + "epoch": 8.0, + "eval_loss": 1.450566291809082, + "eval_map": 0.2326, + "eval_map_50": 0.4723, + "eval_map_75": 0.2016, + "eval_map_bus": 0.2383, + "eval_map_car": 0.2738, + "eval_map_container": 0.2721, + "eval_map_large": 0.4815, + "eval_map_medium": 0.1948, + "eval_map_motorbike": 0.146, + "eval_map_small": 0.02, + "eval_mar_1": 0.1679, + "eval_mar_10": 0.3488, + "eval_mar_100": 0.3983, + "eval_mar_100_bus": 0.4799, + "eval_mar_100_car": 0.4008, + "eval_mar_100_container": 0.4372, + "eval_mar_100_motorbike": 0.2752, + "eval_mar_large": 0.6462, + "eval_mar_medium": 0.3758, + "eval_mar_small": 0.1042, + "eval_runtime": 111.6404, + "eval_samples_per_second": 20.629, + "eval_steps_per_second": 2.58, + "step": 18440 + }, + { + "epoch": 8.026030368763557, + "grad_norm": 7741.39892578125, + "learning_rate": 9.565599746504495e-05, + "loss": 1.4911, + "step": 18500 + }, + { + "epoch": 8.242950108459869, + "grad_norm": 12290.6552734375, + "learning_rate": 9.542153212228251e-05, + "loss": 1.4937, + "step": 19000 + }, + { + "epoch": 8.459869848156183, + "grad_norm": 11567.1787109375, + "learning_rate": 9.518120738818473e-05, + "loss": 1.5119, + "step": 19500 + }, + { + "epoch": 8.676789587852495, + "grad_norm": 25120.248046875, + "learning_rate": 9.493555236671335e-05, + "loss": 1.4841, + "step": 20000 + }, + { + "epoch": 8.893709327548807, + "grad_norm": 6134.39599609375, + "learning_rate": 9.468361416878137e-05, + "loss": 1.4923, + "step": 20500 + }, + { + "epoch": 9.0, + "eval_loss": 1.4423633813858032, + "eval_map": 0.2329, + "eval_map_50": 0.4795, + "eval_map_75": 0.2007, + "eval_map_bus": 0.2454, + "eval_map_car": 0.27, + "eval_map_container": 0.2706, + "eval_map_large": 0.4755, + "eval_map_medium": 0.194, + "eval_map_motorbike": 0.1455, + "eval_map_small": 0.025, + "eval_mar_1": 0.1668, + "eval_mar_10": 0.3462, + "eval_mar_100": 0.3973, + "eval_mar_100_bus": 0.4772, + "eval_mar_100_car": 0.4004, + "eval_mar_100_container": 0.4375, + "eval_mar_100_motorbike": 0.2741, + "eval_mar_large": 0.6412, + "eval_mar_medium": 0.3766, + "eval_mar_small": 0.1091, + "eval_runtime": 112.7615, + "eval_samples_per_second": 20.424, + "eval_steps_per_second": 2.554, + "step": 20745 + }, + { + "epoch": 9.11062906724512, + "grad_norm": 32511.9609375, + "learning_rate": 9.442591177115253e-05, + "loss": 1.4782, + "step": 21000 + }, + { + "epoch": 9.327548806941431, + "grad_norm": 11596.8134765625, + "learning_rate": 9.41630109812504e-05, + "loss": 1.4803, + "step": 21500 + }, + { + "epoch": 9.544468546637743, + "grad_norm": 6854.0498046875, + "learning_rate": 9.389389201412557e-05, + "loss": 1.4894, + "step": 22000 + }, + { + "epoch": 9.761388286334057, + "grad_norm": 6358.80908203125, + "learning_rate": 9.361911072169985e-05, + "loss": 1.5033, + "step": 22500 + }, + { + "epoch": 9.97830802603037, + "grad_norm": 3667.44677734375, + "learning_rate": 9.333870255084278e-05, + "loss": 1.4813, + "step": 23000 + }, + { + "epoch": 10.0, + "eval_loss": 1.441864252090454, + "eval_map": 0.2347, + "eval_map_50": 0.4795, + "eval_map_75": 0.2034, + "eval_map_bus": 0.2558, + "eval_map_car": 0.2691, + "eval_map_container": 0.2689, + "eval_map_large": 0.4789, + "eval_map_medium": 0.1962, + "eval_map_motorbike": 0.1452, + "eval_map_small": 0.0219, + "eval_mar_1": 0.1701, + "eval_mar_10": 0.3484, + "eval_mar_100": 0.3954, + "eval_mar_100_bus": 0.4847, + "eval_mar_100_car": 0.3916, + "eval_mar_100_container": 0.434, + "eval_mar_100_motorbike": 0.2714, + "eval_mar_large": 0.6499, + "eval_mar_medium": 0.3714, + "eval_mar_small": 0.0978, + "eval_runtime": 114.4896, + "eval_samples_per_second": 20.115, + "eval_steps_per_second": 2.516, + "step": 23050 + }, + { + "epoch": 10.195227765726681, + "grad_norm": 6613.9287109375, + "learning_rate": 9.305270367429292e-05, + "loss": 1.4713, + "step": 23500 + }, + { + "epoch": 10.412147505422993, + "grad_norm": 16454.421875, + "learning_rate": 9.27611509859916e-05, + "loss": 1.4608, + "step": 24000 + }, + { + "epoch": 10.629067245119305, + "grad_norm": 8706.1943359375, + "learning_rate": 9.246468171391835e-05, + "loss": 1.4732, + "step": 24500 + }, + { + "epoch": 10.845986984815617, + "grad_norm": 4838.7392578125, + "learning_rate": 9.216214586190261e-05, + "loss": 1.4833, + "step": 25000 + }, + { + "epoch": 11.0, + "eval_loss": 1.4288930892944336, + "eval_map": 0.2451, + "eval_map_50": 0.4962, + "eval_map_75": 0.2143, + "eval_map_bus": 0.2705, + "eval_map_car": 0.2791, + "eval_map_container": 0.2843, + "eval_map_large": 0.5032, + "eval_map_medium": 0.2044, + "eval_map_motorbike": 0.1465, + "eval_map_small": 0.0243, + "eval_mar_1": 0.1738, + "eval_mar_10": 0.3561, + "eval_mar_100": 0.4058, + "eval_mar_100_bus": 0.5024, + "eval_mar_100_car": 0.4023, + "eval_mar_100_container": 0.4454, + "eval_mar_100_motorbike": 0.2732, + "eval_mar_large": 0.6609, + "eval_mar_medium": 0.3869, + "eval_mar_small": 0.1005, + "eval_runtime": 111.8693, + "eval_samples_per_second": 20.587, + "eval_steps_per_second": 2.574, + "step": 25355 + }, + { + "epoch": 11.062906724511931, + "grad_norm": 5249.5126953125, + "learning_rate": 9.185417108036163e-05, + "loss": 1.4815, + "step": 25500 + }, + { + "epoch": 11.279826464208243, + "grad_norm": 7979.5078125, + "learning_rate": 9.154079709813505e-05, + "loss": 1.4599, + "step": 26000 + }, + { + "epoch": 11.496746203904555, + "grad_norm": 24827.08203125, + "learning_rate": 9.122206434056104e-05, + "loss": 1.4527, + "step": 26500 + }, + { + "epoch": 11.713665943600867, + "grad_norm": 13943.88671875, + "learning_rate": 9.08980139242614e-05, + "loss": 1.4506, + "step": 27000 + }, + { + "epoch": 11.93058568329718, + "grad_norm": 19058.4140625, + "learning_rate": 9.056868765183752e-05, + "loss": 1.444, + "step": 27500 + }, + { + "epoch": 12.0, + "eval_loss": 1.4114290475845337, + "eval_map": 0.2497, + "eval_map_50": 0.5054, + "eval_map_75": 0.2185, + "eval_map_bus": 0.2717, + "eval_map_car": 0.2836, + "eval_map_container": 0.2905, + "eval_map_large": 0.5069, + "eval_map_medium": 0.2101, + "eval_map_motorbike": 0.1532, + "eval_map_small": 0.0247, + "eval_mar_1": 0.175, + "eval_mar_10": 0.358, + "eval_mar_100": 0.4062, + "eval_mar_100_bus": 0.4934, + "eval_mar_100_car": 0.4052, + "eval_mar_100_container": 0.4483, + "eval_mar_100_motorbike": 0.278, + "eval_mar_large": 0.658, + "eval_mar_medium": 0.384, + "eval_mar_small": 0.1037, + "eval_runtime": 111.8412, + "eval_samples_per_second": 20.592, + "eval_steps_per_second": 2.575, + "step": 27660 + }, + { + "epoch": 12.147505422993492, + "grad_norm": 20425.599609375, + "learning_rate": 9.023412800647782e-05, + "loss": 1.4346, + "step": 28000 + }, + { + "epoch": 12.364425162689805, + "grad_norm": 20580.5859375, + "learning_rate": 8.989506279701155e-05, + "loss": 1.436, + "step": 28500 + }, + { + "epoch": 12.581344902386117, + "grad_norm": 5153.2529296875, + "learning_rate": 8.955017679879593e-05, + "loss": 1.4358, + "step": 29000 + }, + { + "epoch": 12.79826464208243, + "grad_norm": 20761.373046875, + "learning_rate": 8.920018881585156e-05, + "loss": 1.4389, + "step": 29500 + }, + { + "epoch": 13.0, + "eval_loss": 1.4145116806030273, + "eval_map": 0.2491, + "eval_map_50": 0.5044, + "eval_map_75": 0.2154, + "eval_map_bus": 0.2809, + "eval_map_car": 0.2703, + "eval_map_container": 0.2931, + "eval_map_large": 0.5069, + "eval_map_medium": 0.2081, + "eval_map_motorbike": 0.152, + "eval_map_small": 0.0243, + "eval_mar_1": 0.1778, + "eval_mar_10": 0.3591, + "eval_mar_100": 0.4036, + "eval_mar_100_bus": 0.5021, + "eval_mar_100_car": 0.3905, + "eval_mar_100_container": 0.4506, + "eval_mar_100_motorbike": 0.2712, + "eval_mar_large": 0.6548, + "eval_mar_medium": 0.3811, + "eval_mar_small": 0.0958, + "eval_runtime": 113.291, + "eval_samples_per_second": 20.328, + "eval_steps_per_second": 2.542, + "step": 29965 + }, + { + "epoch": 13.015184381778742, + "grad_norm": 2281.438232421875, + "learning_rate": 8.884585910276008e-05, + "loss": 1.4451, + "step": 30000 + }, + { + "epoch": 13.232104121475054, + "grad_norm": 4104.1279296875, + "learning_rate": 8.848581322428806e-05, + "loss": 1.4493, + "step": 30500 + }, + { + "epoch": 13.449023861171366, + "grad_norm": 4472.2119140625, + "learning_rate": 8.812080266430921e-05, + "loss": 1.4535, + "step": 31000 + }, + { + "epoch": 13.66594360086768, + "grad_norm": 2972.729248046875, + "learning_rate": 8.775161924175216e-05, + "loss": 1.4399, + "step": 31500 + }, + { + "epoch": 13.882863340563992, + "grad_norm": 2877.804443359375, + "learning_rate": 8.737683090425208e-05, + "loss": 1.4721, + "step": 32000 + }, + { + "epoch": 14.0, + "eval_loss": 1.425186276435852, + "eval_map": 0.2426, + "eval_map_50": 0.4967, + "eval_map_75": 0.2135, + "eval_map_bus": 0.2701, + "eval_map_car": 0.2734, + "eval_map_container": 0.2865, + "eval_map_large": 0.5026, + "eval_map_medium": 0.1982, + "eval_map_motorbike": 0.1402, + "eval_map_small": 0.0224, + "eval_mar_1": 0.1728, + "eval_mar_10": 0.3474, + "eval_mar_100": 0.3944, + "eval_mar_100_bus": 0.4776, + "eval_mar_100_car": 0.3894, + "eval_mar_100_container": 0.4408, + "eval_mar_100_motorbike": 0.27, + "eval_mar_large": 0.6479, + "eval_mar_medium": 0.3668, + "eval_mar_small": 0.1061, + "eval_runtime": 114.1204, + "eval_samples_per_second": 20.18, + "eval_steps_per_second": 2.524, + "step": 32270 + }, + { + "epoch": 14.099783080260304, + "grad_norm": 2141.58056640625, + "learning_rate": 8.699722094429873e-05, + "loss": 1.4556, + "step": 32500 + }, + { + "epoch": 14.316702819956616, + "grad_norm": 3093.70166015625, + "learning_rate": 8.661283833169138e-05, + "loss": 1.4435, + "step": 33000 + }, + { + "epoch": 14.533622559652928, + "grad_norm": 10697.4072265625, + "learning_rate": 8.622373265190294e-05, + "loss": 1.4338, + "step": 33500 + }, + { + "epoch": 14.750542299349242, + "grad_norm": 4543.31982421875, + "learning_rate": 8.582995409968335e-05, + "loss": 1.4138, + "step": 34000 + }, + { + "epoch": 14.967462039045554, + "grad_norm": 8605.0224609375, + "learning_rate": 8.543155347258457e-05, + "loss": 1.4151, + "step": 34500 + }, + { + "epoch": 15.0, + "eval_loss": 1.38901686668396, + "eval_map": 0.257, + "eval_map_50": 0.5144, + "eval_map_75": 0.2303, + "eval_map_bus": 0.2907, + "eval_map_car": 0.284, + "eval_map_container": 0.2968, + "eval_map_large": 0.5145, + "eval_map_medium": 0.2172, + "eval_map_motorbike": 0.1563, + "eval_map_small": 0.0218, + "eval_mar_1": 0.1789, + "eval_mar_10": 0.3604, + "eval_mar_100": 0.4054, + "eval_mar_100_bus": 0.4884, + "eval_mar_100_car": 0.4023, + "eval_mar_100_container": 0.4466, + "eval_mar_100_motorbike": 0.2845, + "eval_mar_large": 0.6357, + "eval_mar_medium": 0.3819, + "eval_mar_small": 0.1104, + "eval_runtime": 114.3602, + "eval_samples_per_second": 20.138, + "eval_steps_per_second": 2.518, + "step": 34575 + }, + { + "epoch": 15.184381778741866, + "grad_norm": 8320.3056640625, + "learning_rate": 8.502858216440758e-05, + "loss": 1.4148, + "step": 35000 + }, + { + "epoch": 15.401301518438178, + "grad_norm": 8899.4482421875, + "learning_rate": 8.462109215857262e-05, + "loss": 1.4098, + "step": 35500 + }, + { + "epoch": 15.61822125813449, + "grad_norm": 5221.080078125, + "learning_rate": 8.420996435565979e-05, + "loss": 1.4055, + "step": 36000 + }, + { + "epoch": 15.835140997830802, + "grad_norm": 2089.09375, + "learning_rate": 8.379360400220391e-05, + "loss": 1.4085, + "step": 36500 + }, + { + "epoch": 16.0, + "eval_loss": 1.3738867044448853, + "eval_map": 0.2624, + "eval_map_50": 0.5264, + "eval_map_75": 0.2343, + "eval_map_bus": 0.2938, + "eval_map_car": 0.2917, + "eval_map_container": 0.3026, + "eval_map_large": 0.5278, + "eval_map_medium": 0.2188, + "eval_map_motorbike": 0.1615, + "eval_map_small": 0.0266, + "eval_mar_1": 0.1806, + "eval_mar_10": 0.3683, + "eval_mar_100": 0.42, + "eval_mar_100_bus": 0.5113, + "eval_mar_100_car": 0.4123, + "eval_mar_100_container": 0.465, + "eval_mar_100_motorbike": 0.2912, + "eval_mar_large": 0.6689, + "eval_mar_medium": 0.3994, + "eval_mar_small": 0.1048, + "eval_runtime": 113.9743, + "eval_samples_per_second": 20.206, + "eval_steps_per_second": 2.527, + "step": 36880 + }, + { + "epoch": 16.052060737527114, + "grad_norm": 9751.138671875, + "learning_rate": 8.337288426364522e-05, + "loss": 1.4132, + "step": 37000 + }, + { + "epoch": 16.268980477223426, + "grad_norm": 7289.64453125, + "learning_rate": 8.294785941295685e-05, + "loss": 1.4053, + "step": 37500 + }, + { + "epoch": 16.485900216919738, + "grad_norm": 10739.8271484375, + "learning_rate": 8.251858427847263e-05, + "loss": 1.4095, + "step": 38000 + }, + { + "epoch": 16.702819956616054, + "grad_norm": 6208.62158203125, + "learning_rate": 8.20851142368143e-05, + "loss": 1.3964, + "step": 38500 + }, + { + "epoch": 16.919739696312366, + "grad_norm": 10748.8740234375, + "learning_rate": 8.164838451708801e-05, + "loss": 1.3936, + "step": 39000 + }, + { + "epoch": 17.0, + "eval_loss": 1.3773220777511597, + "eval_map": 0.2668, + "eval_map_50": 0.5317, + "eval_map_75": 0.2387, + "eval_map_bus": 0.3055, + "eval_map_car": 0.2917, + "eval_map_container": 0.311, + "eval_map_large": 0.5238, + "eval_map_medium": 0.2246, + "eval_map_motorbike": 0.1591, + "eval_map_small": 0.0255, + "eval_mar_1": 0.1833, + "eval_mar_10": 0.3691, + "eval_mar_100": 0.4148, + "eval_mar_100_bus": 0.5058, + "eval_mar_100_car": 0.4058, + "eval_mar_100_container": 0.4589, + "eval_mar_100_motorbike": 0.2889, + "eval_mar_large": 0.6592, + "eval_mar_medium": 0.393, + "eval_mar_small": 0.1057, + "eval_runtime": 114.4682, + "eval_samples_per_second": 20.119, + "eval_steps_per_second": 2.516, + "step": 39185 + }, + { + "epoch": 17.136659436008678, + "grad_norm": 8642.4755859375, + "learning_rate": 8.120670105669583e-05, + "loss": 1.3972, + "step": 39500 + }, + { + "epoch": 17.35357917570499, + "grad_norm": 22437.994140625, + "learning_rate": 8.076099192246061e-05, + "loss": 1.4012, + "step": 40000 + }, + { + "epoch": 17.570498915401302, + "grad_norm": 6367.958984375, + "learning_rate": 8.031131461099501e-05, + "loss": 1.4144, + "step": 40500 + }, + { + "epoch": 17.787418655097614, + "grad_norm": 27725.388671875, + "learning_rate": 7.985772713080777e-05, + "loss": 1.4062, + "step": 41000 + }, + { + "epoch": 18.0, + "eval_loss": 1.3631058931350708, + "eval_map": 0.2687, + "eval_map_50": 0.5359, + "eval_map_75": 0.2387, + "eval_map_bus": 0.3014, + "eval_map_car": 0.2967, + "eval_map_container": 0.3116, + "eval_map_large": 0.5344, + "eval_map_medium": 0.226, + "eval_map_motorbike": 0.165, + "eval_map_small": 0.0249, + "eval_mar_1": 0.1848, + "eval_mar_10": 0.3696, + "eval_mar_100": 0.4176, + "eval_mar_100_bus": 0.5015, + "eval_mar_100_car": 0.4178, + "eval_mar_100_container": 0.4559, + "eval_mar_100_motorbike": 0.2953, + "eval_mar_large": 0.6661, + "eval_mar_medium": 0.3957, + "eval_mar_small": 0.1045, + "eval_runtime": 115.6328, + "eval_samples_per_second": 19.916, + "eval_steps_per_second": 2.491, + "step": 41490 + }, + { + "epoch": 18.004338394793926, + "grad_norm": 7504.40625, + "learning_rate": 7.940120667790506e-05, + "loss": 1.3951, + "step": 41500 + }, + { + "epoch": 18.22125813449024, + "grad_norm": 10632.771484375, + "learning_rate": 7.893998242197806e-05, + "loss": 1.4015, + "step": 42000 + }, + { + "epoch": 18.43817787418655, + "grad_norm": 3698.81298828125, + "learning_rate": 7.84750248995952e-05, + "loss": 1.3926, + "step": 42500 + }, + { + "epoch": 18.655097613882862, + "grad_norm": 20440.525390625, + "learning_rate": 7.800639409041694e-05, + "loss": 1.4003, + "step": 43000 + }, + { + "epoch": 18.872017353579174, + "grad_norm": 15015.9267578125, + "learning_rate": 7.753415044795898e-05, + "loss": 1.3825, + "step": 43500 + }, + { + "epoch": 19.0, + "eval_loss": 1.3476593494415283, + "eval_map": 0.2706, + "eval_map_50": 0.5411, + "eval_map_75": 0.2421, + "eval_map_bus": 0.3013, + "eval_map_car": 0.3005, + "eval_map_container": 0.3143, + "eval_map_large": 0.5328, + "eval_map_medium": 0.232, + "eval_map_motorbike": 0.1661, + "eval_map_small": 0.0256, + "eval_mar_1": 0.1835, + "eval_mar_10": 0.3693, + "eval_mar_100": 0.421, + "eval_mar_100_bus": 0.4967, + "eval_mar_100_car": 0.4221, + "eval_mar_100_container": 0.4661, + "eval_mar_100_motorbike": 0.2991, + "eval_mar_large": 0.6464, + "eval_mar_medium": 0.3959, + "eval_mar_small": 0.1243, + "eval_runtime": 114.676, + "eval_samples_per_second": 20.083, + "eval_steps_per_second": 2.511, + "step": 43795 + }, + { + "epoch": 19.088937093275486, + "grad_norm": 23474.3359375, + "learning_rate": 7.705835489179352e-05, + "loss": 1.3803, + "step": 44000 + }, + { + "epoch": 19.305856832971802, + "grad_norm": 14476.4375, + "learning_rate": 7.657906879969072e-05, + "loss": 1.3718, + "step": 44500 + }, + { + "epoch": 19.522776572668114, + "grad_norm": 21769.71875, + "learning_rate": 7.609635399970097e-05, + "loss": 1.3739, + "step": 45000 + }, + { + "epoch": 19.739696312364426, + "grad_norm": 16376.3427734375, + "learning_rate": 7.56112482427524e-05, + "loss": 1.3751, + "step": 45500 + }, + { + "epoch": 19.95661605206074, + "grad_norm": 8047.681640625, + "learning_rate": 7.51228518291386e-05, + "loss": 1.3704, + "step": 46000 + }, + { + "epoch": 20.0, + "eval_loss": 1.3514395952224731, + "eval_map": 0.2736, + "eval_map_50": 0.5439, + "eval_map_75": 0.2437, + "eval_map_bus": 0.3137, + "eval_map_car": 0.3013, + "eval_map_container": 0.3152, + "eval_map_large": 0.5431, + "eval_map_medium": 0.2335, + "eval_map_motorbike": 0.1642, + "eval_map_small": 0.0268, + "eval_mar_1": 0.1861, + "eval_mar_10": 0.3721, + "eval_mar_100": 0.4213, + "eval_mar_100_bus": 0.5033, + "eval_mar_100_car": 0.4247, + "eval_mar_100_container": 0.468, + "eval_mar_100_motorbike": 0.2892, + "eval_mar_large": 0.66, + "eval_mar_medium": 0.3999, + "eval_mar_small": 0.1239, + "eval_runtime": 113.7146, + "eval_samples_per_second": 20.252, + "eval_steps_per_second": 2.533, + "step": 46100 + }, + { + "epoch": 20.17353579175705, + "grad_norm": 6952.75634765625, + "learning_rate": 7.463023909270814e-05, + "loss": 1.3831, + "step": 46500 + }, + { + "epoch": 20.390455531453362, + "grad_norm": 4949.50146484375, + "learning_rate": 7.413444904801033e-05, + "loss": 1.3736, + "step": 47000 + }, + { + "epoch": 20.607375271149674, + "grad_norm": 13462.2197265625, + "learning_rate": 7.363554565211042e-05, + "loss": 1.3757, + "step": 47500 + }, + { + "epoch": 20.824295010845987, + "grad_norm": 11438.8916015625, + "learning_rate": 7.313359326369684e-05, + "loss": 1.3847, + "step": 48000 + }, + { + "epoch": 21.0, + "eval_loss": 1.3405940532684326, + "eval_map": 0.2773, + "eval_map_50": 0.548, + "eval_map_75": 0.2525, + "eval_map_bus": 0.3134, + "eval_map_car": 0.3109, + "eval_map_container": 0.3142, + "eval_map_large": 0.5483, + "eval_map_medium": 0.2389, + "eval_map_motorbike": 0.1707, + "eval_map_small": 0.0339, + "eval_mar_1": 0.1878, + "eval_mar_10": 0.3785, + "eval_mar_100": 0.4315, + "eval_mar_100_bus": 0.5139, + "eval_mar_100_car": 0.4344, + "eval_mar_100_container": 0.4725, + "eval_mar_100_motorbike": 0.3051, + "eval_mar_large": 0.6629, + "eval_mar_medium": 0.4104, + "eval_mar_small": 0.1327, + "eval_runtime": 113.9783, + "eval_samples_per_second": 20.206, + "eval_steps_per_second": 2.527, + "step": 48405 + }, + { + "epoch": 21.0412147505423, + "grad_norm": 5165.931640625, + "learning_rate": 7.262865663477902e-05, + "loss": 1.3741, + "step": 48500 + }, + { + "epoch": 21.25813449023861, + "grad_norm": 22676.916015625, + "learning_rate": 7.21208009023343e-05, + "loss": 1.3723, + "step": 49000 + }, + { + "epoch": 21.475054229934923, + "grad_norm": 16659.28515625, + "learning_rate": 7.161009157990521e-05, + "loss": 1.3684, + "step": 49500 + }, + { + "epoch": 21.691973969631235, + "grad_norm": 36924.6015625, + "learning_rate": 7.109659454914833e-05, + "loss": 1.3559, + "step": 50000 + }, + { + "epoch": 21.90889370932755, + "grad_norm": 17127.916015625, + "learning_rate": 7.058141116015095e-05, + "loss": 1.3711, + "step": 50500 + }, + { + "epoch": 22.0, + "eval_loss": 1.329733967781067, + "eval_map": 0.2789, + "eval_map_50": 0.5529, + "eval_map_75": 0.2536, + "eval_map_bus": 0.3151, + "eval_map_car": 0.3087, + "eval_map_container": 0.3189, + "eval_map_large": 0.5527, + "eval_map_medium": 0.2377, + "eval_map_motorbike": 0.1728, + "eval_map_small": 0.0291, + "eval_mar_1": 0.1862, + "eval_mar_10": 0.3778, + "eval_mar_100": 0.4288, + "eval_mar_100_bus": 0.5073, + "eval_mar_100_car": 0.4286, + "eval_mar_100_container": 0.4753, + "eval_mar_100_motorbike": 0.3041, + "eval_mar_large": 0.6636, + "eval_mar_medium": 0.4064, + "eval_mar_small": 0.1326, + "eval_runtime": 114.0898, + "eval_samples_per_second": 20.186, + "eval_steps_per_second": 2.524, + "step": 50710 + }, + { + "epoch": 22.125813449023862, + "grad_norm": 20025.771484375, + "learning_rate": 7.006254303068497e-05, + "loss": 1.3614, + "step": 51000 + }, + { + "epoch": 22.342733188720175, + "grad_norm": 15083.662109375, + "learning_rate": 6.954108682712056e-05, + "loss": 1.3679, + "step": 51500 + }, + { + "epoch": 22.559652928416487, + "grad_norm": 26199.78125, + "learning_rate": 6.901710981746509e-05, + "loss": 1.3535, + "step": 52000 + }, + { + "epoch": 22.7765726681128, + "grad_norm": 7781.2822265625, + "learning_rate": 6.849173485857683e-05, + "loss": 1.3682, + "step": 52500 + }, + { + "epoch": 22.99349240780911, + "grad_norm": 10568.328125, + "learning_rate": 6.796292403540774e-05, + "loss": 1.3693, + "step": 53000 + }, + { + "epoch": 23.0, + "eval_loss": 1.3302034139633179, + "eval_map": 0.2779, + "eval_map_50": 0.5488, + "eval_map_75": 0.2495, + "eval_map_bus": 0.3107, + "eval_map_car": 0.3079, + "eval_map_container": 0.32, + "eval_map_large": 0.5462, + "eval_map_medium": 0.2358, + "eval_map_motorbike": 0.1728, + "eval_map_small": 0.0283, + "eval_mar_1": 0.1869, + "eval_mar_10": 0.378, + "eval_mar_100": 0.4313, + "eval_mar_100_bus": 0.5203, + "eval_mar_100_car": 0.4265, + "eval_mar_100_container": 0.4718, + "eval_mar_100_motorbike": 0.3068, + "eval_mar_large": 0.6569, + "eval_mar_medium": 0.4084, + "eval_mar_small": 0.1338, + "eval_runtime": 114.703, + "eval_samples_per_second": 20.078, + "eval_steps_per_second": 2.511, + "step": 53015 + }, + { + "epoch": 23.210412147505423, + "grad_norm": 32113.388671875, + "learning_rate": 6.743179598962347e-05, + "loss": 1.3628, + "step": 53500 + }, + { + "epoch": 23.427331887201735, + "grad_norm": 15862.0458984375, + "learning_rate": 6.689841923690201e-05, + "loss": 1.3597, + "step": 54000 + }, + { + "epoch": 23.644251626898047, + "grad_norm": 10582.056640625, + "learning_rate": 6.636500906051175e-05, + "loss": 1.3635, + "step": 54500 + }, + { + "epoch": 23.86117136659436, + "grad_norm": 11771.59375, + "learning_rate": 6.58273498976812e-05, + "loss": 1.3678, + "step": 55000 + }, + { + "epoch": 24.0, + "eval_loss": 1.3459113836288452, + "eval_map": 0.2734, + "eval_map_50": 0.539, + "eval_map_75": 0.2477, + "eval_map_bus": 0.3079, + "eval_map_car": 0.2993, + "eval_map_container": 0.3169, + "eval_map_large": 0.5452, + "eval_map_medium": 0.2312, + "eval_map_motorbike": 0.1696, + "eval_map_small": 0.0277, + "eval_mar_1": 0.1841, + "eval_mar_10": 0.3742, + "eval_mar_100": 0.4272, + "eval_mar_100_bus": 0.5071, + "eval_mar_100_car": 0.4191, + "eval_mar_100_container": 0.4813, + "eval_mar_100_motorbike": 0.3011, + "eval_mar_large": 0.6656, + "eval_mar_medium": 0.4043, + "eval_mar_small": 0.1266, + "eval_runtime": 115.6337, + "eval_samples_per_second": 19.916, + "eval_steps_per_second": 2.491, + "step": 55320 + }, + { + "epoch": 24.07809110629067, + "grad_norm": 18562.78515625, + "learning_rate": 6.528764900194297e-05, + "loss": 1.3849, + "step": 55500 + }, + { + "epoch": 24.295010845986983, + "grad_norm": 10382.9853515625, + "learning_rate": 6.474597599487527e-05, + "loss": 1.3632, + "step": 56000 + }, + { + "epoch": 24.5119305856833, + "grad_norm": 11665.0673828125, + "learning_rate": 6.420240075245931e-05, + "loss": 1.3582, + "step": 56500 + }, + { + "epoch": 24.72885032537961, + "grad_norm": 4384.60546875, + "learning_rate": 6.365699339606521e-05, + "loss": 1.3442, + "step": 57000 + }, + { + "epoch": 24.945770065075923, + "grad_norm": 7771.29443359375, + "learning_rate": 6.310982428340635e-05, + "loss": 1.3554, + "step": 57500 + }, + { + "epoch": 25.0, + "eval_loss": 1.3141295909881592, + "eval_map": 0.2895, + "eval_map_50": 0.5625, + "eval_map_75": 0.2674, + "eval_map_bus": 0.3275, + "eval_map_car": 0.3135, + "eval_map_container": 0.337, + "eval_map_large": 0.5526, + "eval_map_medium": 0.2503, + "eval_map_motorbike": 0.1798, + "eval_map_small": 0.0326, + "eval_mar_1": 0.1904, + "eval_mar_10": 0.3872, + "eval_mar_100": 0.4387, + "eval_mar_100_bus": 0.5216, + "eval_mar_100_car": 0.4361, + "eval_mar_100_container": 0.4857, + "eval_mar_100_motorbike": 0.3112, + "eval_mar_large": 0.6709, + "eval_mar_medium": 0.4191, + "eval_mar_small": 0.1254, + "eval_runtime": 114.1019, + "eval_samples_per_second": 20.184, + "eval_steps_per_second": 2.524, + "step": 57625 + }, + { + "epoch": 25.162689804772235, + "grad_norm": 11156.1474609375, + "learning_rate": 6.25609639994632e-05, + "loss": 1.3439, + "step": 58000 + }, + { + "epoch": 25.379609544468547, + "grad_norm": 19446.05078125, + "learning_rate": 6.201158587864379e-05, + "loss": 1.3484, + "step": 58500 + }, + { + "epoch": 25.59652928416486, + "grad_norm": 37928.94921875, + "learning_rate": 6.145955889829366e-05, + "loss": 1.3497, + "step": 59000 + }, + { + "epoch": 25.81344902386117, + "grad_norm": 12394.7900390625, + "learning_rate": 6.090605363139137e-05, + "loss": 1.3444, + "step": 59500 + }, + { + "epoch": 26.0, + "eval_loss": 1.3255101442337036, + "eval_map": 0.2852, + "eval_map_50": 0.5566, + "eval_map_75": 0.2625, + "eval_map_bus": 0.3259, + "eval_map_car": 0.3115, + "eval_map_container": 0.3282, + "eval_map_large": 0.5484, + "eval_map_medium": 0.2437, + "eval_map_motorbike": 0.1754, + "eval_map_small": 0.0312, + "eval_mar_1": 0.1892, + "eval_mar_10": 0.3827, + "eval_mar_100": 0.4341, + "eval_mar_100_bus": 0.5192, + "eval_mar_100_car": 0.4338, + "eval_mar_100_container": 0.477, + "eval_mar_100_motorbike": 0.3065, + "eval_mar_large": 0.672, + "eval_mar_medium": 0.4146, + "eval_mar_small": 0.1121, + "eval_runtime": 114.2701, + "eval_samples_per_second": 20.154, + "eval_steps_per_second": 2.52, + "step": 59930 + }, + { + "epoch": 26.030368763557483, + "grad_norm": 21555.208984375, + "learning_rate": 6.035114148028319e-05, + "loss": 1.3548, + "step": 60000 + }, + { + "epoch": 26.247288503253795, + "grad_norm": 28509.6328125, + "learning_rate": 5.979600780867037e-05, + "loss": 1.3455, + "step": 60500 + }, + { + "epoch": 26.464208242950107, + "grad_norm": 21676.015625, + "learning_rate": 5.923849926827495e-05, + "loss": 1.3445, + "step": 61000 + }, + { + "epoch": 26.68112798264642, + "grad_norm": 25364.083984375, + "learning_rate": 5.867979895868912e-05, + "loss": 1.3463, + "step": 61500 + }, + { + "epoch": 26.89804772234273, + "grad_norm": 9840.4853515625, + "learning_rate": 5.811997895242124e-05, + "loss": 1.3421, + "step": 62000 + }, + { + "epoch": 27.0, + "eval_loss": 1.3189969062805176, + "eval_map": 0.2839, + "eval_map_50": 0.5592, + "eval_map_75": 0.2576, + "eval_map_bus": 0.3208, + "eval_map_car": 0.3134, + "eval_map_container": 0.3251, + "eval_map_large": 0.5548, + "eval_map_medium": 0.2448, + "eval_map_motorbike": 0.1765, + "eval_map_small": 0.0266, + "eval_mar_1": 0.1903, + "eval_mar_10": 0.3816, + "eval_mar_100": 0.4325, + "eval_mar_100_bus": 0.5073, + "eval_mar_100_car": 0.4453, + "eval_mar_100_container": 0.4693, + "eval_mar_100_motorbike": 0.3082, + "eval_mar_large": 0.6654, + "eval_mar_medium": 0.4114, + "eval_mar_small": 0.1285, + "eval_runtime": 114.9445, + "eval_samples_per_second": 20.036, + "eval_steps_per_second": 2.506, + "step": 62235 + }, + { + "epoch": 27.114967462039047, + "grad_norm": 16236.349609375, + "learning_rate": 5.7560234198709096e-05, + "loss": 1.3567, + "step": 62500 + }, + { + "epoch": 27.33188720173536, + "grad_norm": 16390.1328125, + "learning_rate": 5.6998393463013776e-05, + "loss": 1.3631, + "step": 63000 + }, + { + "epoch": 27.54880694143167, + "grad_norm": 7639.146484375, + "learning_rate": 5.643564993245218e-05, + "loss": 1.353, + "step": 63500 + }, + { + "epoch": 27.765726681127983, + "grad_norm": 7254.7099609375, + "learning_rate": 5.587207620110937e-05, + "loss": 1.3587, + "step": 64000 + }, + { + "epoch": 27.982646420824295, + "grad_norm": 26371.984375, + "learning_rate": 5.5307744970166573e-05, + "loss": 1.3477, + "step": 64500 + }, + { + "epoch": 28.0, + "eval_loss": 1.321735143661499, + "eval_map": 0.2852, + "eval_map_50": 0.5581, + "eval_map_75": 0.2622, + "eval_map_bus": 0.3238, + "eval_map_car": 0.3113, + "eval_map_container": 0.3256, + "eval_map_large": 0.5491, + "eval_map_medium": 0.2445, + "eval_map_motorbike": 0.1801, + "eval_map_small": 0.0268, + "eval_mar_1": 0.188, + "eval_mar_10": 0.3805, + "eval_mar_100": 0.4326, + "eval_mar_100_bus": 0.5124, + "eval_mar_100_car": 0.4292, + "eval_mar_100_container": 0.478, + "eval_mar_100_motorbike": 0.3109, + "eval_mar_large": 0.66, + "eval_mar_medium": 0.4122, + "eval_mar_small": 0.1297, + "eval_runtime": 115.1063, + "eval_samples_per_second": 20.008, + "eval_steps_per_second": 2.502, + "step": 64540 + }, + { + "epoch": 28.199566160520607, + "grad_norm": 13310.9052734375, + "learning_rate": 5.474272903852271e-05, + "loss": 1.3441, + "step": 65000 + }, + { + "epoch": 28.41648590021692, + "grad_norm": 2977.188720703125, + "learning_rate": 5.417823311099729e-05, + "loss": 1.3369, + "step": 65500 + }, + { + "epoch": 28.63340563991323, + "grad_norm": 5458.31396484375, + "learning_rate": 5.361206752337853e-05, + "loss": 1.3426, + "step": 66000 + }, + { + "epoch": 28.850325379609544, + "grad_norm": 3358.320556640625, + "learning_rate": 5.304543597796046e-05, + "loss": 1.3577, + "step": 66500 + }, + { + "epoch": 29.0, + "eval_loss": 1.3080586194992065, + "eval_map": 0.2881, + "eval_map_50": 0.5656, + "eval_map_75": 0.2638, + "eval_map_bus": 0.3304, + "eval_map_car": 0.3142, + "eval_map_container": 0.3312, + "eval_map_large": 0.5512, + "eval_map_medium": 0.2467, + "eval_map_motorbike": 0.1766, + "eval_map_small": 0.0267, + "eval_mar_1": 0.1899, + "eval_mar_10": 0.3833, + "eval_mar_100": 0.4341, + "eval_mar_100_bus": 0.5179, + "eval_mar_100_car": 0.43, + "eval_mar_100_container": 0.4776, + "eval_mar_100_motorbike": 0.3109, + "eval_mar_large": 0.6641, + "eval_mar_medium": 0.4136, + "eval_mar_small": 0.1252, + "eval_runtime": 114.8879, + "eval_samples_per_second": 20.046, + "eval_steps_per_second": 2.507, + "step": 66845 + }, + { + "epoch": 29.067245119305856, + "grad_norm": 12659.2099609375, + "learning_rate": 5.2478411570383244e-05, + "loss": 1.3436, + "step": 67000 + }, + { + "epoch": 29.284164859002168, + "grad_norm": 2700.028076171875, + "learning_rate": 5.191220240565011e-05, + "loss": 1.3463, + "step": 67500 + }, + { + "epoch": 29.501084598698483, + "grad_norm": 12202.7109375, + "learning_rate": 5.134461217394917e-05, + "loss": 1.3386, + "step": 68000 + }, + { + "epoch": 29.718004338394795, + "grad_norm": 11113.21875, + "learning_rate": 5.0776848486872474e-05, + "loss": 1.3335, + "step": 68500 + }, + { + "epoch": 29.934924078091107, + "grad_norm": 7475.49072265625, + "learning_rate": 5.020898458610682e-05, + "loss": 1.3362, + "step": 69000 + }, + { + "epoch": 30.0, + "eval_loss": 1.310318112373352, + "eval_map": 0.288, + "eval_map_50": 0.5656, + "eval_map_75": 0.2622, + "eval_map_bus": 0.3324, + "eval_map_car": 0.3093, + "eval_map_container": 0.3328, + "eval_map_large": 0.5594, + "eval_map_medium": 0.2476, + "eval_map_motorbike": 0.1775, + "eval_map_small": 0.0272, + "eval_mar_1": 0.1908, + "eval_mar_10": 0.383, + "eval_mar_100": 0.4353, + "eval_mar_100_bus": 0.5117, + "eval_mar_100_car": 0.4331, + "eval_mar_100_container": 0.4814, + "eval_mar_100_motorbike": 0.3149, + "eval_mar_large": 0.6702, + "eval_mar_medium": 0.411, + "eval_mar_small": 0.1275, + "eval_runtime": 115.2354, + "eval_samples_per_second": 19.985, + "eval_steps_per_second": 2.499, + "step": 69150 + }, + { + "epoch": 30.15184381778742, + "grad_norm": 12929.96875, + "learning_rate": 4.9642229486198724e-05, + "loss": 1.3372, + "step": 69500 + }, + { + "epoch": 30.36876355748373, + "grad_norm": 10545.1923828125, + "learning_rate": 4.9074384759668744e-05, + "loss": 1.3335, + "step": 70000 + }, + { + "epoch": 30.585683297180044, + "grad_norm": 6960.68310546875, + "learning_rate": 4.850665943778378e-05, + "loss": 1.3405, + "step": 70500 + }, + { + "epoch": 30.802603036876356, + "grad_norm": 16920.470703125, + "learning_rate": 4.793912675728147e-05, + "loss": 1.3399, + "step": 71000 + }, + { + "epoch": 31.0, + "eval_loss": 1.3056919574737549, + "eval_map": 0.2891, + "eval_map_50": 0.5684, + "eval_map_75": 0.2644, + "eval_map_bus": 0.3291, + "eval_map_car": 0.3136, + "eval_map_container": 0.3346, + "eval_map_large": 0.566, + "eval_map_medium": 0.2482, + "eval_map_motorbike": 0.1788, + "eval_map_small": 0.0308, + "eval_mar_1": 0.1914, + "eval_mar_10": 0.3856, + "eval_mar_100": 0.4356, + "eval_mar_100_bus": 0.5217, + "eval_mar_100_car": 0.435, + "eval_mar_100_container": 0.4715, + "eval_mar_100_motorbike": 0.3142, + "eval_mar_large": 0.678, + "eval_mar_medium": 0.4131, + "eval_mar_small": 0.1303, + "eval_runtime": 114.0811, + "eval_samples_per_second": 20.187, + "eval_steps_per_second": 2.525, + "step": 71455 + }, + { + "epoch": 31.019522776572668, + "grad_norm": 7885.31982421875, + "learning_rate": 4.73718599300487e-05, + "loss": 1.3293, + "step": 71500 + }, + { + "epoch": 31.23644251626898, + "grad_norm": 6155.576171875, + "learning_rate": 4.680493213367716e-05, + "loss": 1.3307, + "step": 72000 + }, + { + "epoch": 31.453362255965292, + "grad_norm": 12137.0146484375, + "learning_rate": 4.623841650202349e-05, + "loss": 1.3276, + "step": 72500 + }, + { + "epoch": 31.670281995661604, + "grad_norm": 15681.1962890625, + "learning_rate": 4.5672386115774904e-05, + "loss": 1.3183, + "step": 73000 + }, + { + "epoch": 31.887201735357916, + "grad_norm": 20826.763671875, + "learning_rate": 4.5106913993021883e-05, + "loss": 1.326, + "step": 73500 + }, + { + "epoch": 32.0, + "eval_loss": 1.2957255840301514, + "eval_map": 0.2917, + "eval_map_50": 0.5725, + "eval_map_75": 0.2679, + "eval_map_bus": 0.3311, + "eval_map_car": 0.3187, + "eval_map_container": 0.3363, + "eval_map_large": 0.559, + "eval_map_medium": 0.2514, + "eval_map_motorbike": 0.1808, + "eval_map_small": 0.0368, + "eval_mar_1": 0.1915, + "eval_mar_10": 0.3864, + "eval_mar_100": 0.4393, + "eval_mar_100_bus": 0.5161, + "eval_mar_100_car": 0.4399, + "eval_mar_100_container": 0.4856, + "eval_mar_100_motorbike": 0.3154, + "eval_mar_large": 0.6778, + "eval_mar_medium": 0.4159, + "eval_mar_small": 0.1351, + "eval_runtime": 112.6576, + "eval_samples_per_second": 20.442, + "eval_steps_per_second": 2.556, + "step": 73760 + }, + { + "epoch": 32.10412147505423, + "grad_norm": 17197.775390625, + "learning_rate": 4.454320208327262e-05, + "loss": 1.3303, + "step": 74000 + }, + { + "epoch": 32.321041214750544, + "grad_norm": 21979.078125, + "learning_rate": 4.397906376349877e-05, + "loss": 1.3182, + "step": 74500 + }, + { + "epoch": 32.53796095444685, + "grad_norm": 11120.1962890625, + "learning_rate": 4.341570214631434e-05, + "loss": 1.3164, + "step": 75000 + }, + { + "epoch": 32.75488069414317, + "grad_norm": 6189.1796875, + "learning_rate": 4.285318990553778e-05, + "loss": 1.3143, + "step": 75500 + }, + { + "epoch": 32.971800433839476, + "grad_norm": 18750.640625, + "learning_rate": 4.229272181774833e-05, + "loss": 1.3187, + "step": 76000 + }, + { + "epoch": 33.0, + "eval_loss": 1.2895259857177734, + "eval_map": 0.2974, + "eval_map_50": 0.5776, + "eval_map_75": 0.2758, + "eval_map_bus": 0.3381, + "eval_map_car": 0.3235, + "eval_map_container": 0.3408, + "eval_map_large": 0.5698, + "eval_map_medium": 0.2581, + "eval_map_motorbike": 0.1871, + "eval_map_small": 0.0287, + "eval_mar_1": 0.1936, + "eval_mar_10": 0.3929, + "eval_mar_100": 0.4434, + "eval_mar_100_bus": 0.5274, + "eval_mar_100_car": 0.4415, + "eval_mar_100_container": 0.4849, + "eval_mar_100_motorbike": 0.3198, + "eval_mar_large": 0.6729, + "eval_mar_medium": 0.4216, + "eval_mar_small": 0.1412, + "eval_runtime": 113.1455, + "eval_samples_per_second": 20.354, + "eval_steps_per_second": 2.545, + "step": 76065 + }, + { + "epoch": 33.18872017353579, + "grad_norm": 28217.193359375, + "learning_rate": 4.173212384261402e-05, + "loss": 1.3211, + "step": 76500 + }, + { + "epoch": 33.40563991323211, + "grad_norm": 15140.1513671875, + "learning_rate": 4.1172592425996225e-05, + "loss": 1.3108, + "step": 77000 + }, + { + "epoch": 33.622559652928416, + "grad_norm": 16245.7314453125, + "learning_rate": 4.061531534860906e-05, + "loss": 1.3074, + "step": 77500 + }, + { + "epoch": 33.83947939262473, + "grad_norm": 11151.5146484375, + "learning_rate": 4.005813094796232e-05, + "loss": 1.3335, + "step": 78000 + }, + { + "epoch": 34.0, + "eval_loss": 1.2928670644760132, + "eval_map": 0.2955, + "eval_map_50": 0.5764, + "eval_map_75": 0.2743, + "eval_map_bus": 0.339, + "eval_map_car": 0.3213, + "eval_map_container": 0.3375, + "eval_map_large": 0.5708, + "eval_map_medium": 0.2556, + "eval_map_motorbike": 0.1843, + "eval_map_small": 0.0306, + "eval_mar_1": 0.1928, + "eval_mar_10": 0.3899, + "eval_mar_100": 0.442, + "eval_mar_100_bus": 0.5158, + "eval_mar_100_car": 0.4456, + "eval_mar_100_container": 0.4873, + "eval_mar_100_motorbike": 0.3194, + "eval_mar_large": 0.6816, + "eval_mar_medium": 0.4203, + "eval_mar_small": 0.1343, + "eval_runtime": 113.6061, + "eval_samples_per_second": 20.272, + "eval_steps_per_second": 2.535, + "step": 78370 + }, + { + "epoch": 34.05639913232104, + "grad_norm": 6196.53125, + "learning_rate": 3.950222905142011e-05, + "loss": 1.3203, + "step": 78500 + }, + { + "epoch": 34.273318872017356, + "grad_norm": 8838.4443359375, + "learning_rate": 3.894768137049464e-05, + "loss": 1.3181, + "step": 79000 + }, + { + "epoch": 34.490238611713664, + "grad_norm": 18184.919921875, + "learning_rate": 3.839455944200391e-05, + "loss": 1.3205, + "step": 79500 + }, + { + "epoch": 34.70715835140998, + "grad_norm": 18842.814453125, + "learning_rate": 3.7842934618843426e-05, + "loss": 1.3153, + "step": 80000 + }, + { + "epoch": 34.92407809110629, + "grad_norm": 13190.8916015625, + "learning_rate": 3.7292878060781644e-05, + "loss": 1.3051, + "step": 80500 + }, + { + "epoch": 35.0, + "eval_loss": 1.2900042533874512, + "eval_map": 0.296, + "eval_map_50": 0.5787, + "eval_map_75": 0.2742, + "eval_map_bus": 0.3348, + "eval_map_car": 0.3218, + "eval_map_container": 0.3402, + "eval_map_large": 0.5639, + "eval_map_medium": 0.2572, + "eval_map_motorbike": 0.1874, + "eval_map_small": 0.0323, + "eval_mar_1": 0.1922, + "eval_mar_10": 0.3894, + "eval_mar_100": 0.4397, + "eval_mar_100_bus": 0.5183, + "eval_mar_100_car": 0.4396, + "eval_mar_100_container": 0.4799, + "eval_mar_100_motorbike": 0.3212, + "eval_mar_large": 0.6737, + "eval_mar_medium": 0.4174, + "eval_mar_small": 0.1411, + "eval_runtime": 112.7, + "eval_samples_per_second": 20.435, + "eval_steps_per_second": 2.555, + "step": 80675 + }, + { + "epoch": 35.140997830802604, + "grad_norm": 8913.3818359375, + "learning_rate": 3.674446072528038e-05, + "loss": 1.3126, + "step": 81000 + }, + { + "epoch": 35.35791757049891, + "grad_norm": 15553.4130859375, + "learning_rate": 3.619884501961284e-05, + "loss": 1.3133, + "step": 81500 + }, + { + "epoch": 35.57483731019523, + "grad_norm": 7857.3984375, + "learning_rate": 3.565391451542974e-05, + "loss": 1.3122, + "step": 82000 + }, + { + "epoch": 35.79175704989154, + "grad_norm": 12758.6630859375, + "learning_rate": 3.511191892675452e-05, + "loss": 1.3155, + "step": 82500 + }, + { + "epoch": 36.0, + "eval_loss": 1.2911115884780884, + "eval_map": 0.2962, + "eval_map_50": 0.5795, + "eval_map_75": 0.2712, + "eval_map_bus": 0.3395, + "eval_map_car": 0.3186, + "eval_map_container": 0.3402, + "eval_map_large": 0.5675, + "eval_map_medium": 0.2557, + "eval_map_motorbike": 0.1866, + "eval_map_small": 0.03, + "eval_mar_1": 0.1942, + "eval_mar_10": 0.391, + "eval_mar_100": 0.4423, + "eval_mar_100_bus": 0.5222, + "eval_mar_100_car": 0.4403, + "eval_mar_100_container": 0.4859, + "eval_mar_100_motorbike": 0.3209, + "eval_mar_large": 0.6705, + "eval_mar_medium": 0.4196, + "eval_mar_small": 0.1422, + "eval_runtime": 112.4497, + "eval_samples_per_second": 20.48, + "eval_steps_per_second": 2.561, + "step": 82980 + }, + { + "epoch": 36.00867678958785, + "grad_norm": 2367.160400390625, + "learning_rate": 3.457075586757238e-05, + "loss": 1.3097, + "step": 83000 + }, + { + "epoch": 36.22559652928417, + "grad_norm": 3832.09326171875, + "learning_rate": 3.40326594982283e-05, + "loss": 1.3186, + "step": 83500 + }, + { + "epoch": 36.44251626898048, + "grad_norm": 3979.951416015625, + "learning_rate": 3.3495542557672235e-05, + "loss": 1.3404, + "step": 84000 + }, + { + "epoch": 36.65943600867679, + "grad_norm": 4793.94384765625, + "learning_rate": 3.2960554697101216e-05, + "loss": 1.3213, + "step": 84500 + }, + { + "epoch": 36.8763557483731, + "grad_norm": 9881.50390625, + "learning_rate": 3.2427764930110524e-05, + "loss": 1.321, + "step": 85000 + }, + { + "epoch": 37.0, + "eval_loss": 1.2855924367904663, + "eval_map": 0.2944, + "eval_map_50": 0.5775, + "eval_map_75": 0.2692, + "eval_map_bus": 0.3374, + "eval_map_car": 0.3199, + "eval_map_container": 0.3341, + "eval_map_large": 0.5649, + "eval_map_medium": 0.2541, + "eval_map_motorbike": 0.1863, + "eval_map_small": 0.0338, + "eval_mar_1": 0.1918, + "eval_mar_10": 0.3885, + "eval_mar_100": 0.4412, + "eval_mar_100_bus": 0.5225, + "eval_mar_100_car": 0.4421, + "eval_mar_100_container": 0.4788, + "eval_mar_100_motorbike": 0.3215, + "eval_mar_large": 0.6679, + "eval_mar_medium": 0.4186, + "eval_mar_small": 0.1388, + "eval_runtime": 112.777, + "eval_samples_per_second": 20.421, + "eval_steps_per_second": 2.554, + "step": 85285 + }, + { + "epoch": 37.093275488069416, + "grad_norm": 15542.7197265625, + "learning_rate": 3.189724198674071e-05, + "loss": 1.3171, + "step": 85500 + }, + { + "epoch": 37.310195227765725, + "grad_norm": 3698.43017578125, + "learning_rate": 3.136905430461136e-05, + "loss": 1.3104, + "step": 86000 + }, + { + "epoch": 37.52711496746204, + "grad_norm": 5524.0537109375, + "learning_rate": 3.084327002009272e-05, + "loss": 1.3068, + "step": 86500 + }, + { + "epoch": 37.74403470715835, + "grad_norm": 5400.333984375, + "learning_rate": 3.031995695951594e-05, + "loss": 1.3093, + "step": 87000 + }, + { + "epoch": 37.960954446854664, + "grad_norm": 11807.9365234375, + "learning_rate": 2.9799182630423616e-05, + "loss": 1.3085, + "step": 87500 + }, + { + "epoch": 38.0, + "eval_loss": 1.279981017112732, + "eval_map": 0.2988, + "eval_map_50": 0.5815, + "eval_map_75": 0.2739, + "eval_map_bus": 0.3469, + "eval_map_car": 0.3222, + "eval_map_container": 0.3386, + "eval_map_large": 0.5778, + "eval_map_medium": 0.259, + "eval_map_motorbike": 0.1873, + "eval_map_small": 0.0266, + "eval_mar_1": 0.1945, + "eval_mar_10": 0.3932, + "eval_mar_100": 0.446, + "eval_mar_100_bus": 0.536, + "eval_mar_100_car": 0.4403, + "eval_mar_100_container": 0.4869, + "eval_mar_100_motorbike": 0.3207, + "eval_mar_large": 0.6784, + "eval_mar_medium": 0.4254, + "eval_mar_small": 0.1346, + "eval_runtime": 113.2741, + "eval_samples_per_second": 20.331, + "eval_steps_per_second": 2.543, + "step": 87590 + }, + { + "epoch": 38.17787418655097, + "grad_norm": 31377.580078125, + "learning_rate": 2.9281014212861156e-05, + "loss": 1.3009, + "step": 88000 + }, + { + "epoch": 38.39479392624729, + "grad_norm": 10812.712890625, + "learning_rate": 2.876654683036693e-05, + "loss": 1.3006, + "step": 88500 + }, + { + "epoch": 38.611713665943604, + "grad_norm": 6770.5703125, + "learning_rate": 2.8253784878082468e-05, + "loss": 1.3049, + "step": 89000 + }, + { + "epoch": 38.82863340563991, + "grad_norm": 3374.140625, + "learning_rate": 2.7743828194103766e-05, + "loss": 1.3096, + "step": 89500 + }, + { + "epoch": 39.0, + "eval_loss": 1.283420205116272, + "eval_map": 0.2971, + "eval_map_50": 0.582, + "eval_map_75": 0.2753, + "eval_map_bus": 0.3432, + "eval_map_car": 0.3233, + "eval_map_container": 0.3352, + "eval_map_large": 0.5674, + "eval_map_medium": 0.2568, + "eval_map_motorbike": 0.1866, + "eval_map_small": 0.0327, + "eval_mar_1": 0.1923, + "eval_mar_10": 0.3902, + "eval_mar_100": 0.4413, + "eval_mar_100_bus": 0.5224, + "eval_mar_100_car": 0.4396, + "eval_mar_100_container": 0.4819, + "eval_mar_100_motorbike": 0.3212, + "eval_mar_large": 0.6682, + "eval_mar_medium": 0.4171, + "eval_mar_small": 0.146, + "eval_runtime": 113.4871, + "eval_samples_per_second": 20.293, + "eval_steps_per_second": 2.538, + "step": 89895 + }, + { + "epoch": 39.04555314533623, + "grad_norm": 8068.66796875, + "learning_rate": 2.7237753825406963e-05, + "loss": 1.3144, + "step": 90000 + }, + { + "epoch": 39.26247288503254, + "grad_norm": 3847.1201171875, + "learning_rate": 2.67335987234038e-05, + "loss": 1.309, + "step": 90500 + }, + { + "epoch": 39.47939262472885, + "grad_norm": 3865.5576171875, + "learning_rate": 2.623244499417857e-05, + "loss": 1.3038, + "step": 91000 + }, + { + "epoch": 39.69631236442516, + "grad_norm": 2421.161376953125, + "learning_rate": 2.573435728671345e-05, + "loss": 1.3103, + "step": 91500 + }, + { + "epoch": 39.91323210412148, + "grad_norm": 6669.9892578125, + "learning_rate": 2.5239399854472795e-05, + "loss": 1.3095, + "step": 92000 + }, + { + "epoch": 40.0, + "eval_loss": 1.2760100364685059, + "eval_map": 0.3011, + "eval_map_50": 0.583, + "eval_map_75": 0.2793, + "eval_map_bus": 0.3446, + "eval_map_car": 0.3254, + "eval_map_container": 0.3432, + "eval_map_large": 0.5704, + "eval_map_medium": 0.2606, + "eval_map_motorbike": 0.1911, + "eval_map_small": 0.0298, + "eval_mar_1": 0.1948, + "eval_mar_10": 0.3921, + "eval_mar_100": 0.4461, + "eval_mar_100_bus": 0.5202, + "eval_mar_100_car": 0.4489, + "eval_mar_100_container": 0.4897, + "eval_mar_100_motorbike": 0.3254, + "eval_mar_large": 0.6631, + "eval_mar_medium": 0.424, + "eval_mar_small": 0.1358, + "eval_runtime": 114.2826, + "eval_samples_per_second": 20.152, + "eval_steps_per_second": 2.52, + "step": 92200 + }, + { + "epoch": 40.130151843817785, + "grad_norm": 10441.7392578125, + "learning_rate": 2.4747636547114554e-05, + "loss": 1.3029, + "step": 92500 + }, + { + "epoch": 40.3470715835141, + "grad_norm": 8002.83056640625, + "learning_rate": 2.425913080225366e-05, + "loss": 1.2935, + "step": 93000 + }, + { + "epoch": 40.56399132321041, + "grad_norm": 10335.00390625, + "learning_rate": 2.3773945637278417e-05, + "loss": 1.3025, + "step": 93500 + }, + { + "epoch": 40.780911062906725, + "grad_norm": 32124.755859375, + "learning_rate": 2.3292143641221354e-05, + "loss": 1.2973, + "step": 94000 + }, + { + "epoch": 40.99783080260303, + "grad_norm": 14672.322265625, + "learning_rate": 2.2813786966685218e-05, + "loss": 1.2922, + "step": 94500 + }, + { + "epoch": 41.0, + "eval_loss": 1.2656161785125732, + "eval_map": 0.3032, + "eval_map_50": 0.5874, + "eval_map_75": 0.2819, + "eval_map_bus": 0.3458, + "eval_map_car": 0.3279, + "eval_map_container": 0.346, + "eval_map_large": 0.5716, + "eval_map_medium": 0.264, + "eval_map_motorbike": 0.1932, + "eval_map_small": 0.0303, + "eval_mar_1": 0.197, + "eval_mar_10": 0.3954, + "eval_mar_100": 0.4498, + "eval_mar_100_bus": 0.5276, + "eval_mar_100_car": 0.4491, + "eval_mar_100_container": 0.4964, + "eval_mar_100_motorbike": 0.3259, + "eval_mar_large": 0.6702, + "eval_mar_medium": 0.4287, + "eval_mar_small": 0.1414, + "eval_runtime": 113.4627, + "eval_samples_per_second": 20.297, + "eval_steps_per_second": 2.538, + "step": 94505 + }, + { + "epoch": 41.21475054229935, + "grad_norm": 8619.771484375, + "learning_rate": 2.2339883480308453e-05, + "loss": 1.2826, + "step": 95000 + }, + { + "epoch": 41.431670281995665, + "grad_norm": 12052.697265625, + "learning_rate": 2.1868594923472446e-05, + "loss": 1.3059, + "step": 95500 + }, + { + "epoch": 41.64859002169197, + "grad_norm": 5313.166015625, + "learning_rate": 2.140093532637103e-05, + "loss": 1.2943, + "step": 96000 + }, + { + "epoch": 41.86550976138829, + "grad_norm": 6886.1923828125, + "learning_rate": 2.0936965017233235e-05, + "loss": 1.2981, + "step": 96500 + }, + { + "epoch": 42.0, + "eval_loss": 1.27132248878479, + "eval_map": 0.2998, + "eval_map_50": 0.5854, + "eval_map_75": 0.2756, + "eval_map_bus": 0.3414, + "eval_map_car": 0.3246, + "eval_map_container": 0.342, + "eval_map_large": 0.5711, + "eval_map_medium": 0.2612, + "eval_map_motorbike": 0.1911, + "eval_map_small": 0.0303, + "eval_mar_1": 0.1941, + "eval_mar_10": 0.3916, + "eval_mar_100": 0.4466, + "eval_mar_100_bus": 0.5222, + "eval_mar_100_car": 0.4467, + "eval_mar_100_container": 0.4902, + "eval_mar_100_motorbike": 0.3274, + "eval_mar_large": 0.6682, + "eval_mar_medium": 0.4239, + "eval_mar_small": 0.164, + "eval_runtime": 112.7103, + "eval_samples_per_second": 20.433, + "eval_steps_per_second": 2.555, + "step": 96810 + }, + { + "epoch": 42.0824295010846, + "grad_norm": 15306.6865234375, + "learning_rate": 2.0476743848368773e-05, + "loss": 1.2916, + "step": 97000 + }, + { + "epoch": 42.29934924078091, + "grad_norm": 12990.0068359375, + "learning_rate": 2.0020331188447145e-05, + "loss": 1.282, + "step": 97500 + }, + { + "epoch": 42.51626898047722, + "grad_norm": 16005.4462890625, + "learning_rate": 1.956778591483908e-05, + "loss": 1.2856, + "step": 98000 + }, + { + "epoch": 42.73318872017354, + "grad_norm": 25783.400390625, + "learning_rate": 1.9119166406021284e-05, + "loss": 1.2899, + "step": 98500 + }, + { + "epoch": 42.950108459869845, + "grad_norm": 11117.935546875, + "learning_rate": 1.8675415791909563e-05, + "loss": 1.2935, + "step": 99000 + }, + { + "epoch": 43.0, + "eval_loss": 1.2610080242156982, + "eval_map": 0.3037, + "eval_map_50": 0.5903, + "eval_map_75": 0.2813, + "eval_map_bus": 0.3471, + "eval_map_car": 0.3275, + "eval_map_container": 0.3447, + "eval_map_large": 0.5758, + "eval_map_medium": 0.2644, + "eval_map_motorbike": 0.1955, + "eval_map_small": 0.0348, + "eval_mar_1": 0.1945, + "eval_mar_10": 0.3989, + "eval_mar_100": 0.4522, + "eval_mar_100_bus": 0.5334, + "eval_mar_100_car": 0.4481, + "eval_mar_100_container": 0.4967, + "eval_mar_100_motorbike": 0.3307, + "eval_mar_large": 0.6741, + "eval_mar_medium": 0.431, + "eval_mar_small": 0.1547, + "eval_runtime": 112.9931, + "eval_samples_per_second": 20.382, + "eval_steps_per_second": 2.549, + "step": 99115 + }, + { + "epoch": 43.16702819956616, + "grad_norm": 5978.50146484375, + "learning_rate": 1.8235689911416127e-05, + "loss": 1.2929, + "step": 99500 + }, + { + "epoch": 43.38394793926247, + "grad_norm": 10374.5068359375, + "learning_rate": 1.7799176362471302e-05, + "loss": 1.2917, + "step": 100000 + }, + { + "epoch": 43.600867678958785, + "grad_norm": 13522.9091796875, + "learning_rate": 1.7366816729482123e-05, + "loss": 1.296, + "step": 100500 + }, + { + "epoch": 43.8177874186551, + "grad_norm": 16869.978515625, + "learning_rate": 1.693866678697154e-05, + "loss": 1.2847, + "step": 101000 + }, + { + "epoch": 44.0, + "eval_loss": 1.2659156322479248, + "eval_map": 0.3033, + "eval_map_50": 0.5896, + "eval_map_75": 0.2786, + "eval_map_bus": 0.3481, + "eval_map_car": 0.3254, + "eval_map_container": 0.3454, + "eval_map_large": 0.5694, + "eval_map_medium": 0.2663, + "eval_map_motorbike": 0.1945, + "eval_map_small": 0.0268, + "eval_mar_1": 0.1948, + "eval_mar_10": 0.3953, + "eval_mar_100": 0.4484, + "eval_mar_100_bus": 0.5268, + "eval_mar_100_car": 0.4491, + "eval_mar_100_container": 0.4898, + "eval_mar_100_motorbike": 0.3281, + "eval_mar_large": 0.6741, + "eval_mar_medium": 0.4272, + "eval_mar_small": 0.1437, + "eval_runtime": 113.4331, + "eval_samples_per_second": 20.303, + "eval_steps_per_second": 2.539, + "step": 101420 + }, + { + "epoch": 44.03470715835141, + "grad_norm": 8985.3876953125, + "learning_rate": 1.651562524362303e-05, + "loss": 1.2927, + "step": 101500 + }, + { + "epoch": 44.251626898047725, + "grad_norm": 7145.2099609375, + "learning_rate": 1.6096051132899187e-05, + "loss": 1.2957, + "step": 102000 + }, + { + "epoch": 44.46854663774403, + "grad_norm": 4585.701171875, + "learning_rate": 1.568085064179898e-05, + "loss": 1.2855, + "step": 102500 + }, + { + "epoch": 44.68546637744035, + "grad_norm": 3795.897216796875, + "learning_rate": 1.5270077331310885e-05, + "loss": 1.2888, + "step": 103000 + }, + { + "epoch": 44.90238611713666, + "grad_norm": 18655.283203125, + "learning_rate": 1.4863784191315833e-05, + "loss": 1.2921, + "step": 103500 + }, + { + "epoch": 45.0, + "eval_loss": 1.2572112083435059, + "eval_map": 0.3062, + "eval_map_50": 0.5916, + "eval_map_75": 0.2824, + "eval_map_bus": 0.3505, + "eval_map_car": 0.3286, + "eval_map_container": 0.3484, + "eval_map_large": 0.5699, + "eval_map_medium": 0.2681, + "eval_map_motorbike": 0.1973, + "eval_map_small": 0.0314, + "eval_mar_1": 0.1955, + "eval_mar_10": 0.397, + "eval_mar_100": 0.4515, + "eval_mar_100_bus": 0.5297, + "eval_mar_100_car": 0.4495, + "eval_mar_100_container": 0.4962, + "eval_mar_100_motorbike": 0.3305, + "eval_mar_large": 0.6712, + "eval_mar_medium": 0.4311, + "eval_mar_small": 0.1435, + "eval_runtime": 113.3089, + "eval_samples_per_second": 20.325, + "eval_steps_per_second": 2.542, + "step": 103725 + }, + { + "epoch": 45.11930585683297, + "grad_norm": 6453.04833984375, + "learning_rate": 1.4462822596803221e-05, + "loss": 1.2838, + "step": 104000 + }, + { + "epoch": 45.33622559652928, + "grad_norm": 6873.46484375, + "learning_rate": 1.4065637228751328e-05, + "loss": 1.2863, + "step": 104500 + }, + { + "epoch": 45.5531453362256, + "grad_norm": 4747.73388671875, + "learning_rate": 1.3673087404328727e-05, + "loss": 1.2938, + "step": 105000 + }, + { + "epoch": 45.770065075921906, + "grad_norm": 7545.3359375, + "learning_rate": 1.3285223762581107e-05, + "loss": 1.2803, + "step": 105500 + }, + { + "epoch": 45.98698481561822, + "grad_norm": 11557.0927734375, + "learning_rate": 1.290209633803514e-05, + "loss": 1.2763, + "step": 106000 + }, + { + "epoch": 46.0, + "eval_loss": 1.256932020187378, + "eval_map": 0.3055, + "eval_map_50": 0.5917, + "eval_map_75": 0.2824, + "eval_map_bus": 0.3482, + "eval_map_car": 0.3306, + "eval_map_container": 0.3467, + "eval_map_large": 0.5765, + "eval_map_medium": 0.2678, + "eval_map_motorbike": 0.1965, + "eval_map_small": 0.0329, + "eval_mar_1": 0.1953, + "eval_mar_10": 0.3975, + "eval_mar_100": 0.4506, + "eval_mar_100_bus": 0.5298, + "eval_mar_100_car": 0.4499, + "eval_mar_100_container": 0.493, + "eval_mar_100_motorbike": 0.3298, + "eval_mar_large": 0.6723, + "eval_mar_medium": 0.4301, + "eval_mar_small": 0.144, + "eval_runtime": 113.2333, + "eval_samples_per_second": 20.339, + "eval_steps_per_second": 2.543, + "step": 106030 + }, + { + "epoch": 46.20390455531454, + "grad_norm": 28058.578125, + "learning_rate": 1.2523754554244121e-05, + "loss": 1.2831, + "step": 106500 + }, + { + "epoch": 46.420824295010846, + "grad_norm": 26312.306640625, + "learning_rate": 1.2150247217412186e-05, + "loss": 1.2796, + "step": 107000 + }, + { + "epoch": 46.63774403470716, + "grad_norm": 20001.359375, + "learning_rate": 1.1781622510098372e-05, + "loss": 1.2823, + "step": 107500 + }, + { + "epoch": 46.85466377440347, + "grad_norm": 30923.48046875, + "learning_rate": 1.1418650422438832e-05, + "loss": 1.2791, + "step": 108000 + }, + { + "epoch": 47.0, + "eval_loss": 1.2564352750778198, + "eval_map": 0.3049, + "eval_map_50": 0.593, + "eval_map_75": 0.2806, + "eval_map_bus": 0.3465, + "eval_map_car": 0.3318, + "eval_map_container": 0.3458, + "eval_map_large": 0.5726, + "eval_map_medium": 0.2679, + "eval_map_motorbike": 0.1953, + "eval_map_small": 0.0322, + "eval_mar_1": 0.1956, + "eval_mar_10": 0.3959, + "eval_mar_100": 0.4482, + "eval_mar_100_bus": 0.5209, + "eval_mar_100_car": 0.4511, + "eval_mar_100_container": 0.4908, + "eval_mar_100_motorbike": 0.33, + "eval_mar_large": 0.6679, + "eval_mar_medium": 0.4258, + "eval_mar_small": 0.1452, + "eval_runtime": 113.1112, + "eval_samples_per_second": 20.36, + "eval_steps_per_second": 2.546, + "step": 108335 + }, + { + "epoch": 47.071583514099785, + "grad_norm": 12088.6435546875, + "learning_rate": 1.106063545260258e-05, + "loss": 1.2778, + "step": 108500 + }, + { + "epoch": 47.288503253796094, + "grad_norm": 15733.0224609375, + "learning_rate": 1.0706921215184502e-05, + "loss": 1.2828, + "step": 109000 + }, + { + "epoch": 47.50542299349241, + "grad_norm": 12590.6767578125, + "learning_rate": 1.0358275796773904e-05, + "loss": 1.2794, + "step": 109500 + }, + { + "epoch": 47.72234273318872, + "grad_norm": 10663.71484375, + "learning_rate": 1.001474417273483e-05, + "loss": 1.2814, + "step": 110000 + }, + { + "epoch": 47.939262472885034, + "grad_norm": 16210.3134765625, + "learning_rate": 9.676370658750372e-06, + "loss": 1.2792, + "step": 110500 + }, + { + "epoch": 48.0, + "eval_loss": 1.2534351348876953, + "eval_map": 0.3065, + "eval_map_50": 0.5926, + "eval_map_75": 0.2831, + "eval_map_bus": 0.3493, + "eval_map_car": 0.335, + "eval_map_container": 0.3455, + "eval_map_large": 0.5738, + "eval_map_medium": 0.2681, + "eval_map_motorbike": 0.1961, + "eval_map_small": 0.0297, + "eval_mar_1": 0.196, + "eval_mar_10": 0.3991, + "eval_mar_100": 0.4509, + "eval_mar_100_bus": 0.5296, + "eval_mar_100_car": 0.453, + "eval_mar_100_container": 0.4924, + "eval_mar_100_motorbike": 0.3286, + "eval_mar_large": 0.6753, + "eval_mar_medium": 0.4311, + "eval_mar_small": 0.1507, + "eval_runtime": 112.0353, + "eval_samples_per_second": 20.556, + "eval_steps_per_second": 2.571, + "step": 110640 + }, + { + "epoch": 48.15618221258134, + "grad_norm": 6229.44921875, + "learning_rate": 9.343860028577056e-06, + "loss": 1.2906, + "step": 111000 + }, + { + "epoch": 48.37310195227766, + "grad_norm": 5420.70849609375, + "learning_rate": 9.015922482605332e-06, + "loss": 1.2666, + "step": 111500 + }, + { + "epoch": 48.590021691973966, + "grad_norm": 3634.189697265625, + "learning_rate": 8.693271894987293e-06, + "loss": 1.2808, + "step": 112000 + }, + { + "epoch": 48.80694143167028, + "grad_norm": 6041.09619140625, + "learning_rate": 8.375949887746026e-06, + "loss": 1.2819, + "step": 112500 + }, + { + "epoch": 49.0, + "eval_loss": 1.254146695137024, + "eval_map": 0.3053, + "eval_map_50": 0.5921, + "eval_map_75": 0.2825, + "eval_map_bus": 0.3477, + "eval_map_car": 0.3319, + "eval_map_container": 0.3467, + "eval_map_large": 0.5698, + "eval_map_medium": 0.267, + "eval_map_motorbike": 0.1949, + "eval_map_small": 0.0279, + "eval_mar_1": 0.1953, + "eval_mar_10": 0.3973, + "eval_mar_100": 0.4501, + "eval_mar_100_bus": 0.5252, + "eval_mar_100_car": 0.4526, + "eval_mar_100_container": 0.4931, + "eval_mar_100_motorbike": 0.3292, + "eval_mar_large": 0.6678, + "eval_mar_medium": 0.429, + "eval_mar_small": 0.1504, + "eval_runtime": 112.0266, + "eval_samples_per_second": 20.558, + "eval_steps_per_second": 2.571, + "step": 112945 + }, + { + "epoch": 49.0238611713666, + "grad_norm": 20567.572265625, + "learning_rate": 8.06399739551611e-06, + "loss": 1.2793, + "step": 113000 + }, + { + "epoch": 49.240780911062906, + "grad_norm": 4496.19921875, + "learning_rate": 7.758062320395703e-06, + "loss": 1.2768, + "step": 113500 + }, + { + "epoch": 49.45770065075922, + "grad_norm": 4267.62255859375, + "learning_rate": 7.456957948623988e-06, + "loss": 1.2722, + "step": 114000 + }, + { + "epoch": 49.67462039045553, + "grad_norm": 6082.02978515625, + "learning_rate": 7.161341642100794e-06, + "loss": 1.2764, + "step": 114500 + }, + { + "epoch": 49.891540130151846, + "grad_norm": 12462.046875, + "learning_rate": 6.87125153541876e-06, + "loss": 1.2875, + "step": 115000 + }, + { + "epoch": 50.0, + "eval_loss": 1.2500559091567993, + "eval_map": 0.3077, + "eval_map_50": 0.5945, + "eval_map_75": 0.2867, + "eval_map_bus": 0.353, + "eval_map_car": 0.335, + "eval_map_container": 0.3467, + "eval_map_large": 0.5778, + "eval_map_medium": 0.2708, + "eval_map_motorbike": 0.196, + "eval_map_small": 0.0295, + "eval_mar_1": 0.197, + "eval_mar_10": 0.3999, + "eval_mar_100": 0.4529, + "eval_mar_100_bus": 0.5313, + "eval_mar_100_car": 0.4548, + "eval_mar_100_container": 0.495, + "eval_mar_100_motorbike": 0.3303, + "eval_mar_large": 0.6791, + "eval_mar_medium": 0.4327, + "eval_mar_small": 0.156, + "eval_runtime": 112.3685, + "eval_samples_per_second": 20.495, + "eval_steps_per_second": 2.563, + "step": 115250 + }, + { + "epoch": 50.108459869848154, + "grad_norm": 9009.076171875, + "learning_rate": 6.586725050289078e-06, + "loss": 1.2823, + "step": 115500 + }, + { + "epoch": 50.32537960954447, + "grad_norm": 29458.884765625, + "learning_rate": 6.307798890714117e-06, + "loss": 1.2757, + "step": 116000 + }, + { + "epoch": 50.54229934924078, + "grad_norm": 12566.5400390625, + "learning_rate": 6.035049969368911e-06, + "loss": 1.2777, + "step": 116500 + }, + { + "epoch": 50.759219088937094, + "grad_norm": 13344.3671875, + "learning_rate": 5.767420300672449e-06, + "loss": 1.2738, + "step": 117000 + }, + { + "epoch": 50.9761388286334, + "grad_norm": 7834.20703125, + "learning_rate": 5.505496648090353e-06, + "loss": 1.2744, + "step": 117500 + }, + { + "epoch": 51.0, + "eval_loss": 1.2519479990005493, + "eval_map": 0.3055, + "eval_map_50": 0.5938, + "eval_map_75": 0.2859, + "eval_map_bus": 0.3491, + "eval_map_car": 0.3304, + "eval_map_container": 0.3461, + "eval_map_large": 0.5779, + "eval_map_medium": 0.2683, + "eval_map_motorbike": 0.1965, + "eval_map_small": 0.0293, + "eval_mar_1": 0.1954, + "eval_mar_10": 0.3983, + "eval_mar_100": 0.4515, + "eval_mar_100_bus": 0.5298, + "eval_mar_100_car": 0.4514, + "eval_mar_100_container": 0.4927, + "eval_mar_100_motorbike": 0.3323, + "eval_mar_large": 0.6792, + "eval_mar_medium": 0.4307, + "eval_mar_small": 0.1574, + "eval_runtime": 111.7092, + "eval_samples_per_second": 20.616, + "eval_steps_per_second": 2.578, + "step": 117555 + }, + { + "epoch": 51.19305856832972, + "grad_norm": 5508.74267578125, + "learning_rate": 5.2493127998527795e-06, + "loss": 1.2873, + "step": 118000 + }, + { + "epoch": 51.409978308026034, + "grad_norm": 16584.37109375, + "learning_rate": 4.999396842843879e-06, + "loss": 1.2651, + "step": 118500 + }, + { + "epoch": 51.62689804772234, + "grad_norm": 4211.126953125, + "learning_rate": 4.754779359924699e-06, + "loss": 1.2731, + "step": 119000 + }, + { + "epoch": 51.84381778741866, + "grad_norm": 13401.8759765625, + "learning_rate": 4.5159985241065015e-06, + "loss": 1.2703, + "step": 119500 + }, + { + "epoch": 52.0, + "eval_loss": 1.2507617473602295, + "eval_map": 0.3076, + "eval_map_50": 0.5957, + "eval_map_75": 0.2871, + "eval_map_bus": 0.3493, + "eval_map_car": 0.3356, + "eval_map_container": 0.3485, + "eval_map_large": 0.5757, + "eval_map_medium": 0.2705, + "eval_map_motorbike": 0.1971, + "eval_map_small": 0.0292, + "eval_mar_1": 0.1964, + "eval_mar_10": 0.4, + "eval_mar_100": 0.4531, + "eval_mar_100_bus": 0.5316, + "eval_mar_100_car": 0.4556, + "eval_mar_100_container": 0.4943, + "eval_mar_100_motorbike": 0.3309, + "eval_mar_large": 0.6751, + "eval_mar_medium": 0.4329, + "eval_mar_small": 0.1567, + "eval_runtime": 114.4351, + "eval_samples_per_second": 20.125, + "eval_steps_per_second": 2.517, + "step": 119860 + }, + { + "epoch": 52.060737527114966, + "grad_norm": 4337.31201171875, + "learning_rate": 4.28308513818908e-06, + "loss": 1.2848, + "step": 120000 + }, + { + "epoch": 52.27765726681128, + "grad_norm": 33795.9140625, + "learning_rate": 4.056069248069421e-06, + "loss": 1.2738, + "step": 120500 + }, + { + "epoch": 52.49457700650759, + "grad_norm": 7602.009765625, + "learning_rate": 3.835416383072454e-06, + "loss": 1.2754, + "step": 121000 + }, + { + "epoch": 52.711496746203906, + "grad_norm": 6129.99755859375, + "learning_rate": 3.6202706367901073e-06, + "loss": 1.2683, + "step": 121500 + }, + { + "epoch": 52.928416485900215, + "grad_norm": 5628.37939453125, + "learning_rate": 3.411107889576004e-06, + "loss": 1.2697, + "step": 122000 + }, + { + "epoch": 53.0, + "eval_loss": 1.2477965354919434, + "eval_map": 0.3089, + "eval_map_50": 0.5969, + "eval_map_75": 0.2891, + "eval_map_bus": 0.3545, + "eval_map_car": 0.3364, + "eval_map_container": 0.3478, + "eval_map_large": 0.5734, + "eval_map_medium": 0.2729, + "eval_map_motorbike": 0.1971, + "eval_map_small": 0.0292, + "eval_mar_1": 0.1982, + "eval_mar_10": 0.4002, + "eval_mar_100": 0.4545, + "eval_mar_100_bus": 0.5327, + "eval_mar_100_car": 0.4586, + "eval_mar_100_container": 0.4959, + "eval_mar_100_motorbike": 0.3309, + "eval_mar_large": 0.6754, + "eval_mar_medium": 0.4349, + "eval_mar_small": 0.1496, + "eval_runtime": 113.1517, + "eval_samples_per_second": 20.353, + "eval_steps_per_second": 2.545, + "step": 122165 + }, + { + "epoch": 53.14533622559653, + "grad_norm": 7682.4912109375, + "learning_rate": 3.207955123487577e-06, + "loss": 1.2729, + "step": 122500 + }, + { + "epoch": 53.36225596529284, + "grad_norm": 16330.740234375, + "learning_rate": 3.010838545292888e-06, + "loss": 1.2656, + "step": 123000 + }, + { + "epoch": 53.579175704989154, + "grad_norm": 10252.83203125, + "learning_rate": 2.8201596270095608e-06, + "loss": 1.2726, + "step": 123500 + }, + { + "epoch": 53.79609544468546, + "grad_norm": 9575.732421875, + "learning_rate": 2.635178730346277e-06, + "loss": 1.268, + "step": 124000 + }, + { + "epoch": 54.0, + "eval_loss": 1.2473701238632202, + "eval_map": 0.3087, + "eval_map_50": 0.598, + "eval_map_75": 0.2878, + "eval_map_bus": 0.3532, + "eval_map_car": 0.3345, + "eval_map_container": 0.3464, + "eval_map_large": 0.5743, + "eval_map_medium": 0.2726, + "eval_map_motorbike": 0.2006, + "eval_map_small": 0.0289, + "eval_mar_1": 0.1978, + "eval_mar_10": 0.4014, + "eval_mar_100": 0.455, + "eval_mar_100_bus": 0.5352, + "eval_mar_100_car": 0.4574, + "eval_mar_100_container": 0.494, + "eval_mar_100_motorbike": 0.3333, + "eval_mar_large": 0.6771, + "eval_mar_medium": 0.4354, + "eval_mar_small": 0.1567, + "eval_runtime": 112.6797, + "eval_samples_per_second": 20.438, + "eval_steps_per_second": 2.556, + "step": 124470 + }, + { + "epoch": 54.01301518438178, + "grad_norm": 3493.781005859375, + "learning_rate": 2.4566595382205683e-06, + "loss": 1.2844, + "step": 124500 + }, + { + "epoch": 54.229934924078094, + "grad_norm": 1795.1060791015625, + "learning_rate": 2.2839095795851752e-06, + "loss": 1.2625, + "step": 125000 + }, + { + "epoch": 54.4468546637744, + "grad_norm": 4786.23046875, + "learning_rate": 2.117315010997223e-06, + "loss": 1.2669, + "step": 125500 + }, + { + "epoch": 54.66377440347072, + "grad_norm": 4156.8173828125, + "learning_rate": 1.956897323206286e-06, + "loss": 1.278, + "step": 126000 + }, + { + "epoch": 54.88069414316703, + "grad_norm": 3802.805908203125, + "learning_rate": 1.8026772101424282e-06, + "loss": 1.2765, + "step": 126500 + }, + { + "epoch": 55.0, + "eval_loss": 1.2465760707855225, + "eval_map": 0.3091, + "eval_map_50": 0.5973, + "eval_map_75": 0.2896, + "eval_map_bus": 0.3544, + "eval_map_car": 0.3361, + "eval_map_container": 0.3469, + "eval_map_large": 0.5784, + "eval_map_medium": 0.2729, + "eval_map_motorbike": 0.1991, + "eval_map_small": 0.0301, + "eval_mar_1": 0.1975, + "eval_mar_10": 0.4006, + "eval_mar_100": 0.4543, + "eval_mar_100_bus": 0.5321, + "eval_mar_100_car": 0.4577, + "eval_mar_100_container": 0.4944, + "eval_mar_100_motorbike": 0.3329, + "eval_mar_large": 0.6781, + "eval_mar_medium": 0.4341, + "eval_mar_small": 0.1526, + "eval_runtime": 112.2244, + "eval_samples_per_second": 20.521, + "eval_steps_per_second": 2.566, + "step": 126775 + }, + { + "epoch": 55.09761388286334, + "grad_norm": 3534.703857421875, + "learning_rate": 1.6546745662467334e-06, + "loss": 1.2739, + "step": 127000 + }, + { + "epoch": 55.31453362255965, + "grad_norm": 18442.876953125, + "learning_rate": 1.5129084839048678e-06, + "loss": 1.26, + "step": 127500 + }, + { + "epoch": 55.53145336225597, + "grad_norm": 4240.77734375, + "learning_rate": 1.377397250984197e-06, + "loss": 1.2687, + "step": 128000 + }, + { + "epoch": 55.748373101952275, + "grad_norm": 14645.23828125, + "learning_rate": 1.2481583484746096e-06, + "loss": 1.277, + "step": 128500 + }, + { + "epoch": 55.96529284164859, + "grad_norm": 5692.22412109375, + "learning_rate": 1.1254480609324047e-06, + "loss": 1.2748, + "step": 129000 + }, + { + "epoch": 56.0, + "eval_loss": 1.2461469173431396, + "eval_map": 0.3087, + "eval_map_50": 0.5979, + "eval_map_75": 0.2883, + "eval_map_bus": 0.3522, + "eval_map_car": 0.3356, + "eval_map_container": 0.3476, + "eval_map_large": 0.5786, + "eval_map_medium": 0.2726, + "eval_map_motorbike": 0.1995, + "eval_map_small": 0.0304, + "eval_mar_1": 0.1977, + "eval_mar_10": 0.4015, + "eval_mar_100": 0.4548, + "eval_mar_100_bus": 0.5339, + "eval_mar_100_car": 0.4574, + "eval_mar_100_container": 0.4949, + "eval_mar_100_motorbike": 0.3333, + "eval_mar_large": 0.6773, + "eval_mar_medium": 0.435, + "eval_mar_small": 0.1549, + "eval_runtime": 111.9985, + "eval_samples_per_second": 20.563, + "eval_steps_per_second": 2.571, + "step": 129080 + }, + { + "epoch": 56.1822125813449, + "grad_norm": 9871.357421875, + "learning_rate": 1.00879039851966e-06, + "loss": 1.2784, + "step": 129500 + }, + { + "epoch": 56.399132321041215, + "grad_norm": 8908.7138671875, + "learning_rate": 8.984526169130813e-07, + "loss": 1.2704, + "step": 130000 + }, + { + "epoch": 56.61605206073753, + "grad_norm": 16491.7421875, + "learning_rate": 7.944489497197504e-07, + "loss": 1.2697, + "step": 130500 + }, + { + "epoch": 56.83297180043384, + "grad_norm": 17585.138671875, + "learning_rate": 6.96792813444086e-07, + "loss": 1.2771, + "step": 131000 + }, + { + "epoch": 57.0, + "eval_loss": 1.2453677654266357, + "eval_map": 0.3097, + "eval_map_50": 0.5975, + "eval_map_75": 0.2886, + "eval_map_bus": 0.3528, + "eval_map_car": 0.3358, + "eval_map_container": 0.3499, + "eval_map_large": 0.5833, + "eval_map_medium": 0.2729, + "eval_map_motorbike": 0.2002, + "eval_map_small": 0.0303, + "eval_mar_1": 0.1977, + "eval_mar_10": 0.4019, + "eval_mar_100": 0.4556, + "eval_mar_100_bus": 0.5347, + "eval_mar_100_car": 0.4576, + "eval_mar_100_container": 0.4966, + "eval_mar_100_motorbike": 0.3336, + "eval_mar_large": 0.681, + "eval_mar_medium": 0.4356, + "eval_mar_small": 0.1552, + "eval_runtime": 113.6347, + "eval_samples_per_second": 20.267, + "eval_steps_per_second": 2.534, + "step": 131385 + }, + { + "epoch": 57.049891540130155, + "grad_norm": 7976.953125, + "learning_rate": 6.056730423994517e-07, + "loss": 1.2756, + "step": 131500 + }, + { + "epoch": 57.26681127982646, + "grad_norm": 6270.3828125, + "learning_rate": 5.207361854945081e-07, + "loss": 1.2654, + "step": 132000 + }, + { + "epoch": 57.48373101952278, + "grad_norm": 3344.49169921875, + "learning_rate": 4.421821685363259e-07, + "loss": 1.2664, + "step": 132500 + }, + { + "epoch": 57.70065075921909, + "grad_norm": 6102.4150390625, + "learning_rate": 3.700211250167618e-07, + "loss": 1.2718, + "step": 133000 + }, + { + "epoch": 57.9175704989154, + "grad_norm": 21649.18359375, + "learning_rate": 3.042623637321884e-07, + "loss": 1.2787, + "step": 133500 + }, + { + "epoch": 58.0, + "eval_loss": 1.245548963546753, + "eval_map": 0.3095, + "eval_map_50": 0.5973, + "eval_map_75": 0.2894, + "eval_map_bus": 0.3521, + "eval_map_car": 0.3362, + "eval_map_container": 0.3485, + "eval_map_large": 0.5805, + "eval_map_medium": 0.2738, + "eval_map_motorbike": 0.2011, + "eval_map_small": 0.0297, + "eval_mar_1": 0.1975, + "eval_mar_10": 0.4017, + "eval_mar_100": 0.4557, + "eval_mar_100_bus": 0.5339, + "eval_mar_100_car": 0.4585, + "eval_mar_100_container": 0.4966, + "eval_mar_100_motorbike": 0.3337, + "eval_mar_large": 0.6781, + "eval_mar_medium": 0.4362, + "eval_mar_small": 0.1576, + "eval_runtime": 113.2818, + "eval_samples_per_second": 20.33, + "eval_steps_per_second": 2.542, + "step": 133690 + }, + { + "epoch": 58.13449023861171, + "grad_norm": 29022.6796875, + "learning_rate": 2.449143675826382e-07, + "loss": 1.2724, + "step": 134000 + }, + { + "epoch": 58.35140997830803, + "grad_norm": 20785.9453125, + "learning_rate": 1.9198479247749534e-07, + "loss": 1.2716, + "step": 134500 + }, + { + "epoch": 58.568329718004335, + "grad_norm": 17548.994140625, + "learning_rate": 1.4556705847620922e-07, + "loss": 1.2606, + "step": 135000 + }, + { + "epoch": 58.78524945770065, + "grad_norm": 3488.3994140625, + "learning_rate": 1.0548111246240777e-07, + "loss": 1.2801, + "step": 135500 + }, + { + "epoch": 59.0, + "eval_loss": 1.2446414232254028, + "eval_map": 0.3092, + "eval_map_50": 0.5975, + "eval_map_75": 0.2889, + "eval_map_bus": 0.3524, + "eval_map_car": 0.3355, + "eval_map_container": 0.3491, + "eval_map_large": 0.5825, + "eval_map_medium": 0.2724, + "eval_map_motorbike": 0.1997, + "eval_map_small": 0.0299, + "eval_mar_1": 0.1976, + "eval_mar_10": 0.4018, + "eval_mar_100": 0.4561, + "eval_mar_100_bus": 0.5351, + "eval_mar_100_car": 0.4578, + "eval_mar_100_container": 0.4975, + "eval_mar_100_motorbike": 0.3341, + "eval_mar_large": 0.6803, + "eval_mar_medium": 0.4361, + "eval_mar_small": 0.1593, + "eval_runtime": 113.5853, + "eval_samples_per_second": 20.276, + "eval_steps_per_second": 2.536, + "step": 135995 + }, + { + "epoch": 59.00216919739697, + "grad_norm": 5638.24267578125, + "learning_rate": 7.183157442495758e-08, + "loss": 1.2682, + "step": 136000 + }, + { + "epoch": 59.219088937093275, + "grad_norm": 7117.09033203125, + "learning_rate": 4.462278516440543e-08, + "loss": 1.2661, + "step": 136500 + }, + { + "epoch": 59.43600867678959, + "grad_norm": 20093.61328125, + "learning_rate": 2.3858254622771693e-08, + "loss": 1.2717, + "step": 137000 + }, + { + "epoch": 59.6529284164859, + "grad_norm": 14570.955078125, + "learning_rate": 9.540661430756936e-09, + "loss": 1.2713, + "step": 137500 + }, + { + "epoch": 59.869848156182215, + "grad_norm": 8108.88232421875, + "learning_rate": 1.681153479959896e-09, + "loss": 1.2623, + "step": 138000 + }, + { + "epoch": 60.0, + "eval_loss": 1.2452585697174072, + "eval_map": 0.3085, + "eval_map_50": 0.5989, + "eval_map_75": 0.2888, + "eval_map_bus": 0.3511, + "eval_map_car": 0.3354, + "eval_map_container": 0.3477, + "eval_map_large": 0.5812, + "eval_map_medium": 0.272, + "eval_map_motorbike": 0.2, + "eval_map_small": 0.0295, + "eval_mar_1": 0.1973, + "eval_mar_10": 0.4012, + "eval_mar_100": 0.4549, + "eval_mar_100_bus": 0.5331, + "eval_mar_100_car": 0.4573, + "eval_mar_100_container": 0.4953, + "eval_mar_100_motorbike": 0.3339, + "eval_mar_large": 0.6786, + "eval_mar_medium": 0.435, + "eval_mar_small": 0.1586, + "eval_runtime": 113.0597, + "eval_samples_per_second": 20.37, + "eval_steps_per_second": 2.547, + "step": 138300 + }, + { + "epoch": 60.0, + "step": 138300, + "total_flos": 1.1304051141381194e+20, + "train_loss": 1.4027004139887105, + "train_runtime": 29881.2617, + "train_samples_per_second": 18.507, + "train_steps_per_second": 4.628 + } + ], + "logging_steps": 500, + "max_steps": 138300, + "num_input_tokens_seen": 0, + "num_train_epochs": 60, + "save_steps": 500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": true, + "should_training_stop": true + }, + "attributes": {} + } + }, + "total_flos": 1.1304051141381194e+20, + "train_batch_size": 4, + "trial_name": null, + "trial_params": null +}