diff --git "a/trainer_state.json" "b/trainer_state.json" --- "a/trainer_state.json" +++ "b/trainer_state.json" @@ -1,9 +1,9 @@ { "best_metric": null, "best_model_checkpoint": null, - "epoch": 1.7277551524126866, + "epoch": 0.13123359580052493, "eval_steps": 500, - "global_step": 14000, + "global_step": 100, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, @@ -11,84008 +11,608 @@ { "epoch": 0.0, "learning_rate": 0.0, - "loss": 20.5996, + "loss": 4.396, "step": 1 }, { "epoch": 0.0, - "learning_rate": 2.8135546322422195e-05, - "loss": 11.2562, + "learning_rate": 3.826919265136599e-07, + "loss": 4.21, "step": 2 }, { "epoch": 0.0, - "learning_rate": 4.459378585834222e-05, - "loss": 11.2609, + "learning_rate": 6.065523528528873e-07, + "loss": 4.3296, "step": 3 }, { - "epoch": 0.0, - "learning_rate": 5.627109264484439e-05, - "loss": 10.5546, + "epoch": 0.01, + "learning_rate": 7.653838530273198e-07, + "loss": 4.334, "step": 4 }, { - "epoch": 0.0, - "learning_rate": 6.532871547103689e-05, - "loss": 9.5941, + "epoch": 0.01, + "learning_rate": 8.885831358586367e-07, + "loss": 4.3884, "step": 5 }, { - "epoch": 0.0, - "learning_rate": 7.27293321807644e-05, - "loss": 8.7383, + "epoch": 0.01, + "learning_rate": 9.892442793665471e-07, + "loss": 4.32, "step": 6 }, { - "epoch": 0.0, - "learning_rate": 7.898646445303166e-05, - "loss": 7.9862, + "epoch": 0.01, + "learning_rate": 1.07435206352983e-06, + "loss": 4.2667, "step": 7 }, { - "epoch": 0.0, - "learning_rate": 8.440663896726658e-05, - "loss": 7.4495, + "epoch": 0.01, + "learning_rate": 1.1480757795409794e-06, + "loss": 4.2037, "step": 8 }, { - "epoch": 0.0, - "learning_rate": 8.918757171668444e-05, - "loss": 7.0743, + "epoch": 0.01, + "learning_rate": 1.2131047057057746e-06, + "loss": 4.4414, "step": 9 }, { - "epoch": 0.0, - "learning_rate": 9.346426179345912e-05, - "loss": 6.6677, + "epoch": 0.01, + "learning_rate": 1.2712750623722968e-06, + "loss": 4.1682, "step": 10 }, { - "epoch": 0.0, - "learning_rate": 9.733299855542168e-05, - "loss": 6.316, + "epoch": 0.01, + "learning_rate": 1.3238965507785759e-06, + "loss": 4.2204, "step": 11 }, { - "epoch": 0.0, - "learning_rate": 0.0001008648785031866, - "loss": 5.9883, + "epoch": 0.02, + "learning_rate": 1.371936205880207e-06, + "loss": 4.2052, "step": 12 }, { - "epoch": 0.0, - "learning_rate": 0.00010411389310308964, - "loss": 5.5639, + "epoch": 0.02, + "learning_rate": 1.4161284046830791e-06, + "loss": 4.1135, "step": 13 }, { - "epoch": 0.0, - "learning_rate": 0.00010712201077545386, - "loss": 5.2103, + "epoch": 0.02, + "learning_rate": 1.4570439900434897e-06, + "loss": 3.9597, "step": 14 }, { - "epoch": 0.0, - "learning_rate": 0.00010992250132937912, - "loss": 4.838, + "epoch": 0.02, + "learning_rate": 1.495135488711524e-06, + "loss": 3.8066, "step": 15 }, { - "epoch": 0.0, - "learning_rate": 0.00011254218528968878, - "loss": 4.4533, + "epoch": 0.02, + "learning_rate": 1.5307677060546395e-06, + "loss": 4.2143, "step": 16 }, { - "epoch": 0.0, - "learning_rate": 0.00011500300011117837, - "loss": 4.138, + "epoch": 0.02, + "learning_rate": 1.5642390292710904e-06, + "loss": 4.0728, "step": 17 }, { - "epoch": 0.0, - "learning_rate": 0.0001173231180391066, - "loss": 3.7683, + "epoch": 0.02, + "learning_rate": 1.5957966322194344e-06, + "loss": 4.3082, "step": 18 }, { - "epoch": 0.0, - "learning_rate": 0.00011951776132878371, - "loss": 3.4471, + "epoch": 0.02, + "learning_rate": 1.6256475638101063e-06, + "loss": 4.2929, "step": 19 }, { - "epoch": 0.0, - "learning_rate": 0.00012159980811588127, - "loss": 3.2164, + "epoch": 0.03, + "learning_rate": 1.6539669888859565e-06, + "loss": 3.6756, "step": 20 }, { - "epoch": 0.0, - "learning_rate": 0.00012358025031137388, - "loss": 2.9709, + "epoch": 0.03, + "learning_rate": 1.6809044163827172e-06, + "loss": 4.0849, "step": 21 }, { - "epoch": 0.0, - "learning_rate": 0.00012546854487784388, - "loss": 2.8759, + "epoch": 0.03, + "learning_rate": 1.706588477292236e-06, + "loss": 4.216, "step": 22 }, { - "epoch": 0.0, - "learning_rate": 0.00012727288695698884, - "loss": 2.6603, + "epoch": 0.03, + "learning_rate": 1.7311306396673579e-06, + "loss": 4.128, "step": 23 }, { - "epoch": 0.0, - "learning_rate": 0.0001290004248256088, - "loss": 2.548, + "epoch": 0.03, + "learning_rate": 1.7546281323938668e-06, + "loss": 3.9854, "step": 24 }, { - "epoch": 0.0, - "learning_rate": 0.00013065743094207378, - "loss": 2.4274, + "epoch": 0.03, + "learning_rate": 1.7771662717172735e-06, + "loss": 4.1697, "step": 25 }, { - "epoch": 0.0, - "learning_rate": 0.00013224943942551182, - "loss": 2.2454, + "epoch": 0.03, + "learning_rate": 1.7988203311967389e-06, + "loss": 4.0979, "step": 26 }, { - "epoch": 0.0, - "learning_rate": 0.00013378135757502663, - "loss": 2.2135, + "epoch": 0.04, + "learning_rate": 1.8196570585586616e-06, + "loss": 3.9488, "step": 27 }, { - "epoch": 0.0, - "learning_rate": 0.00013525755709787606, - "loss": 2.1087, + "epoch": 0.04, + "learning_rate": 1.8397359165571497e-06, + "loss": 4.0495, "step": 28 }, { - "epoch": 0.0, - "learning_rate": 0.0001366819493218585, - "loss": 2.0553, + "epoch": 0.04, + "learning_rate": 1.859110105992117e-06, + "loss": 4.101, "step": 29 }, { - "epoch": 0.0, - "learning_rate": 0.0001380580476518013, - "loss": 1.9273, + "epoch": 0.04, + "learning_rate": 1.8778274152251838e-06, + "loss": 3.8262, "step": 30 }, { - "epoch": 0.0, - "learning_rate": 0.00013938901978126304, - "loss": 1.902, + "epoch": 0.04, + "learning_rate": 1.8959309303488189e-06, + "loss": 3.9416, "step": 31 }, { - "epoch": 0.0, - "learning_rate": 0.00014067773161211098, - "loss": 1.8262, + "epoch": 0.04, + "learning_rate": 1.913459632568299e-06, + "loss": 3.7671, "step": 32 }, { - "epoch": 0.0, - "learning_rate": 0.00014192678441376388, - "loss": 1.7976, + "epoch": 0.04, + "learning_rate": 1.9304489036314633e-06, + "loss": 4.0306, "step": 33 }, { - "epoch": 0.0, - "learning_rate": 0.00014313854643360055, - "loss": 1.7331, + "epoch": 0.04, + "learning_rate": 1.9469309557847503e-06, + "loss": 3.9613, "step": 34 }, { - "epoch": 0.0, - "learning_rate": 0.00014431517992406857, - "loss": 1.6727, + "epoch": 0.05, + "learning_rate": 1.962935199388467e-06, + "loss": 3.7291, "step": 35 }, { - "epoch": 0.0, - "learning_rate": 0.0001454586643615288, - "loss": 1.6559, + "epoch": 0.05, + "learning_rate": 1.9784885587330943e-06, + "loss": 3.793, "step": 36 }, { - "epoch": 0.0, - "learning_rate": 0.00014657081648315152, - "loss": 1.6092, + "epoch": 0.05, + "learning_rate": 1.993615744575612e-06, + "loss": 3.6288, "step": 37 }, { - "epoch": 0.0, - "learning_rate": 0.00014765330765120592, - "loss": 1.5719, + "epoch": 0.05, + "learning_rate": 2.0083394903237663e-06, + "loss": 3.9299, "step": 38 }, { - "epoch": 0.0, - "learning_rate": 0.00014870767896143185, - "loss": 1.5397, + "epoch": 0.05, + "learning_rate": 2.022680757535966e-06, + "loss": 3.8319, "step": 39 }, { - "epoch": 0.0, - "learning_rate": 0.00014973535443830348, - "loss": 1.5075, + "epoch": 0.05, + "learning_rate": 2.0366589153996162e-06, + "loss": 3.7277, "step": 40 }, { - "epoch": 0.01, - "learning_rate": 0.00015073765260071798, - "loss": 1.504, + "epoch": 0.05, + "learning_rate": 2.050291898044415e-06, + "loss": 3.7845, "step": 41 }, { - "epoch": 0.01, - "learning_rate": 0.0001517157966337961, - "loss": 1.4748, + "epoch": 0.06, + "learning_rate": 2.063596342896377e-06, + "loss": 3.5937, "step": 42 }, { - "epoch": 0.01, - "learning_rate": 0.00015267092336364776, - "loss": 1.3966, + "epoch": 0.06, + "learning_rate": 2.076587712750118e-06, + "loss": 3.5983, "step": 43 }, { - "epoch": 0.01, - "learning_rate": 0.00015360409120026606, - "loss": 1.4112, + "epoch": 0.06, + "learning_rate": 2.0892804038058957e-06, + "loss": 3.7483, "step": 44 }, { - "epoch": 0.01, - "learning_rate": 0.0001545162871877213, - "loss": 1.3946, + "epoch": 0.06, + "learning_rate": 2.101687841564411e-06, + "loss": 3.6843, "step": 45 }, { - "epoch": 0.01, - "learning_rate": 0.00015540843327941102, - "loss": 1.3437, + "epoch": 0.06, + "learning_rate": 2.113822566181018e-06, + "loss": 3.7431, "step": 46 }, { - "epoch": 0.01, - "learning_rate": 0.00015628139193838605, - "loss": 1.3224, + "epoch": 0.06, + "learning_rate": 2.1256963086398127e-06, + "loss": 3.5885, "step": 47 }, { - "epoch": 0.01, - "learning_rate": 0.000157135971148031, - "loss": 1.2771, + "epoch": 0.06, + "learning_rate": 2.1373200589075267e-06, + "loss": 3.6473, "step": 48 }, { - "epoch": 0.01, - "learning_rate": 0.00015797292890606333, - "loss": 1.3013, + "epoch": 0.06, + "learning_rate": 2.14870412705966e-06, + "loss": 3.3018, "step": 49 }, { - "epoch": 0.01, - "learning_rate": 0.000158792977264496, - "loss": 1.2927, + "epoch": 0.07, + "learning_rate": 2.159858198230933e-06, + "loss": 3.5044, "step": 50 }, { - "epoch": 0.01, - "learning_rate": 0.00015959678596952058, - "loss": 1.2703, + "epoch": 0.07, + "learning_rate": 2.170791382123977e-06, + "loss": 3.7595, "step": 51 }, { - "epoch": 0.01, - "learning_rate": 0.000160384985747934, - "loss": 1.2674, + "epoch": 0.07, + "learning_rate": 2.181512257710399e-06, + "loss": 3.5821, "step": 52 }, { - "epoch": 0.01, - "learning_rate": 0.00016115817128051248, - "loss": 1.234, + "epoch": 0.07, + "learning_rate": 2.192028913673789e-06, + "loss": 3.752, "step": 53 }, { - "epoch": 0.01, - "learning_rate": 0.00016191690389744885, - "loss": 1.2058, + "epoch": 0.07, + "learning_rate": 2.2023489850723216e-06, + "loss": 3.5635, "step": 54 }, { - "epoch": 0.01, - "learning_rate": 0.0001626617140264586, - "loss": 1.2098, + "epoch": 0.07, + "learning_rate": 2.2124796866372125e-06, + "loss": 3.5492, "step": 55 }, { - "epoch": 0.01, - "learning_rate": 0.00016339310342029824, - "loss": 1.1964, + "epoch": 0.07, + "learning_rate": 2.22242784307081e-06, + "loss": 3.4708, "step": 56 }, { - "epoch": 0.01, - "learning_rate": 0.00016411154718712595, - "loss": 1.162, + "epoch": 0.07, + "learning_rate": 2.2321999166629935e-06, + "loss": 3.4797, "step": 57 }, { - "epoch": 0.01, - "learning_rate": 0.00016481749564428065, - "loss": 1.176, + "epoch": 0.08, + "learning_rate": 2.2418020325057765e-06, + "loss": 3.5858, "step": 58 }, { - "epoch": 0.01, - "learning_rate": 0.00016551137601359504, - "loss": 1.1815, + "epoch": 0.08, + "learning_rate": 2.251240001552474e-06, + "loss": 3.5595, "step": 59 }, { - "epoch": 0.01, - "learning_rate": 0.00016619359397422348, - "loss": 1.1616, + "epoch": 0.08, + "learning_rate": 2.2605193417388435e-06, + "loss": 3.5123, "step": 60 }, { - "epoch": 0.01, - "learning_rate": 0.00016686453508711946, - "loss": 1.1035, + "epoch": 0.08, + "learning_rate": 2.269645297358435e-06, + "loss": 3.4325, "step": 61 }, { - "epoch": 0.01, - "learning_rate": 0.00016752456610368525, - "loss": 1.1352, + "epoch": 0.08, + "learning_rate": 2.278622856862479e-06, + "loss": 3.4439, "step": 62 }, { - "epoch": 0.01, - "learning_rate": 0.0001681740361697161, - "loss": 1.0959, + "epoch": 0.08, + "learning_rate": 2.2874567692356042e-06, + "loss": 3.4072, "step": 63 }, { - "epoch": 0.01, - "learning_rate": 0.00016881327793453316, - "loss": 1.1233, + "epoch": 0.08, + "learning_rate": 2.2961515590819588e-06, + "loss": 3.6176, "step": 64 }, { - "epoch": 0.01, - "learning_rate": 0.0001694426085741265, - "loss": 1.1331, + "epoch": 0.09, + "learning_rate": 2.3047115405417158e-06, + "loss": 3.5513, "step": 65 }, { - "epoch": 0.01, - "learning_rate": 0.00017006233073618606, - "loss": 1.1262, + "epoch": 0.09, + "learning_rate": 2.313140830145123e-06, + "loss": 3.5387, "step": 66 }, { - "epoch": 0.01, - "learning_rate": 0.0001706727334140692, - "loss": 1.0701, + "epoch": 0.09, + "learning_rate": 2.3214433586999722e-06, + "loss": 3.3643, "step": 67 }, { - "epoch": 0.01, - "learning_rate": 0.00017127409275602277, - "loss": 1.1018, + "epoch": 0.09, + "learning_rate": 2.32962288229841e-06, + "loss": 3.329, "step": 68 }, { - "epoch": 0.01, - "learning_rate": 0.00017186667281533107, - "loss": 1.0504, + "epoch": 0.09, + "learning_rate": 2.3376829925202453e-06, + "loss": 3.3631, "step": 69 }, { - "epoch": 0.01, - "learning_rate": 0.00017245072624649078, - "loss": 1.0683, + "epoch": 0.09, + "learning_rate": 2.3456271259021266e-06, + "loss": 3.505, "step": 70 }, { - "epoch": 0.01, - "learning_rate": 0.00017302649495200644, - "loss": 1.0704, + "epoch": 0.09, + "learning_rate": 2.3534585727350773e-06, + "loss": 3.3134, "step": 71 }, { - "epoch": 0.01, - "learning_rate": 0.000173594210683951, - "loss": 1.0504, + "epoch": 0.09, + "learning_rate": 2.361180485246754e-06, + "loss": 3.4492, "step": 72 }, { - "epoch": 0.01, - "learning_rate": 0.00017415409560403523, - "loss": 1.0216, + "epoch": 0.1, + "learning_rate": 2.3687958852193585e-06, + "loss": 3.2279, "step": 73 }, { - "epoch": 0.01, - "learning_rate": 0.00017470636280557373, - "loss": 1.0027, + "epoch": 0.1, + "learning_rate": 2.376307671089272e-06, + "loss": 3.3059, "step": 74 }, { - "epoch": 0.01, - "learning_rate": 0.000175251216800416, - "loss": 1.0084, + "epoch": 0.1, + "learning_rate": 2.3837186245701603e-06, + "loss": 3.4335, "step": 75 }, { - "epoch": 0.01, - "learning_rate": 0.0001757888539736281, - "loss": 1.0463, + "epoch": 0.1, + "learning_rate": 2.391031416837426e-06, + "loss": 3.3363, "step": 76 }, { - "epoch": 0.01, - "learning_rate": 0.00017631946300845336, - "loss": 1.0056, + "epoch": 0.1, + "learning_rate": 2.398248614308406e-06, + "loss": 3.2824, "step": 77 }, { - "epoch": 0.01, - "learning_rate": 0.000176843225283854, - "loss": 0.9764, + "epoch": 0.1, + "learning_rate": 2.4053726840496263e-06, + "loss": 3.3852, "step": 78 }, { - "epoch": 0.01, - "learning_rate": 0.0001773603152467301, - "loss": 0.9691, + "epoch": 0.1, + "learning_rate": 2.4124059988396154e-06, + "loss": 3.5303, "step": 79 }, { - "epoch": 0.01, - "learning_rate": 0.00017787090076072564, - "loss": 0.955, + "epoch": 0.1, + "learning_rate": 2.419350841913276e-06, + "loss": 3.3088, "step": 80 }, { - "epoch": 0.01, - "learning_rate": 0.00017837514343336887, - "loss": 0.9708, + "epoch": 0.11, + "learning_rate": 2.4262094114115493e-06, + "loss": 3.3774, "step": 81 }, { - "epoch": 0.01, - "learning_rate": 0.0001788731989231402, - "loss": 0.9518, + "epoch": 0.11, + "learning_rate": 2.4329838245580745e-06, + "loss": 3.3502, "step": 82 }, { - "epoch": 0.01, - "learning_rate": 0.00017936521722792945, - "loss": 0.9557, + "epoch": 0.11, + "learning_rate": 2.4396761215827013e-06, + "loss": 3.3218, "step": 83 }, { - "epoch": 0.01, - "learning_rate": 0.00017985134295621827, - "loss": 0.9577, + "epoch": 0.11, + "learning_rate": 2.4462882694100367e-06, + "loss": 3.4322, "step": 84 }, { - "epoch": 0.01, - "learning_rate": 0.00018033171558221527, - "loss": 0.9631, + "epoch": 0.11, + "learning_rate": 2.452822165129727e-06, + "loss": 3.297, "step": 85 }, { - "epoch": 0.01, - "learning_rate": 0.00018080646968606997, - "loss": 0.926, + "epoch": 0.11, + "learning_rate": 2.4592796392637773e-06, + "loss": 3.297, "step": 86 }, { - "epoch": 0.01, - "learning_rate": 0.00018127573518020068, - "loss": 0.9196, + "epoch": 0.11, + "learning_rate": 2.4656624588450042e-06, + "loss": 3.3604, "step": 87 }, { - "epoch": 0.01, - "learning_rate": 0.00018173963752268825, - "loss": 0.9344, + "epoch": 0.12, + "learning_rate": 2.471972330319556e-06, + "loss": 3.2638, "step": 88 }, { - "epoch": 0.01, - "learning_rate": 0.00018219829791861307, - "loss": 0.9398, + "epoch": 0.12, + "learning_rate": 2.478210902285443e-06, + "loss": 3.186, "step": 89 }, { - "epoch": 0.01, - "learning_rate": 0.00018265183351014348, - "loss": 0.9389, + "epoch": 0.12, + "learning_rate": 2.484379768078071e-06, + "loss": 3.3819, "step": 90 }, { - "epoch": 0.01, - "learning_rate": 0.00018310035755612127, - "loss": 0.9357, + "epoch": 0.12, + "learning_rate": 2.490480468212909e-06, + "loss": 3.362, "step": 91 }, { - "epoch": 0.01, - "learning_rate": 0.00018354397960183323, - "loss": 0.9268, + "epoch": 0.12, + "learning_rate": 2.4965144926946778e-06, + "loss": 3.3608, "step": 92 }, { - "epoch": 0.01, - "learning_rate": 0.00018398280563960528, - "loss": 0.947, + "epoch": 0.12, + "learning_rate": 2.5024832832017063e-06, + "loss": 3.2796, "step": 93 }, { - "epoch": 0.01, - "learning_rate": 0.00018441693826080826, - "loss": 0.9128, + "epoch": 0.12, + "learning_rate": 2.5083882351534724e-06, + "loss": 3.2159, "step": 94 }, { - "epoch": 0.01, - "learning_rate": 0.0001848464767998206, - "loss": 0.8744, + "epoch": 0.12, + "learning_rate": 2.514230699668743e-06, + "loss": 3.2004, "step": 95 }, { - "epoch": 0.01, - "learning_rate": 0.0001852715174704532, - "loss": 0.9054, + "epoch": 0.13, + "learning_rate": 2.5200119854211865e-06, + "loss": 3.1361, "step": 96 }, { - "epoch": 0.01, - "learning_rate": 0.00018569215349530506, - "loss": 0.9108, + "epoch": 0.13, + "learning_rate": 2.5257333603988366e-06, + "loss": 3.354, "step": 97 }, { - "epoch": 0.01, - "learning_rate": 0.00018610847522848557, - "loss": 0.8987, + "epoch": 0.13, + "learning_rate": 2.5313960535733198e-06, + "loss": 3.1423, "step": 98 }, { - "epoch": 0.01, - "learning_rate": 0.0001865205702721061, - "loss": 0.8952, + "epoch": 0.13, + "learning_rate": 2.5370012564843503e-06, + "loss": 3.2997, "step": 99 }, { - "epoch": 0.01, - "learning_rate": 0.00018692852358691823, - "loss": 0.8931, + "epoch": 0.13, + "learning_rate": 2.5425501247445936e-06, + "loss": 3.3779, "step": 100 - }, - { - "epoch": 0.01, - "learning_rate": 0.0001873324175974465, - "loss": 0.8943, - "step": 101 - }, - { - "epoch": 0.01, - "learning_rate": 0.00018773233229194274, - "loss": 0.9029, - "step": 102 - }, - { - "epoch": 0.01, - "learning_rate": 0.00018812834531746386, - "loss": 0.874, - "step": 103 - }, - { - "epoch": 0.01, - "learning_rate": 0.00018852053207035622, - "loss": 0.8726, - "step": 104 - }, - { - "epoch": 0.01, - "learning_rate": 0.00018890896578241075, - "loss": 0.9077, - "step": 105 - }, - { - "epoch": 0.01, - "learning_rate": 0.00018929371760293467, - "loss": 0.8552, - "step": 106 - }, - { - "epoch": 0.01, - "learning_rate": 0.0001896748566769694, - "loss": 0.8447, - "step": 107 - }, - { - "epoch": 0.01, - "learning_rate": 0.00019005245021987103, - "loss": 0.8702, - "step": 108 - }, - { - "epoch": 0.01, - "learning_rate": 0.00019042656358845297, - "loss": 0.8499, - "step": 109 - }, - { - "epoch": 0.01, - "learning_rate": 0.00019079726034888078, - "loss": 0.848, - "step": 110 - }, - { - "epoch": 0.01, - "learning_rate": 0.00019116460234149373, - "loss": 0.8333, - "step": 111 - }, - { - "epoch": 0.01, - "learning_rate": 0.00019152864974272043, - "loss": 0.8686, - "step": 112 - }, - { - "epoch": 0.01, - "learning_rate": 0.00019188946112424184, - "loss": 0.8577, - "step": 113 - }, - { - "epoch": 0.01, - "learning_rate": 0.00019224709350954813, - "loss": 0.8249, - "step": 114 - }, - { - "epoch": 0.01, - "learning_rate": 0.0001926016024280257, - "loss": 0.8363, - "step": 115 - }, - { - "epoch": 0.01, - "learning_rate": 0.00019295304196670284, - "loss": 0.8514, - "step": 116 - }, - { - "epoch": 0.01, - "learning_rate": 0.00019330146481977406, - "loss": 0.8519, - "step": 117 - }, - { - "epoch": 0.01, - "learning_rate": 0.00019364692233601725, - "loss": 0.8517, - "step": 118 - }, - { - "epoch": 0.01, - "learning_rate": 0.00019398946456421003, - "loss": 0.8294, - "step": 119 - }, - { - "epoch": 0.01, - "learning_rate": 0.0001943291402966457, - "loss": 0.8277, - "step": 120 - }, - { - "epoch": 0.01, - "learning_rate": 0.00019466599711084336, - "loss": 0.8522, - "step": 121 - }, - { - "epoch": 0.02, - "learning_rate": 0.00019500008140954167, - "loss": 0.8292, - "step": 122 - }, - { - "epoch": 0.02, - "learning_rate": 0.0001953314384590602, - "loss": 0.8131, - "step": 123 - }, - { - "epoch": 0.02, - "learning_rate": 0.00019566011242610744, - "loss": 0.8052, - "step": 124 - }, - { - "epoch": 0.02, - "learning_rate": 0.0001959861464131107, - "loss": 0.8186, - "step": 125 - }, - { - "epoch": 0.02, - "learning_rate": 0.0001963095824921383, - "loss": 0.7795, - "step": 126 - }, - { - "epoch": 0.02, - "learning_rate": 0.00019663046173748093, - "loss": 0.8162, - "step": 127 - }, - { - "epoch": 0.02, - "learning_rate": 0.00019694882425695535, - "loss": 0.7905, - "step": 128 - }, - { - "epoch": 0.02, - "learning_rate": 0.00019726470922198997, - "loss": 0.7901, - "step": 129 - }, - { - "epoch": 0.02, - "learning_rate": 0.00019757815489654872, - "loss": 0.8148, - "step": 130 - }, - { - "epoch": 0.02, - "learning_rate": 0.00019788919866494666, - "loss": 0.8095, - "step": 131 - }, - { - "epoch": 0.02, - "learning_rate": 0.00019819787705860825, - "loss": 0.8041, - "step": 132 - }, - { - "epoch": 0.02, - "learning_rate": 0.0001985042257818154, - "loss": 0.7831, - "step": 133 - }, - { - "epoch": 0.02, - "learning_rate": 0.0001988082797364914, - "loss": 0.7724, - "step": 134 - }, - { - "epoch": 0.02, - "learning_rate": 0.00019911007304606354, - "loss": 0.765, - "step": 135 - }, - { - "epoch": 0.02, - "learning_rate": 0.00019940963907844495, - "loss": 0.7972, - "step": 136 - }, - { - "epoch": 0.02, - "learning_rate": 0.0001997070104681748, - "loss": 0.7593, - "step": 137 - }, - { - "epoch": 0.02, - "learning_rate": 0.00020000221913775326, - "loss": 0.7535, - "step": 138 - }, - { - "epoch": 0.02, - "learning_rate": 0.00020029529631820618, - "loss": 0.7774, - "step": 139 - }, - { - "epoch": 0.02, - "learning_rate": 0.00020058627256891296, - "loss": 0.7892, - "step": 140 - }, - { - "epoch": 0.02, - "learning_rate": 0.00020087517779672829, - "loss": 0.7428, - "step": 141 - }, - { - "epoch": 0.02, - "learning_rate": 0.00020116204127442863, - "loss": 0.771, - "step": 142 - }, - { - "epoch": 0.02, - "learning_rate": 0.00020144689165851128, - "loss": 0.7806, - "step": 143 - }, - { - "epoch": 0.02, - "learning_rate": 0.0002017297570063732, - "loss": 0.791, - "step": 144 - }, - { - "epoch": 0.02, - "learning_rate": 0.00020201066479289535, - "loss": 0.7662, - "step": 145 - }, - { - "epoch": 0.02, - "learning_rate": 0.00020228964192645744, - "loss": 0.77, - "step": 146 - }, - { - "epoch": 0.02, - "learning_rate": 0.0002025667147644055, - "loss": 0.7447, - "step": 147 - }, - { - "epoch": 0.02, - "learning_rate": 0.00020284190912799589, - "loss": 0.7446, - "step": 148 - }, - { - "epoch": 0.02, - "learning_rate": 0.00020311525031683526, - "loss": 0.7611, - "step": 149 - }, - { - "epoch": 0.02, - "learning_rate": 0.0002033867631228382, - "loss": 0.761, - "step": 150 - }, - { - "epoch": 0.02, - "learning_rate": 0.0002036564718437211, - "loss": 0.7442, - "step": 151 - }, - { - "epoch": 0.02, - "learning_rate": 0.00020392440029605032, - "loss": 0.7439, - "step": 152 - }, - { - "epoch": 0.02, - "learning_rate": 0.00020419057182786277, - "loss": 0.7589, - "step": 153 - }, - { - "epoch": 0.02, - "learning_rate": 0.00020445500933087554, - "loss": 0.7247, - "step": 154 - }, - { - "epoch": 0.02, - "learning_rate": 0.00020471773525229995, - "loss": 0.7245, - "step": 155 - }, - { - "epoch": 0.02, - "learning_rate": 0.00020497877160627622, - "loss": 0.7234, - "step": 156 - }, - { - "epoch": 0.02, - "learning_rate": 0.00020523813998494245, - "loss": 0.7325, - "step": 157 - }, - { - "epoch": 0.02, - "learning_rate": 0.00020549586156915232, - "loss": 0.7311, - "step": 158 - }, - { - "epoch": 0.02, - "learning_rate": 0.0002057519571388547, - "loss": 0.7132, - "step": 159 - }, - { - "epoch": 0.02, - "learning_rate": 0.00020600644708314785, - "loss": 0.7442, - "step": 160 - }, - { - "epoch": 0.02, - "learning_rate": 0.00020625935141002053, - "loss": 0.6854, - "step": 161 - }, - { - "epoch": 0.02, - "learning_rate": 0.000206510689755791, - "loss": 0.7512, - "step": 162 - }, - { - "epoch": 0.02, - "learning_rate": 0.00020676048139425666, - "loss": 0.6922, - "step": 163 - }, - { - "epoch": 0.02, - "learning_rate": 0.00020700874524556237, - "loss": 0.7238, - "step": 164 - }, - { - "epoch": 0.02, - "learning_rate": 0.00020725549988480076, - "loss": 0.7165, - "step": 165 - }, - { - "epoch": 0.02, - "learning_rate": 0.00020750076355035166, - "loss": 0.7122, - "step": 166 - }, - { - "epoch": 0.02, - "learning_rate": 0.0002077445541519713, - "loss": 0.7225, - "step": 167 - }, - { - "epoch": 0.02, - "learning_rate": 0.00020798688927864046, - "loss": 0.7189, - "step": 168 - }, - { - "epoch": 0.02, - "learning_rate": 0.00020822778620617927, - "loss": 0.7182, - "step": 169 - }, - { - "epoch": 0.02, - "learning_rate": 0.00020846726190463746, - "loss": 0.7067, - "step": 170 - }, - { - "epoch": 0.02, - "learning_rate": 0.00020870533304546819, - "loss": 0.7273, - "step": 171 - }, - { - "epoch": 0.02, - "learning_rate": 0.00020894201600849216, - "loss": 0.7488, - "step": 172 - }, - { - "epoch": 0.02, - "learning_rate": 0.0002091773268886607, - "loss": 0.7133, - "step": 173 - }, - { - "epoch": 0.02, - "learning_rate": 0.0002094112815026229, - "loss": 0.7098, - "step": 174 - }, - { - "epoch": 0.02, - "learning_rate": 0.0002096438953951055, - "loss": 0.7207, - "step": 175 - }, - { - "epoch": 0.02, - "learning_rate": 0.0002098751838451104, - "loss": 0.7133, - "step": 176 - }, - { - "epoch": 0.02, - "learning_rate": 0.00021010516187193725, - "loss": 0.687, - "step": 177 - }, - { - "epoch": 0.02, - "learning_rate": 0.00021033384424103526, - "loss": 0.7027, - "step": 178 - }, - { - "epoch": 0.02, - "learning_rate": 0.00021056124546969257, - "loss": 0.6941, - "step": 179 - }, - { - "epoch": 0.02, - "learning_rate": 0.0002107873798325657, - "loss": 0.692, - "step": 180 - }, - { - "epoch": 0.02, - "learning_rate": 0.0002110122613670571, - "loss": 0.6891, - "step": 181 - }, - { - "epoch": 0.02, - "learning_rate": 0.00021123590387854348, - "loss": 0.6897, - "step": 182 - }, - { - "epoch": 0.02, - "learning_rate": 0.0002114583209454617, - "loss": 0.6941, - "step": 183 - }, - { - "epoch": 0.02, - "learning_rate": 0.00021167952592425542, - "loss": 0.6823, - "step": 184 - }, - { - "epoch": 0.02, - "learning_rate": 0.00021189953195418842, - "loss": 0.6741, - "step": 185 - }, - { - "epoch": 0.02, - "learning_rate": 0.00021211835196202747, - "loss": 0.6849, - "step": 186 - }, - { - "epoch": 0.02, - "learning_rate": 0.00021233599866660004, - "loss": 0.6666, - "step": 187 - }, - { - "epoch": 0.02, - "learning_rate": 0.00021255248458323044, - "loss": 0.6873, - "step": 188 - }, - { - "epoch": 0.02, - "learning_rate": 0.0002127678220280583, - "loss": 0.6925, - "step": 189 - }, - { - "epoch": 0.02, - "learning_rate": 0.0002129820231222428, - "loss": 0.693, - "step": 190 - }, - { - "epoch": 0.02, - "learning_rate": 0.00021319509979605714, - "loss": 0.6992, - "step": 191 - }, - { - "epoch": 0.02, - "learning_rate": 0.0002134070637928754, - "loss": 0.6835, - "step": 192 - }, - { - "epoch": 0.02, - "learning_rate": 0.00021361792667305644, - "loss": 0.6562, - "step": 193 - }, - { - "epoch": 0.02, - "learning_rate": 0.00021382769981772727, - "loss": 0.6548, - "step": 194 - }, - { - "epoch": 0.02, - "learning_rate": 0.00021403639443246875, - "loss": 0.6547, - "step": 195 - }, - { - "epoch": 0.02, - "learning_rate": 0.00021424402155090772, - "loss": 0.707, - "step": 196 - }, - { - "epoch": 0.02, - "learning_rate": 0.00021445059203821723, - "loss": 0.6786, - "step": 197 - }, - { - "epoch": 0.02, - "learning_rate": 0.0002146561165945283, - "loss": 0.6692, - "step": 198 - }, - { - "epoch": 0.02, - "learning_rate": 0.00021486060575825566, - "loss": 0.6463, - "step": 199 - }, - { - "epoch": 0.02, - "learning_rate": 0.00021506406990934036, - "loss": 0.6616, - "step": 200 - }, - { - "epoch": 0.02, - "learning_rate": 0.00021526651927241143, - "loss": 0.657, - "step": 201 - }, - { - "epoch": 0.02, - "learning_rate": 0.0002154679639198687, - "loss": 0.6805, - "step": 202 - }, - { - "epoch": 0.03, - "learning_rate": 0.00021566841377489016, - "loss": 0.6773, - "step": 203 - }, - { - "epoch": 0.03, - "learning_rate": 0.00021586787861436492, - "loss": 0.651, - "step": 204 - }, - { - "epoch": 0.03, - "learning_rate": 0.00021606636807175488, - "loss": 0.65, - "step": 205 - }, - { - "epoch": 0.03, - "learning_rate": 0.00021626389163988604, - "loss": 0.6584, - "step": 206 - }, - { - "epoch": 0.03, - "learning_rate": 0.00021646045867367323, - "loss": 0.6689, - "step": 207 - }, - { - "epoch": 0.03, - "learning_rate": 0.0002166560783927784, - "loss": 0.6428, - "step": 208 - }, - { - "epoch": 0.03, - "learning_rate": 0.0002168507598842054, - "loss": 0.6816, - "step": 209 - }, - { - "epoch": 0.03, - "learning_rate": 0.00021704451210483296, - "loss": 0.6791, - "step": 210 - }, - { - "epoch": 0.03, - "learning_rate": 0.00021723734388388744, - "loss": 0.6535, - "step": 211 - }, - { - "epoch": 0.03, - "learning_rate": 0.00021742926392535688, - "loss": 0.66, - "step": 212 - }, - { - "epoch": 0.03, - "learning_rate": 0.00021762028081034868, - "loss": 0.649, - "step": 213 - }, - { - "epoch": 0.03, - "learning_rate": 0.0002178104029993916, - "loss": 0.6703, - "step": 214 - }, - { - "epoch": 0.03, - "learning_rate": 0.00021799963883468467, - "loss": 0.6653, - "step": 215 - }, - { - "epoch": 0.03, - "learning_rate": 0.00021818799654229324, - "loss": 0.6675, - "step": 216 - }, - { - "epoch": 0.03, - "learning_rate": 0.00021837548423429473, - "loss": 0.6728, - "step": 217 - }, - { - "epoch": 0.03, - "learning_rate": 0.00021856210991087516, - "loss": 0.6236, - "step": 218 - }, - { - "epoch": 0.03, - "learning_rate": 0.00021874788146237747, - "loss": 0.6569, - "step": 219 - }, - { - "epoch": 0.03, - "learning_rate": 0.000218932806671303, - "loss": 0.6762, - "step": 220 - }, - { - "epoch": 0.03, - "learning_rate": 0.00021911689321426798, - "loss": 0.6441, - "step": 221 - }, - { - "epoch": 0.03, - "learning_rate": 0.0002193001486639159, - "loss": 0.6356, - "step": 222 - }, - { - "epoch": 0.03, - "learning_rate": 0.00021948258049078642, - "loss": 0.6312, - "step": 223 - }, - { - "epoch": 0.03, - "learning_rate": 0.0002196641960651426, - "loss": 0.6473, - "step": 224 - }, - { - "epoch": 0.03, - "learning_rate": 0.00021984500265875823, - "loss": 0.6395, - "step": 225 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022002500744666405, - "loss": 0.6372, - "step": 226 - }, - { - "epoch": 0.03, - "learning_rate": 0.0002202042175088569, - "loss": 0.6445, - "step": 227 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022038263983197034, - "loss": 0.6354, - "step": 228 - }, - { - "epoch": 0.03, - "learning_rate": 0.0002205602813109091, - "loss": 0.6376, - "step": 229 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022073714875044792, - "loss": 0.6191, - "step": 230 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022091324886679552, - "loss": 0.6238, - "step": 231 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022108858828912505, - "loss": 0.6109, - "step": 232 - }, - { - "epoch": 0.03, - "learning_rate": 0.0002212631735610713, - "loss": 0.6511, - "step": 233 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022143701114219624, - "loss": 0.6147, - "step": 234 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022161010740942298, - "loss": 0.6286, - "step": 235 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022178246865843943, - "loss": 0.6061, - "step": 236 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022195410110507232, - "loss": 0.6432, - "step": 237 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022212501088663222, - "loss": 0.6326, - "step": 238 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022229520406323036, - "loss": 0.6281, - "step": 239 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022246468661906788, - "loss": 0.6156, - "step": 240 - }, - { - "epoch": 0.03, - "learning_rate": 0.0002226334644636987, - "loss": 0.635, - "step": 241 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022280154343326555, - "loss": 0.6319, - "step": 242 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022296892929171103, - "loss": 0.6241, - "step": 243 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022313562773196386, - "loss": 0.6195, - "step": 244 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022330164437710026, - "loss": 0.621, - "step": 245 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022346698478148237, - "loss": 0.6173, - "step": 246 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022363165443187337, - "loss": 0.6327, - "step": 247 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022379565874852965, - "loss": 0.6602, - "step": 248 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022395900308627166, - "loss": 0.6246, - "step": 249 - }, - { - "epoch": 0.03, - "learning_rate": 0.0002241216927355329, - "loss": 0.6353, - "step": 250 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022428373292338795, - "loss": 0.6116, - "step": 251 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022444512881456048, - "loss": 0.6097, - "step": 252 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022460588551241053, - "loss": 0.5791, - "step": 253 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022476600805990314, - "loss": 0.6228, - "step": 254 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022492550144055746, - "loss": 0.6145, - "step": 255 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022508437057937756, - "loss": 0.6022, - "step": 256 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022524262034376465, - "loss": 0.6165, - "step": 257 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022540025554441216, - "loss": 0.614, - "step": 258 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022555728093618318, - "loss": 0.6022, - "step": 259 - }, - { - "epoch": 0.03, - "learning_rate": 0.0002257137012189709, - "loss": 0.6325, - "step": 260 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022586952103854292, - "loss": 0.6095, - "step": 261 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022602474498736885, - "loss": 0.6141, - "step": 262 - }, - { - "epoch": 0.03, - "learning_rate": 0.000226179377605433, - "loss": 0.5995, - "step": 263 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022633342338103046, - "loss": 0.5984, - "step": 264 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022648688675154939, - "loss": 0.5912, - "step": 265 - }, - { - "epoch": 0.03, - "learning_rate": 0.0002266397721042376, - "loss": 0.6121, - "step": 266 - }, - { - "epoch": 0.03, - "learning_rate": 0.0002267920837769553, - "loss": 0.6209, - "step": 267 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022694382605891359, - "loss": 0.6045, - "step": 268 - }, - { - "epoch": 0.03, - "learning_rate": 0.0002270950031913992, - "loss": 0.628, - "step": 269 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022724561936848572, - "loss": 0.6227, - "step": 270 - }, - { - "epoch": 0.03, - "learning_rate": 0.000227395678737732, - "loss": 0.6093, - "step": 271 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022754518540086716, - "loss": 0.5772, - "step": 272 - }, - { - "epoch": 0.03, - "learning_rate": 0.0002276941434144635, - "loss": 0.6146, - "step": 273 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022784255679059702, - "loss": 0.5905, - "step": 274 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022799042949749548, - "loss": 0.5993, - "step": 275 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022813776546017542, - "loss": 0.6021, - "step": 276 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022828456856106714, - "loss": 0.619, - "step": 277 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022843084264062837, - "loss": 0.5983, - "step": 278 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022857659149794744, - "loss": 0.5856, - "step": 279 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022872181889133515, - "loss": 0.6103, - "step": 280 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022886652853890618, - "loss": 0.6156, - "step": 281 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022901072411915047, - "loss": 0.5848, - "step": 282 - }, - { - "epoch": 0.03, - "learning_rate": 0.00022915440927149419, - "loss": 0.6229, - "step": 283 - }, - { - "epoch": 0.04, - "learning_rate": 0.00022929758759685084, - "loss": 0.618, - "step": 284 - }, - { - "epoch": 0.04, - "learning_rate": 0.00022944026265816285, - "loss": 0.6025, - "step": 285 - }, - { - "epoch": 0.04, - "learning_rate": 0.0002295824379809335, - "loss": 0.5933, - "step": 286 - }, - { - "epoch": 0.04, - "learning_rate": 0.00022972411705374964, - "loss": 0.6136, - "step": 287 - }, - { - "epoch": 0.04, - "learning_rate": 0.0002298653033287954, - "loss": 0.6173, - "step": 288 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023000600022235674, - "loss": 0.6339, - "step": 289 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023014621111531756, - "loss": 0.6105, - "step": 290 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023028593935364727, - "loss": 0.5943, - "step": 291 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023042518824887962, - "loss": 0.5828, - "step": 292 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023056396107858397, - "loss": 0.576, - "step": 293 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023070226108682772, - "loss": 0.5977, - "step": 294 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023084009148463194, - "loss": 0.599, - "step": 295 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023097745545041807, - "loss": 0.613, - "step": 296 - }, - { - "epoch": 0.04, - "learning_rate": 0.0002311143561304483, - "loss": 0.6109, - "step": 297 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023125079663925745, - "loss": 0.5874, - "step": 298 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023138678006007847, - "loss": 0.5783, - "step": 299 - }, - { - "epoch": 0.04, - "learning_rate": 0.0002315223094452604, - "loss": 0.5931, - "step": 300 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023165738781667943, - "loss": 0.5988, - "step": 301 - }, - { - "epoch": 0.04, - "learning_rate": 0.0002317920181661433, - "loss": 0.5841, - "step": 302 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023192620345578868, - "loss": 0.5895, - "step": 303 - }, - { - "epoch": 0.04, - "learning_rate": 0.0002320599466184725, - "loss": 0.6045, - "step": 304 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023219325055815637, - "loss": 0.5805, - "step": 305 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023232611815028498, - "loss": 0.5773, - "step": 306 - }, - { - "epoch": 0.04, - "learning_rate": 0.0002324585522421583, - "loss": 0.5841, - "step": 307 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023259055565329773, - "loss": 0.5794, - "step": 308 - }, - { - "epoch": 0.04, - "learning_rate": 0.0002327221311758061, - "loss": 0.5841, - "step": 309 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023285328157472213, - "loss": 0.5969, - "step": 310 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023298400958836926, - "loss": 0.5662, - "step": 311 - }, - { - "epoch": 0.04, - "learning_rate": 0.0002331143179286984, - "loss": 0.5893, - "step": 312 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023324420928162569, - "loss": 0.5553, - "step": 313 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023337368630736466, - "loss": 0.5873, - "step": 314 - }, - { - "epoch": 0.04, - "learning_rate": 0.000233502751640753, - "loss": 0.5793, - "step": 315 - }, - { - "epoch": 0.04, - "learning_rate": 0.0002336314078915745, - "loss": 0.5652, - "step": 316 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023375965764487556, - "loss": 0.546, - "step": 317 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023388750346127688, - "loss": 0.5628, - "step": 318 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023401494787728014, - "loss": 0.5829, - "step": 319 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023414199340557004, - "loss": 0.6037, - "step": 320 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023426864253531165, - "loss": 0.5803, - "step": 321 - }, - { - "epoch": 0.04, - "learning_rate": 0.0002343948977324427, - "loss": 0.5734, - "step": 322 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023452076143996208, - "loss": 0.5826, - "step": 323 - }, - { - "epoch": 0.04, - "learning_rate": 0.0002346462360782132, - "loss": 0.5475, - "step": 324 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023477132404516342, - "loss": 0.5693, - "step": 325 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023489602771667884, - "loss": 0.5862, - "step": 326 - }, - { - "epoch": 0.04, - "learning_rate": 0.0002350203494467952, - "loss": 0.5394, - "step": 327 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023514429156798458, - "loss": 0.5924, - "step": 328 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023526785639141774, - "loss": 0.5656, - "step": 329 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023539104620722297, - "loss": 0.5671, - "step": 330 - }, - { - "epoch": 0.04, - "learning_rate": 0.0002355138632847406, - "loss": 0.5638, - "step": 331 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023563630987277382, - "loss": 0.5718, - "step": 332 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023575838819983597, - "loss": 0.5677, - "step": 333 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023588010047439348, - "loss": 0.5936, - "step": 334 - }, - { - "epoch": 0.04, - "learning_rate": 0.0002360014488851061, - "loss": 0.5604, - "step": 335 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023612243560106267, - "loss": 0.5702, - "step": 336 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023624306277201385, - "loss": 0.553, - "step": 337 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023636333252860146, - "loss": 0.5655, - "step": 338 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023648324698258405, - "loss": 0.5555, - "step": 339 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023660280822705967, - "loss": 0.5497, - "step": 340 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023672201833668474, - "loss": 0.5917, - "step": 341 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023684087936789032, - "loss": 0.5611, - "step": 342 - }, - { - "epoch": 0.04, - "learning_rate": 0.000236959393359095, - "loss": 0.5514, - "step": 343 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023707756233091437, - "loss": 0.5685, - "step": 344 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023719538828636795, - "loss": 0.5824, - "step": 345 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023731287321108292, - "loss": 0.5585, - "step": 346 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023743001907349466, - "loss": 0.552, - "step": 347 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023754682782504508, - "loss": 0.5888, - "step": 348 - }, - { - "epoch": 0.04, - "learning_rate": 0.0002376633014003772, - "loss": 0.5762, - "step": 349 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023777944171752766, - "loss": 0.5668, - "step": 350 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023789525067811624, - "loss": 0.5601, - "step": 351 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023801073016753262, - "loss": 0.5674, - "step": 352 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023812588205512054, - "loss": 0.561, - "step": 353 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023824070819435943, - "loss": 0.5567, - "step": 354 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023835521042304332, - "loss": 0.5585, - "step": 355 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023846939056345747, - "loss": 0.5459, - "step": 356 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023858325042255222, - "loss": 0.5732, - "step": 357 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023869679179211475, - "loss": 0.5857, - "step": 358 - }, - { - "epoch": 0.04, - "learning_rate": 0.000238810016448938, - "loss": 0.5733, - "step": 359 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023892292615498788, - "loss": 0.5668, - "step": 360 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023903552265756742, - "loss": 0.598, - "step": 361 - }, - { - "epoch": 0.04, - "learning_rate": 0.0002391478076894793, - "loss": 0.5777, - "step": 362 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023925978296918552, - "loss": 0.5733, - "step": 363 - }, - { - "epoch": 0.04, - "learning_rate": 0.00023937145020096567, - "loss": 0.5811, - "step": 364 - }, - { - "epoch": 0.05, - "learning_rate": 0.00023948281107507213, - "loss": 0.5379, - "step": 365 - }, - { - "epoch": 0.05, - "learning_rate": 0.00023959386726788386, - "loss": 0.5803, - "step": 366 - }, - { - "epoch": 0.05, - "learning_rate": 0.00023970462044205768, - "loss": 0.5477, - "step": 367 - }, - { - "epoch": 0.05, - "learning_rate": 0.00023981507224667763, - "loss": 0.5864, - "step": 368 - }, - { - "epoch": 0.05, - "learning_rate": 0.0002399252243174024, - "loss": 0.5567, - "step": 369 - }, - { - "epoch": 0.05, - "learning_rate": 0.0002400350782766106, - "loss": 0.5484, - "step": 370 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024014463573354415, - "loss": 0.5653, - "step": 371 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024025389828444965, - "loss": 0.5795, - "step": 372 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024036286751271806, - "loss": 0.5392, - "step": 373 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024047154498902222, - "loss": 0.5583, - "step": 374 - }, - { - "epoch": 0.05, - "learning_rate": 0.0002405799322714529, - "loss": 0.5274, - "step": 375 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024068803090565268, - "loss": 0.5811, - "step": 376 - }, - { - "epoch": 0.05, - "learning_rate": 0.0002407958424249481, - "loss": 0.5701, - "step": 377 - }, - { - "epoch": 0.05, - "learning_rate": 0.0002409033683504805, - "loss": 0.5587, - "step": 378 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024101061019133444, - "loss": 0.5523, - "step": 379 - }, - { - "epoch": 0.05, - "learning_rate": 0.000241117569444665, - "loss": 0.5588, - "step": 380 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024122424759582314, - "loss": 0.5654, - "step": 381 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024133064611847933, - "loss": 0.5572, - "step": 382 - }, - { - "epoch": 0.05, - "learning_rate": 0.0002414367664747459, - "loss": 0.5406, - "step": 383 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024154261011529758, - "loss": 0.5567, - "step": 384 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024164817847949026, - "loss": 0.5588, - "step": 385 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024175347299547863, - "loss": 0.5492, - "step": 386 - }, - { - "epoch": 0.05, - "learning_rate": 0.0002418584950803322, - "loss": 0.5928, - "step": 387 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024196324614014946, - "loss": 0.559, - "step": 388 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024206772757017097, - "loss": 0.5431, - "step": 389 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024217194075489094, - "loss": 0.5436, - "step": 390 - }, - { - "epoch": 0.05, - "learning_rate": 0.0002422758870681672, - "loss": 0.5594, - "step": 391 - }, - { - "epoch": 0.05, - "learning_rate": 0.0002423795678733299, - "loss": 0.5348, - "step": 392 - }, - { - "epoch": 0.05, - "learning_rate": 0.0002424829845232889, - "loss": 0.5528, - "step": 393 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024258613836063942, - "loss": 0.5565, - "step": 394 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024268903071776701, - "loss": 0.5514, - "step": 395 - }, - { - "epoch": 0.05, - "learning_rate": 0.0002427916629169505, - "loss": 0.542, - "step": 396 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024289403627046404, - "loss": 0.5502, - "step": 397 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024299615208067785, - "loss": 0.5705, - "step": 398 - }, - { - "epoch": 0.05, - "learning_rate": 0.0002430980116401576, - "loss": 0.5501, - "step": 399 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024319961623176254, - "loss": 0.5462, - "step": 400 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024330096712874255, - "loss": 0.5567, - "step": 401 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024340206559483364, - "loss": 0.5438, - "step": 402 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024350291288435265, - "loss": 0.578, - "step": 403 - }, - { - "epoch": 0.05, - "learning_rate": 0.0002436035102422909, - "loss": 0.5747, - "step": 404 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024370385890440572, - "loss": 0.5439, - "step": 405 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024380396009731235, - "loss": 0.5797, - "step": 406 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024390381503857318, - "loss": 0.5218, - "step": 407 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024400342493678713, - "loss": 0.5508, - "step": 408 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024410279099167722, - "loss": 0.5324, - "step": 409 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024420191439417706, - "loss": 0.5526, - "step": 410 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024430079632651696, - "loss": 0.5538, - "step": 411 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024439943796230825, - "loss": 0.5467, - "step": 412 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024449784046662673, - "loss": 0.5116, - "step": 413 - }, - { - "epoch": 0.05, - "learning_rate": 0.0002445960049960954, - "loss": 0.5154, - "step": 414 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024469393269896633, - "loss": 0.5603, - "step": 415 - }, - { - "epoch": 0.05, - "learning_rate": 0.0002447916247152006, - "loss": 0.5386, - "step": 416 - }, - { - "epoch": 0.05, - "learning_rate": 0.0002448890821765484, - "loss": 0.5547, - "step": 417 - }, - { - "epoch": 0.05, - "learning_rate": 0.0002449863062066276, - "loss": 0.5591, - "step": 418 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024508329792100134, - "loss": 0.5616, - "step": 419 - }, - { - "epoch": 0.05, - "learning_rate": 0.0002451800584272552, - "loss": 0.5189, - "step": 420 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024527658882507236, - "loss": 0.5318, - "step": 421 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024537289020630965, - "loss": 0.5335, - "step": 422 - }, - { - "epoch": 0.05, - "learning_rate": 0.0002454689636550705, - "loss": 0.5381, - "step": 423 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024556481024777906, - "loss": 0.5445, - "step": 424 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024566043105325215, - "loss": 0.5311, - "step": 425 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024575582713277087, - "loss": 0.5161, - "step": 426 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024585099954015115, - "loss": 0.5328, - "step": 427 - }, - { - "epoch": 0.05, - "learning_rate": 0.0002459459493218138, - "loss": 0.5608, - "step": 428 - }, - { - "epoch": 0.05, - "learning_rate": 0.0002460406775168535, - "loss": 0.5346, - "step": 429 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024613518515710685, - "loss": 0.5354, - "step": 430 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024622947326722005, - "loss": 0.5199, - "step": 431 - }, - { - "epoch": 0.05, - "learning_rate": 0.0002463235428647154, - "loss": 0.5527, - "step": 432 - }, - { - "epoch": 0.05, - "learning_rate": 0.0002464173949600572, - "loss": 0.5602, - "step": 433 - }, - { - "epoch": 0.05, - "learning_rate": 0.0002465110305567169, - "loss": 0.5292, - "step": 434 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024660445065123756, - "loss": 0.5295, - "step": 435 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024669765623329734, - "loss": 0.5196, - "step": 436 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024679064828577254, - "loss": 0.5541, - "step": 437 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024688342778479965, - "loss": 0.5347, - "step": 438 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024697599569983695, - "loss": 0.5117, - "step": 439 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024706835299372515, - "loss": 0.5347, - "step": 440 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024716050062274775, - "loss": 0.5135, - "step": 441 - }, - { - "epoch": 0.05, - "learning_rate": 0.0002472524395366902, - "loss": 0.4996, - "step": 442 - }, - { - "epoch": 0.05, - "learning_rate": 0.0002473441706788986, - "loss": 0.5324, - "step": 443 - }, - { - "epoch": 0.05, - "learning_rate": 0.0002474356949863381, - "loss": 0.5371, - "step": 444 - }, - { - "epoch": 0.05, - "learning_rate": 0.00024752701338965, - "loss": 0.5124, - "step": 445 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002476181268132086, - "loss": 0.5364, - "step": 446 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002477090361751775, - "loss": 0.5252, - "step": 447 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002477997423875648, - "loss": 0.5328, - "step": 448 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002478902463562786, - "loss": 0.5434, - "step": 449 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002479805489811804, - "loss": 0.532, - "step": 450 - }, - { - "epoch": 0.06, - "learning_rate": 0.00024807065115613967, - "loss": 0.5388, - "step": 451 - }, - { - "epoch": 0.06, - "learning_rate": 0.00024816055376908623, - "loss": 0.5202, - "step": 452 - }, - { - "epoch": 0.06, - "learning_rate": 0.00024825025770206335, - "loss": 0.518, - "step": 453 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002483397638312791, - "loss": 0.5026, - "step": 454 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002484290730271582, - "loss": 0.5237, - "step": 455 - }, - { - "epoch": 0.06, - "learning_rate": 0.00024851818615439255, - "loss": 0.5048, - "step": 456 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002486071040719914, - "loss": 0.5371, - "step": 457 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002486958276333313, - "loss": 0.5359, - "step": 458 - }, - { - "epoch": 0.06, - "learning_rate": 0.00024878435768620503, - "loss": 0.5239, - "step": 459 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002488726950728701, - "loss": 0.5309, - "step": 460 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002489608406300973, - "loss": 0.53, - "step": 461 - }, - { - "epoch": 0.06, - "learning_rate": 0.00024904879518921773, - "loss": 0.5151, - "step": 462 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002491365595761701, - "loss": 0.5153, - "step": 463 - }, - { - "epoch": 0.06, - "learning_rate": 0.00024922413461154726, - "loss": 0.5247, - "step": 464 - }, - { - "epoch": 0.06, - "learning_rate": 0.00024931152111064216, - "loss": 0.5157, - "step": 465 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002493987198834935, - "loss": 0.5216, - "step": 466 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002494857317349307, - "loss": 0.5199, - "step": 467 - }, - { - "epoch": 0.06, - "learning_rate": 0.00024957255746461845, - "loss": 0.5145, - "step": 468 - }, - { - "epoch": 0.06, - "learning_rate": 0.00024965919786710085, - "loss": 0.5101, - "step": 469 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002497456537318452, - "loss": 0.5175, - "step": 470 - }, - { - "epoch": 0.06, - "learning_rate": 0.00024983192584328463, - "loss": 0.5174, - "step": 471 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002499180149808616, - "loss": 0.5272, - "step": 472 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002500039219190694, - "loss": 0.5273, - "step": 473 - }, - { - "epoch": 0.06, - "learning_rate": 0.00025008964742749453, - "loss": 0.5166, - "step": 474 - }, - { - "epoch": 0.06, - "learning_rate": 0.00025017519227085754, - "loss": 0.505, - "step": 475 - }, - { - "epoch": 0.06, - "learning_rate": 0.00025026055720905443, - "loss": 0.5314, - "step": 476 - }, - { - "epoch": 0.06, - "learning_rate": 0.00025034574299719693, - "loss": 0.5289, - "step": 477 - }, - { - "epoch": 0.06, - "learning_rate": 0.00025043075038565254, - "loss": 0.527, - "step": 478 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002505155801200843, - "loss": 0.5052, - "step": 479 - }, - { - "epoch": 0.06, - "learning_rate": 0.00025060023294149006, - "loss": 0.5169, - "step": 480 - }, - { - "epoch": 0.06, - "learning_rate": 0.00025068470958624115, - "loss": 0.4821, - "step": 481 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002507690107861209, - "loss": 0.5085, - "step": 482 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002508531372683627, - "loss": 0.5106, - "step": 483 - }, - { - "epoch": 0.06, - "learning_rate": 0.00025093708975568776, - "loss": 0.5273, - "step": 484 - }, - { - "epoch": 0.06, - "learning_rate": 0.00025102086896634194, - "loss": 0.5239, - "step": 485 - }, - { - "epoch": 0.06, - "learning_rate": 0.00025110447561413324, - "loss": 0.5436, - "step": 486 - }, - { - "epoch": 0.06, - "learning_rate": 0.00025118791040846774, - "loss": 0.5134, - "step": 487 - }, - { - "epoch": 0.06, - "learning_rate": 0.00025127117405438604, - "loss": 0.5183, - "step": 488 - }, - { - "epoch": 0.06, - "learning_rate": 0.00025135426725259887, - "loss": 0.508, - "step": 489 - }, - { - "epoch": 0.06, - "learning_rate": 0.00025143719069952244, - "loss": 0.4972, - "step": 490 - }, - { - "epoch": 0.06, - "learning_rate": 0.00025151994508731365, - "loss": 0.5197, - "step": 491 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002516025311039046, - "loss": 0.5347, - "step": 492 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002516849494330368, - "loss": 0.4823, - "step": 493 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002517672007542956, - "loss": 0.5184, - "step": 494 - }, - { - "epoch": 0.06, - "learning_rate": 0.00025184928574314297, - "loss": 0.5438, - "step": 495 - }, - { - "epoch": 0.06, - "learning_rate": 0.00025193120507095186, - "loss": 0.5147, - "step": 496 - }, - { - "epoch": 0.06, - "learning_rate": 0.00025201295940503813, - "loss": 0.529, - "step": 497 - }, - { - "epoch": 0.06, - "learning_rate": 0.00025209454940869385, - "loss": 0.5197, - "step": 498 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002521759757412193, - "loss": 0.5065, - "step": 499 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002522572390579551, - "loss": 0.5029, - "step": 500 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002523383400103135, - "loss": 0.5118, - "step": 501 - }, - { - "epoch": 0.06, - "learning_rate": 0.00025241927924581016, - "loss": 0.5283, - "step": 502 - }, - { - "epoch": 0.06, - "learning_rate": 0.000252500057408095, - "loss": 0.5018, - "step": 503 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002525806751369827, - "loss": 0.5226, - "step": 504 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002526611330684834, - "loss": 0.5238, - "step": 505 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002527414318348327, - "loss": 0.4869, - "step": 506 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002528215720645215, - "loss": 0.5146, - "step": 507 - }, - { - "epoch": 0.06, - "learning_rate": 0.00025290155438232535, - "loss": 0.493, - "step": 508 - }, - { - "epoch": 0.06, - "learning_rate": 0.00025298137940933386, - "loss": 0.4928, - "step": 509 - }, - { - "epoch": 0.06, - "learning_rate": 0.00025306104776297967, - "loss": 0.5222, - "step": 510 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002531405600570669, - "loss": 0.5141, - "step": 511 - }, - { - "epoch": 0.06, - "learning_rate": 0.00025321991690179977, - "loss": 0.5115, - "step": 512 - }, - { - "epoch": 0.06, - "learning_rate": 0.00025329911890381037, - "loss": 0.5213, - "step": 513 - }, - { - "epoch": 0.06, - "learning_rate": 0.00025337816666618683, - "loss": 0.4986, - "step": 514 - }, - { - "epoch": 0.06, - "learning_rate": 0.00025345706078850076, - "loss": 0.516, - "step": 515 - }, - { - "epoch": 0.06, - "learning_rate": 0.00025353580186683437, - "loss": 0.4949, - "step": 516 - }, - { - "epoch": 0.06, - "learning_rate": 0.00025361439049380774, - "loss": 0.515, - "step": 517 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002536928272586054, - "loss": 0.5152, - "step": 518 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002537711127470029, - "loss": 0.5111, - "step": 519 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002538492475413931, - "loss": 0.5021, - "step": 520 - }, - { - "epoch": 0.06, - "learning_rate": 0.00025392723222081217, - "loss": 0.5141, - "step": 521 - }, - { - "epoch": 0.06, - "learning_rate": 0.00025400506736096513, - "loss": 0.4984, - "step": 522 - }, - { - "epoch": 0.06, - "learning_rate": 0.00025408275353425164, - "loss": 0.5066, - "step": 523 - }, - { - "epoch": 0.06, - "learning_rate": 0.00025416029130979103, - "loss": 0.5511, - "step": 524 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002542376812534477, - "loss": 0.5109, - "step": 525 - }, - { - "epoch": 0.06, - "learning_rate": 0.0002543149239278552, - "loss": 0.5047, - "step": 526 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002543920198924414, - "loss": 0.4749, - "step": 527 - }, - { - "epoch": 0.07, - "learning_rate": 0.00025446896970345267, - "loss": 0.5084, - "step": 528 - }, - { - "epoch": 0.07, - "learning_rate": 0.00025454577391397767, - "loss": 0.5195, - "step": 529 - }, - { - "epoch": 0.07, - "learning_rate": 0.00025462243307397157, - "loss": 0.51, - "step": 530 - }, - { - "epoch": 0.07, - "learning_rate": 0.00025469894773027943, - "loss": 0.5219, - "step": 531 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002547753184266598, - "loss": 0.4916, - "step": 532 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002548515457038076, - "loss": 0.4878, - "step": 533 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002549276300993775, - "loss": 0.4975, - "step": 534 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002550035721480063, - "loss": 0.5175, - "step": 535 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002550793723813358, - "loss": 0.4936, - "step": 536 - }, - { - "epoch": 0.07, - "learning_rate": 0.00025515503132803475, - "loss": 0.5001, - "step": 537 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002552305495138214, - "loss": 0.4894, - "step": 538 - }, - { - "epoch": 0.07, - "learning_rate": 0.000255305927461485, - "loss": 0.5192, - "step": 539 - }, - { - "epoch": 0.07, - "learning_rate": 0.00025538116569090793, - "loss": 0.5294, - "step": 540 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002554562647190868, - "loss": 0.4904, - "step": 541 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002555312250601542, - "loss": 0.5143, - "step": 542 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002556060472253993, - "loss": 0.517, - "step": 543 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002556807317232893, - "loss": 0.5075, - "step": 544 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002557552790594899, - "loss": 0.4907, - "step": 545 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002558296897368857, - "loss": 0.4995, - "step": 546 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002559039642556009, - "loss": 0.485, - "step": 547 - }, - { - "epoch": 0.07, - "learning_rate": 0.00025597810311301923, - "loss": 0.4926, - "step": 548 - }, - { - "epoch": 0.07, - "learning_rate": 0.00025605210680380386, - "loss": 0.4986, - "step": 549 - }, - { - "epoch": 0.07, - "learning_rate": 0.00025612597581991766, - "loss": 0.4904, - "step": 550 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002561997106506422, - "loss": 0.4991, - "step": 551 - }, - { - "epoch": 0.07, - "learning_rate": 0.00025627331178259763, - "loss": 0.4891, - "step": 552 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002563467796997618, - "loss": 0.5238, - "step": 553 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002564201148834893, - "loss": 0.4976, - "step": 554 - }, - { - "epoch": 0.07, - "learning_rate": 0.00025649331781253063, - "loss": 0.4861, - "step": 555 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002565663889630506, - "loss": 0.4973, - "step": 556 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002566393288086471, - "loss": 0.4926, - "step": 557 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002567121378203696, - "loss": 0.5086, - "step": 558 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002567848164667374, - "loss": 0.4859, - "step": 559 - }, - { - "epoch": 0.07, - "learning_rate": 0.00025685736521375733, - "loss": 0.5131, - "step": 560 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002569297845249422, - "loss": 0.5121, - "step": 561 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002570020748613284, - "loss": 0.5042, - "step": 562 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002570742366814932, - "loss": 0.4832, - "step": 563 - }, - { - "epoch": 0.07, - "learning_rate": 0.00025714627044157265, - "loss": 0.4924, - "step": 564 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002572181765952788, - "loss": 0.5076, - "step": 565 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002572899555939164, - "loss": 0.4835, - "step": 566 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002573616078864005, - "loss": 0.4821, - "step": 567 - }, - { - "epoch": 0.07, - "learning_rate": 0.000257433133919273, - "loss": 0.5083, - "step": 568 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002575045341367193, - "loss": 0.5124, - "step": 569 - }, - { - "epoch": 0.07, - "learning_rate": 0.00025757580898058506, - "loss": 0.4731, - "step": 570 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002576469588903922, - "loss": 0.5054, - "step": 571 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002577179843033557, - "loss": 0.5095, - "step": 572 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002577888856543993, - "loss": 0.5109, - "step": 573 - }, - { - "epoch": 0.07, - "learning_rate": 0.00025785966337617185, - "loss": 0.483, - "step": 574 - }, - { - "epoch": 0.07, - "learning_rate": 0.00025793031789906267, - "loss": 0.4754, - "step": 575 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002580008496512176, - "loss": 0.5141, - "step": 576 - }, - { - "epoch": 0.07, - "learning_rate": 0.00025807125905855457, - "loss": 0.5059, - "step": 577 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002581415465447789, - "loss": 0.499, - "step": 578 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002582117125313987, - "loss": 0.5166, - "step": 579 - }, - { - "epoch": 0.07, - "learning_rate": 0.00025828175743773977, - "loss": 0.5106, - "step": 580 - }, - { - "epoch": 0.07, - "learning_rate": 0.00025835168168096106, - "loss": 0.4973, - "step": 581 - }, - { - "epoch": 0.07, - "learning_rate": 0.00025842148567606946, - "loss": 0.4985, - "step": 582 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002584911698359341, - "loss": 0.487, - "step": 583 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002585607345713018, - "loss": 0.5053, - "step": 584 - }, - { - "epoch": 0.07, - "learning_rate": 0.00025863018029081096, - "loss": 0.4854, - "step": 585 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002586995074010061, - "loss": 0.498, - "step": 586 - }, - { - "epoch": 0.07, - "learning_rate": 0.00025876871630635254, - "loss": 0.4959, - "step": 587 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002588378074092499, - "loss": 0.5015, - "step": 588 - }, - { - "epoch": 0.07, - "learning_rate": 0.00025890678111004675, - "loss": 0.4981, - "step": 589 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002589756378070541, - "loss": 0.4708, - "step": 590 - }, - { - "epoch": 0.07, - "learning_rate": 0.00025904437789655947, - "loss": 0.4811, - "step": 591 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002591130017728403, - "loss": 0.4968, - "step": 592 - }, - { - "epoch": 0.07, - "learning_rate": 0.00025918150982817787, - "loss": 0.4855, - "step": 593 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002592499024528705, - "loss": 0.5014, - "step": 594 - }, - { - "epoch": 0.07, - "learning_rate": 0.00025931818003524694, - "loss": 0.4892, - "step": 595 - }, - { - "epoch": 0.07, - "learning_rate": 0.00025938634296167963, - "loss": 0.4599, - "step": 596 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002594543916165979, - "loss": 0.4907, - "step": 597 - }, - { - "epoch": 0.07, - "learning_rate": 0.00025952232638250066, - "loss": 0.4968, - "step": 598 - }, - { - "epoch": 0.07, - "learning_rate": 0.00025959014763996983, - "loss": 0.4989, - "step": 599 - }, - { - "epoch": 0.07, - "learning_rate": 0.00025965785576768257, - "loss": 0.511, - "step": 600 - }, - { - "epoch": 0.07, - "learning_rate": 0.00025972545114242445, - "loss": 0.5194, - "step": 601 - }, - { - "epoch": 0.07, - "learning_rate": 0.00025979293413910164, - "loss": 0.4876, - "step": 602 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002598603051307536, - "loss": 0.5128, - "step": 603 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002599275644885655, - "loss": 0.4895, - "step": 604 - }, - { - "epoch": 0.07, - "learning_rate": 0.00025999471258188027, - "loss": 0.4759, - "step": 605 - }, - { - "epoch": 0.07, - "learning_rate": 0.0002600617497782109, - "loss": 0.492, - "step": 606 - }, - { - "epoch": 0.07, - "learning_rate": 0.00026012867644325264, - "loss": 0.5247, - "step": 607 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002601954929408947, - "loss": 0.4946, - "step": 608 - }, - { - "epoch": 0.08, - "learning_rate": 0.00026026219963323235, - "loss": 0.4908, - "step": 609 - }, - { - "epoch": 0.08, - "learning_rate": 0.00026032879688057855, - "loss": 0.4991, - "step": 610 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002603952850414757, - "loss": 0.4851, - "step": 611 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002604616644727072, - "loss": 0.4964, - "step": 612 - }, - { - "epoch": 0.08, - "learning_rate": 0.00026052793552930884, - "loss": 0.4865, - "step": 613 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002605940985645805, - "loss": 0.4917, - "step": 614 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002606601539300971, - "loss": 0.4675, - "step": 615 - }, - { - "epoch": 0.08, - "learning_rate": 0.00026072610197571994, - "loss": 0.4983, - "step": 616 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002607919430496079, - "loss": 0.5101, - "step": 617 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002608576774982283, - "loss": 0.486, - "step": 618 - }, - { - "epoch": 0.08, - "learning_rate": 0.000260923305666368, - "loss": 0.4911, - "step": 619 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002609888278971443, - "loss": 0.4879, - "step": 620 - }, - { - "epoch": 0.08, - "learning_rate": 0.00026105424453201544, - "loss": 0.4883, - "step": 621 - }, - { - "epoch": 0.08, - "learning_rate": 0.00026111955591079144, - "loss": 0.4816, - "step": 622 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002611847623716448, - "loss": 0.511, - "step": 623 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002612498642511206, - "loss": 0.5026, - "step": 624 - }, - { - "epoch": 0.08, - "learning_rate": 0.00026131486188414756, - "loss": 0.4912, - "step": 625 - }, - { - "epoch": 0.08, - "learning_rate": 0.00026137975560404787, - "loss": 0.4916, - "step": 626 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002614445457425476, - "loss": 0.4879, - "step": 627 - }, - { - "epoch": 0.08, - "learning_rate": 0.00026150923262978685, - "loss": 0.4896, - "step": 628 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002615738165943299, - "loss": 0.4952, - "step": 629 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002616382979631752, - "loss": 0.458, - "step": 630 - }, - { - "epoch": 0.08, - "learning_rate": 0.00026170267706176526, - "loss": 0.4872, - "step": 631 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002617669542139967, - "loss": 0.4794, - "step": 632 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002618311297422296, - "loss": 0.4828, - "step": 633 - }, - { - "epoch": 0.08, - "learning_rate": 0.00026189520396729775, - "loss": 0.4692, - "step": 634 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002619591772085178, - "loss": 0.4966, - "step": 635 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002620230497836991, - "loss": 0.4828, - "step": 636 - }, - { - "epoch": 0.08, - "learning_rate": 0.000262086822009153, - "loss": 0.5165, - "step": 637 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002621504941997023, - "loss": 0.4843, - "step": 638 - }, - { - "epoch": 0.08, - "learning_rate": 0.00026221406666869084, - "loss": 0.4911, - "step": 639 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002622775397279922, - "loss": 0.5008, - "step": 640 - }, - { - "epoch": 0.08, - "learning_rate": 0.00026234091368801946, - "loss": 0.4843, - "step": 641 - }, - { - "epoch": 0.08, - "learning_rate": 0.00026240418885773386, - "loss": 0.4938, - "step": 642 - }, - { - "epoch": 0.08, - "learning_rate": 0.00026246736554465396, - "loss": 0.4881, - "step": 643 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002625304440548649, - "loss": 0.4973, - "step": 644 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002625934246930269, - "loss": 0.4845, - "step": 645 - }, - { - "epoch": 0.08, - "learning_rate": 0.00026265630776238426, - "loss": 0.4975, - "step": 646 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002627190935647742, - "loss": 0.4482, - "step": 647 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002627817824006354, - "loss": 0.5101, - "step": 648 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002628443745690167, - "loss": 0.4783, - "step": 649 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002629068703675856, - "loss": 0.4874, - "step": 650 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002629692700926369, - "loss": 0.4669, - "step": 651 - }, - { - "epoch": 0.08, - "learning_rate": 0.000263031574039101, - "loss": 0.5026, - "step": 652 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002630937825005523, - "loss": 0.4624, - "step": 653 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002631558957692174, - "loss": 0.4776, - "step": 654 - }, - { - "epoch": 0.08, - "learning_rate": 0.00026321791413598354, - "loss": 0.4743, - "step": 655 - }, - { - "epoch": 0.08, - "learning_rate": 0.00026327983789040674, - "loss": 0.501, - "step": 656 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002633416673207196, - "loss": 0.4756, - "step": 657 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002634034027138399, - "loss": 0.4838, - "step": 658 - }, - { - "epoch": 0.08, - "learning_rate": 0.000263465044355378, - "loss": 0.481, - "step": 659 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002635265925296452, - "loss": 0.4686, - "step": 660 - }, - { - "epoch": 0.08, - "learning_rate": 0.00026358804751966126, - "loss": 0.4627, - "step": 661 - }, - { - "epoch": 0.08, - "learning_rate": 0.00026364940960716277, - "loss": 0.4665, - "step": 662 - }, - { - "epoch": 0.08, - "learning_rate": 0.00026371067907261016, - "loss": 0.4776, - "step": 663 - }, - { - "epoch": 0.08, - "learning_rate": 0.000263771856195196, - "loss": 0.4756, - "step": 664 - }, - { - "epoch": 0.08, - "learning_rate": 0.00026383294125285233, - "loss": 0.4763, - "step": 665 - }, - { - "epoch": 0.08, - "learning_rate": 0.00026389393452225815, - "loss": 0.4696, - "step": 666 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002639548362788473, - "loss": 0.4712, - "step": 667 - }, - { - "epoch": 0.08, - "learning_rate": 0.00026401564679681564, - "loss": 0.4695, - "step": 668 - }, - { - "epoch": 0.08, - "learning_rate": 0.00026407636634912863, - "loss": 0.4772, - "step": 669 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002641369952075283, - "loss": 0.4743, - "step": 670 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002641975336425411, - "loss": 0.4775, - "step": 671 - }, - { - "epoch": 0.08, - "learning_rate": 0.00026425798192348485, - "loss": 0.4878, - "step": 672 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002643183403184758, - "loss": 0.4863, - "step": 673 - }, - { - "epoch": 0.08, - "learning_rate": 0.00026437860909443603, - "loss": 0.4781, - "step": 674 - }, - { - "epoch": 0.08, - "learning_rate": 0.00026443878851710044, - "loss": 0.4599, - "step": 675 - }, - { - "epoch": 0.08, - "learning_rate": 0.00026449887885102364, - "loss": 0.4708, - "step": 676 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002645588803595872, - "loss": 0.4358, - "step": 677 - }, - { - "epoch": 0.08, - "learning_rate": 0.00026461879330500626, - "loss": 0.4859, - "step": 678 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002646786179483367, - "loss": 0.4555, - "step": 679 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002647383545494818, - "loss": 0.473, - "step": 680 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002647980033671991, - "loss": 0.486, - "step": 681 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002648575646591069, - "loss": 0.4965, - "step": 682 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002649170386816913, - "loss": 0.4796, - "step": 683 - }, - { - "epoch": 0.08, - "learning_rate": 0.00026497642569031253, - "loss": 0.4741, - "step": 684 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002650357259392117, - "loss": 0.474, - "step": 685 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002650949396815172, - "loss": 0.4771, - "step": 686 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002651540671692513, - "loss": 0.4733, - "step": 687 - }, - { - "epoch": 0.08, - "learning_rate": 0.0002652131086533366, - "loss": 0.48, - "step": 688 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002652720643836021, - "loss": 0.4691, - "step": 689 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026533093460879014, - "loss": 0.4667, - "step": 690 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002653897195765621, - "loss": 0.4448, - "step": 691 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002654484195335051, - "loss": 0.4997, - "step": 692 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026550703472513775, - "loss": 0.4738, - "step": 693 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002655655653959169, - "loss": 0.4679, - "step": 694 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002656240117892431, - "loss": 0.4794, - "step": 695 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002656823741474673, - "loss": 0.4896, - "step": 696 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026574065271189635, - "loss": 0.474, - "step": 697 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002657988477227994, - "loss": 0.4637, - "step": 698 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002658569594194135, - "loss": 0.4851, - "step": 699 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026591498803994984, - "loss": 0.4807, - "step": 700 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002659729338215993, - "loss": 0.4784, - "step": 701 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026603079700053843, - "loss": 0.4757, - "step": 702 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002660885778119353, - "loss": 0.4485, - "step": 703 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026614627648995483, - "loss": 0.4664, - "step": 704 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026620389326776516, - "loss": 0.4606, - "step": 705 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026626142837754275, - "loss": 0.4735, - "step": 706 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026631888205047816, - "loss": 0.4698, - "step": 707 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026637625451678165, - "loss": 0.4777, - "step": 708 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002664335460056887, - "loss": 0.4853, - "step": 709 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026649075674546553, - "loss": 0.4766, - "step": 710 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002665478869634145, - "loss": 0.4881, - "step": 711 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002666049368858797, - "loss": 0.4555, - "step": 712 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002666619067382519, - "loss": 0.465, - "step": 713 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002667187967449744, - "loss": 0.4477, - "step": 714 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026677560712954815, - "loss": 0.4578, - "step": 715 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026683233811453696, - "loss": 0.4681, - "step": 716 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002668889899215725, - "loss": 0.4845, - "step": 717 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002669455627713602, - "loss": 0.4791, - "step": 718 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026700205688368365, - "loss": 0.4723, - "step": 719 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002670584724774101, - "loss": 0.4697, - "step": 720 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026711480977049555, - "loss": 0.4907, - "step": 721 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002671710689799896, - "loss": 0.4701, - "step": 722 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002672272503220409, - "loss": 0.4695, - "step": 723 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026728335401190144, - "loss": 0.4449, - "step": 724 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002673393802639323, - "loss": 0.4427, - "step": 725 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026739532929160773, - "loss": 0.4762, - "step": 726 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002674512013075209, - "loss": 0.4627, - "step": 727 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002675069965233879, - "loss": 0.478, - "step": 728 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026756271515005327, - "loss": 0.4454, - "step": 729 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002676183573974943, - "loss": 0.4705, - "step": 730 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026767392347482613, - "loss": 0.4751, - "step": 731 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026772941359030607, - "loss": 0.4478, - "step": 732 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026778482795133853, - "loss": 0.4812, - "step": 733 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026784016676447987, - "loss": 0.4773, - "step": 734 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026789543023544247, - "loss": 0.4611, - "step": 735 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026795061856909984, - "loss": 0.4167, - "step": 736 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026800573196949086, - "loss": 0.4803, - "step": 737 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002680607706398246, - "loss": 0.472, - "step": 738 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002681157347824844, - "loss": 0.4614, - "step": 739 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002681706245990328, - "loss": 0.4734, - "step": 740 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026822544029021556, - "loss": 0.4928, - "step": 741 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026828018205596636, - "loss": 0.4803, - "step": 742 - }, - { - "epoch": 0.09, - "learning_rate": 0.000268334850095411, - "loss": 0.4701, - "step": 743 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026838944460687183, - "loss": 0.4351, - "step": 744 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026844396578787214, - "loss": 0.4763, - "step": 745 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026849841383514025, - "loss": 0.448, - "step": 746 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002685527889446139, - "loss": 0.4826, - "step": 747 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026860709131144443, - "loss": 0.4937, - "step": 748 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026866132113000107, - "loss": 0.4697, - "step": 749 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002687154785938751, - "loss": 0.4642, - "step": 750 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002687695638958838, - "loss": 0.46, - "step": 751 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026882357722807487, - "loss": 0.4761, - "step": 752 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002688775187817302, - "loss": 0.4805, - "step": 753 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002689313887473703, - "loss": 0.47, - "step": 754 - }, - { - "epoch": 0.09, - "learning_rate": 0.000268985187314758, - "loss": 0.4567, - "step": 755 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002690389146729027, - "loss": 0.4742, - "step": 756 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002690925710100642, - "loss": 0.5081, - "step": 757 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026914615651375665, - "loss": 0.4828, - "step": 758 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026919967137075274, - "loss": 0.4578, - "step": 759 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002692531157670872, - "loss": 0.4536, - "step": 760 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026930648988806113, - "loss": 0.4735, - "step": 761 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002693597939182453, - "loss": 0.4552, - "step": 762 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002694130280414847, - "loss": 0.4755, - "step": 763 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026946619244090154, - "loss": 0.4667, - "step": 764 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026951928729889964, - "loss": 0.4521, - "step": 765 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002695723127971681, - "loss": 0.4868, - "step": 766 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002696252691166847, - "loss": 0.463, - "step": 767 - }, - { - "epoch": 0.09, - "learning_rate": 0.0002696781564377198, - "loss": 0.4817, - "step": 768 - }, - { - "epoch": 0.09, - "learning_rate": 0.00026973097493984016, - "loss": 0.4809, - "step": 769 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002697837248019124, - "loss": 0.4777, - "step": 770 - }, - { - "epoch": 0.1, - "learning_rate": 0.00026983640620210686, - "loss": 0.4769, - "step": 771 - }, - { - "epoch": 0.1, - "learning_rate": 0.00026988901931790084, - "loss": 0.4603, - "step": 772 - }, - { - "epoch": 0.1, - "learning_rate": 0.00026994156432608255, - "loss": 0.4926, - "step": 773 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002699940414027544, - "loss": 0.4805, - "step": 774 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002700464507233369, - "loss": 0.4763, - "step": 775 - }, - { - "epoch": 0.1, - "learning_rate": 0.00027009879246257167, - "loss": 0.4885, - "step": 776 - }, - { - "epoch": 0.1, - "learning_rate": 0.00027015106679452536, - "loss": 0.4798, - "step": 777 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002702032738925932, - "loss": 0.4551, - "step": 778 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002702554139295017, - "loss": 0.47, - "step": 779 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002703074870773131, - "loss": 0.4735, - "step": 780 - }, - { - "epoch": 0.1, - "learning_rate": 0.00027035949350742814, - "loss": 0.5072, - "step": 781 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002704114333905894, - "loss": 0.4753, - "step": 782 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002704633068968851, - "loss": 0.4896, - "step": 783 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002705151141957521, - "loss": 0.4563, - "step": 784 - }, - { - "epoch": 0.1, - "learning_rate": 0.00027056685545597935, - "loss": 0.442, - "step": 785 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002706185308457111, - "loss": 0.4396, - "step": 786 - }, - { - "epoch": 0.1, - "learning_rate": 0.00027067014053245024, - "loss": 0.4822, - "step": 787 - }, - { - "epoch": 0.1, - "learning_rate": 0.00027072168468306163, - "loss": 0.4616, - "step": 788 - }, - { - "epoch": 0.1, - "learning_rate": 0.00027077316346377515, - "loss": 0.4474, - "step": 789 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002708245770401892, - "loss": 0.4605, - "step": 790 - }, - { - "epoch": 0.1, - "learning_rate": 0.00027087592557727353, - "loss": 0.4642, - "step": 791 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002709272092393727, - "loss": 0.4924, - "step": 792 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002709784281902091, - "loss": 0.4733, - "step": 793 - }, - { - "epoch": 0.1, - "learning_rate": 0.00027102958259288626, - "loss": 0.4693, - "step": 794 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002710806726098916, - "loss": 0.4831, - "step": 795 - }, - { - "epoch": 0.1, - "learning_rate": 0.00027113169840310003, - "loss": 0.4763, - "step": 796 - }, - { - "epoch": 0.1, - "learning_rate": 0.00027118266013377666, - "loss": 0.4717, - "step": 797 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002712335579625798, - "loss": 0.47, - "step": 798 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002712843920495644, - "loss": 0.4562, - "step": 799 - }, - { - "epoch": 0.1, - "learning_rate": 0.00027133516255418473, - "loss": 0.4896, - "step": 800 - }, - { - "epoch": 0.1, - "learning_rate": 0.00027138586963529755, - "loss": 0.4807, - "step": 801 - }, - { - "epoch": 0.1, - "learning_rate": 0.00027143651345116473, - "loss": 0.4878, - "step": 802 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002714870941594569, - "loss": 0.4597, - "step": 803 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002715376119172558, - "loss": 0.4769, - "step": 804 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002715880668810574, - "loss": 0.4888, - "step": 805 - }, - { - "epoch": 0.1, - "learning_rate": 0.00027163845920677486, - "loss": 0.4668, - "step": 806 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002716887890497414, - "loss": 0.4687, - "step": 807 - }, - { - "epoch": 0.1, - "learning_rate": 0.00027173905656471305, - "loss": 0.4532, - "step": 808 - }, - { - "epoch": 0.1, - "learning_rate": 0.00027178926190587176, - "loss": 0.4552, - "step": 809 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002718394052268279, - "loss": 0.4893, - "step": 810 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002718894866806235, - "loss": 0.4598, - "step": 811 - }, - { - "epoch": 0.1, - "learning_rate": 0.00027193950641973456, - "loss": 0.4631, - "step": 812 - }, - { - "epoch": 0.1, - "learning_rate": 0.00027198946459607416, - "loss": 0.4597, - "step": 813 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002720393613609954, - "loss": 0.4704, - "step": 814 - }, - { - "epoch": 0.1, - "learning_rate": 0.00027208919686529353, - "loss": 0.4632, - "step": 815 - }, - { - "epoch": 0.1, - "learning_rate": 0.00027213897125920935, - "loss": 0.4794, - "step": 816 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002721886846924315, - "loss": 0.4795, - "step": 817 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002722383373140994, - "loss": 0.4672, - "step": 818 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002722879292728057, - "loss": 0.4659, - "step": 819 - }, - { - "epoch": 0.1, - "learning_rate": 0.00027233746071659925, - "loss": 0.4544, - "step": 820 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002723869317929875, - "loss": 0.4693, - "step": 821 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002724363426489392, - "loss": 0.4678, - "step": 822 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002724856934308871, - "loss": 0.4583, - "step": 823 - }, - { - "epoch": 0.1, - "learning_rate": 0.00027253498428473044, - "loss": 0.4779, - "step": 824 - }, - { - "epoch": 0.1, - "learning_rate": 0.00027258421535583763, - "loss": 0.4716, - "step": 825 - }, - { - "epoch": 0.1, - "learning_rate": 0.00027263338678904886, - "loss": 0.472, - "step": 826 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002726824987286785, - "loss": 0.483, - "step": 827 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002727315513185176, - "loss": 0.4828, - "step": 828 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002727805447018369, - "loss": 0.4479, - "step": 829 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002728294790213885, - "loss": 0.4428, - "step": 830 - }, - { - "epoch": 0.1, - "learning_rate": 0.00027287835441940935, - "loss": 0.4661, - "step": 831 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002729271710376228, - "loss": 0.4566, - "step": 832 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002729759290172417, - "loss": 0.4711, - "step": 833 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002730246284989706, - "loss": 0.487, - "step": 834 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002730732696230082, - "loss": 0.4536, - "step": 835 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002731218525290498, - "loss": 0.4747, - "step": 836 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002731703773562897, - "loss": 0.4812, - "step": 837 - }, - { - "epoch": 0.1, - "learning_rate": 0.00027321884424342353, - "loss": 0.4706, - "step": 838 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002732672533286509, - "loss": 0.463, - "step": 839 - }, - { - "epoch": 0.1, - "learning_rate": 0.00027331560474967736, - "loss": 0.4501, - "step": 840 - }, - { - "epoch": 0.1, - "learning_rate": 0.000273363898643717, - "loss": 0.4593, - "step": 841 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002734121351474946, - "loss": 0.459, - "step": 842 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002734603143972484, - "loss": 0.4547, - "step": 843 - }, - { - "epoch": 0.1, - "learning_rate": 0.00027350843652873183, - "loss": 0.4713, - "step": 844 - }, - { - "epoch": 0.1, - "learning_rate": 0.00027355650167721615, - "loss": 0.4759, - "step": 845 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002736045099774927, - "loss": 0.4646, - "step": 846 - }, - { - "epoch": 0.1, - "learning_rate": 0.000273652461563875, - "loss": 0.4463, - "step": 847 - }, - { - "epoch": 0.1, - "learning_rate": 0.00027370035657020125, - "loss": 0.459, - "step": 848 - }, - { - "epoch": 0.1, - "learning_rate": 0.0002737481951298364, - "loss": 0.4638, - "step": 849 - }, - { - "epoch": 0.1, - "learning_rate": 0.00027379597737567433, - "loss": 0.4401, - "step": 850 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002738437034401404, - "loss": 0.4428, - "step": 851 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027389137345519305, - "loss": 0.4721, - "step": 852 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002739389875523267, - "loss": 0.4454, - "step": 853 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027398654586257334, - "loss": 0.4926, - "step": 854 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027403404851650504, - "loss": 0.4822, - "step": 855 - }, - { - "epoch": 0.11, - "learning_rate": 0.000274081495644236, - "loss": 0.4746, - "step": 856 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002741288873754246, - "loss": 0.4716, - "step": 857 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002741762238392757, - "loss": 0.4702, - "step": 858 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027422350516454256, - "loss": 0.4567, - "step": 859 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027427073147952904, - "loss": 0.4781, - "step": 860 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002743179029120918, - "loss": 0.4509, - "step": 861 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002743650195896423, - "loss": 0.451, - "step": 862 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002744120816391485, - "loss": 0.464, - "step": 863 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002744590891871376, - "loss": 0.4729, - "step": 864 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027450604235969755, - "loss": 0.4495, - "step": 865 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002745529412824794, - "loss": 0.4525, - "step": 866 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002745997860806989, - "loss": 0.4519, - "step": 867 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027464657687913916, - "loss": 0.463, - "step": 868 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002746933138021518, - "loss": 0.4549, - "step": 869 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002747399969736598, - "loss": 0.461, - "step": 870 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027478662651715885, - "loss": 0.4673, - "step": 871 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002748332025557196, - "loss": 0.4615, - "step": 872 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002748797252119895, - "loss": 0.47, - "step": 873 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027492619460819473, - "loss": 0.461, - "step": 874 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027497261086614235, - "loss": 0.4629, - "step": 875 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002750189741072219, - "loss": 0.4668, - "step": 876 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002750652844524073, - "loss": 0.4592, - "step": 877 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027511154202225914, - "loss": 0.4631, - "step": 878 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027515774693692615, - "loss": 0.4823, - "step": 879 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027520389931614734, - "loss": 0.4552, - "step": 880 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027524999927925367, - "loss": 0.457, - "step": 881 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027529604694516993, - "loss": 0.4543, - "step": 882 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002753420424324168, - "loss": 0.4614, - "step": 883 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002753879858591124, - "loss": 0.4576, - "step": 884 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027543387734297415, - "loss": 0.452, - "step": 885 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002754797170013208, - "loss": 0.4622, - "step": 886 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027552550495107405, - "loss": 0.4745, - "step": 887 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002755712413087603, - "loss": 0.4426, - "step": 888 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002756169261905126, - "loss": 0.4543, - "step": 889 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002756625597120722, - "loss": 0.4623, - "step": 890 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002757081419887905, - "loss": 0.473, - "step": 891 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002757536731356308, - "loss": 0.447, - "step": 892 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002757991532671698, - "loss": 0.4759, - "step": 893 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002758445824975996, - "loss": 0.4576, - "step": 894 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027588996094072947, - "loss": 0.447, - "step": 895 - }, - { - "epoch": 0.11, - "learning_rate": 0.000275935288709987, - "loss": 0.4405, - "step": 896 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002759805659184207, - "loss": 0.4403, - "step": 897 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002760257926787008, - "loss": 0.4728, - "step": 898 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002760709691031215, - "loss": 0.4739, - "step": 899 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002761160953036026, - "loss": 0.4701, - "step": 900 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027616117139169085, - "loss": 0.4435, - "step": 901 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027620619747856186, - "loss": 0.4469, - "step": 902 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027625117367502167, - "loss": 0.4657, - "step": 903 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002762961000915084, - "loss": 0.4576, - "step": 904 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027634097683809395, - "loss": 0.4586, - "step": 905 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027638580402448553, - "loss": 0.4712, - "step": 906 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027643058176002707, - "loss": 0.4599, - "step": 907 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002764753101537013, - "loss": 0.4474, - "step": 908 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002765199893141309, - "loss": 0.4463, - "step": 909 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002765646193495804, - "loss": 0.4405, - "step": 910 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027660920036795745, - "loss": 0.4735, - "step": 911 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002766537324768147, - "loss": 0.4555, - "step": 912 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027669821578335107, - "loss": 0.4627, - "step": 913 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002767426503944136, - "loss": 0.4604, - "step": 914 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002767870364164986, - "loss": 0.4717, - "step": 915 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027683137395575347, - "loss": 0.4682, - "step": 916 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027687566311797833, - "loss": 0.4613, - "step": 917 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002769199040086272, - "loss": 0.4699, - "step": 918 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027696409673280963, - "loss": 0.4703, - "step": 919 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002770082413952923, - "loss": 0.4543, - "step": 920 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002770523381005005, - "loss": 0.433, - "step": 921 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002770963869525195, - "loss": 0.4511, - "step": 922 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002771403880550961, - "loss": 0.4689, - "step": 923 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002771843415116399, - "loss": 0.444, - "step": 924 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002772282474252253, - "loss": 0.4547, - "step": 925 - }, - { - "epoch": 0.11, - "learning_rate": 0.0002772721058985923, - "loss": 0.4513, - "step": 926 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027731591703414825, - "loss": 0.4702, - "step": 927 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027735968093396945, - "loss": 0.4427, - "step": 928 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027740339769980214, - "loss": 0.4613, - "step": 929 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027744706743306434, - "loss": 0.4475, - "step": 930 - }, - { - "epoch": 0.11, - "learning_rate": 0.00027749069023484706, - "loss": 0.4449, - "step": 931 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027753426620591567, - "loss": 0.4563, - "step": 932 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027757779544671147, - "loss": 0.4778, - "step": 933 - }, - { - "epoch": 0.12, - "learning_rate": 0.0002776212780573529, - "loss": 0.4411, - "step": 934 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027766471413763694, - "loss": 0.4628, - "step": 935 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027770810378704064, - "loss": 0.4697, - "step": 936 - }, - { - "epoch": 0.12, - "learning_rate": 0.0002777514471047223, - "loss": 0.4428, - "step": 937 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027779474418952304, - "loss": 0.4552, - "step": 938 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027783799513996795, - "loss": 0.4589, - "step": 939 - }, - { - "epoch": 0.12, - "learning_rate": 0.0002778812000542674, - "loss": 0.4592, - "step": 940 - }, - { - "epoch": 0.12, - "learning_rate": 0.0002779243590303186, - "loss": 0.4505, - "step": 941 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027796747216570687, - "loss": 0.4671, - "step": 942 - }, - { - "epoch": 0.12, - "learning_rate": 0.0002780105395577068, - "loss": 0.455, - "step": 943 - }, - { - "epoch": 0.12, - "learning_rate": 0.0002780535613032838, - "loss": 0.4631, - "step": 944 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027809653749909523, - "loss": 0.4602, - "step": 945 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027813946824149164, - "loss": 0.4479, - "step": 946 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027818235362651845, - "loss": 0.4533, - "step": 947 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027822519374991666, - "loss": 0.4682, - "step": 948 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027826798870712486, - "loss": 0.4501, - "step": 949 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027831073859327973, - "loss": 0.4348, - "step": 950 - }, - { - "epoch": 0.12, - "learning_rate": 0.0002783534435032178, - "loss": 0.4539, - "step": 951 - }, - { - "epoch": 0.12, - "learning_rate": 0.0002783961035314766, - "loss": 0.4479, - "step": 952 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027843871877229596, - "loss": 0.4526, - "step": 953 - }, - { - "epoch": 0.12, - "learning_rate": 0.0002784812893196191, - "loss": 0.4515, - "step": 954 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027852381526709404, - "loss": 0.4659, - "step": 955 - }, - { - "epoch": 0.12, - "learning_rate": 0.0002785662967080747, - "loss": 0.4486, - "step": 956 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027860873373562235, - "loss": 0.4828, - "step": 957 - }, - { - "epoch": 0.12, - "learning_rate": 0.0002786511264425065, - "loss": 0.4665, - "step": 958 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027869347492120647, - "loss": 0.465, - "step": 959 - }, - { - "epoch": 0.12, - "learning_rate": 0.0002787357792639123, - "loss": 0.4859, - "step": 960 - }, - { - "epoch": 0.12, - "learning_rate": 0.0002787780395625261, - "loss": 0.4429, - "step": 961 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027882025590866334, - "loss": 0.4551, - "step": 962 - }, - { - "epoch": 0.12, - "learning_rate": 0.0002788624283936539, - "loss": 0.483, - "step": 963 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027890455710854307, - "loss": 0.4566, - "step": 964 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027894664214409335, - "loss": 0.4464, - "step": 965 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027898868359078487, - "loss": 0.4739, - "step": 966 - }, - { - "epoch": 0.12, - "learning_rate": 0.0002790306815388172, - "loss": 0.4428, - "step": 967 - }, - { - "epoch": 0.12, - "learning_rate": 0.0002790726360781099, - "loss": 0.4429, - "step": 968 - }, - { - "epoch": 0.12, - "learning_rate": 0.0002791145472983043, - "loss": 0.4483, - "step": 969 - }, - { - "epoch": 0.12, - "learning_rate": 0.0002791564152887642, - "loss": 0.4452, - "step": 970 - }, - { - "epoch": 0.12, - "learning_rate": 0.000279198240138577, - "loss": 0.4614, - "step": 971 - }, - { - "epoch": 0.12, - "learning_rate": 0.0002792400219365554, - "loss": 0.4538, - "step": 972 - }, - { - "epoch": 0.12, - "learning_rate": 0.0002792817607712378, - "loss": 0.4565, - "step": 973 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027932345673089, - "loss": 0.4562, - "step": 974 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027936510990350563, - "loss": 0.4756, - "step": 975 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027940672037680823, - "loss": 0.4592, - "step": 976 - }, - { - "epoch": 0.12, - "learning_rate": 0.0002794482882382516, - "loss": 0.4621, - "step": 977 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027948981357502105, - "loss": 0.4529, - "step": 978 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027953129647403474, - "loss": 0.4595, - "step": 979 - }, - { - "epoch": 0.12, - "learning_rate": 0.0002795727370219446, - "loss": 0.4419, - "step": 980 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027961413530513745, - "loss": 0.4662, - "step": 981 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027965549140973584, - "loss": 0.458, - "step": 982 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027969680542159965, - "loss": 0.4229, - "step": 983 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027973807742632677, - "loss": 0.477, - "step": 984 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027977930750925414, - "loss": 0.4912, - "step": 985 - }, - { - "epoch": 0.12, - "learning_rate": 0.000279820495755459, - "loss": 0.4487, - "step": 986 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027986164224976, - "loss": 0.4519, - "step": 987 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027990274707671777, - "loss": 0.4338, - "step": 988 - }, - { - "epoch": 0.12, - "learning_rate": 0.00027994381032063665, - "loss": 0.471, - "step": 989 - }, - { - "epoch": 0.12, - "learning_rate": 0.0002799848320655652, - "loss": 0.4538, - "step": 990 - }, - { - "epoch": 0.12, - "learning_rate": 0.00028002581239529745, - "loss": 0.4648, - "step": 991 - }, - { - "epoch": 0.12, - "learning_rate": 0.000280066751393374, - "loss": 0.4564, - "step": 992 - }, - { - "epoch": 0.12, - "learning_rate": 0.0002801076491430828, - "loss": 0.4735, - "step": 993 - }, - { - "epoch": 0.12, - "learning_rate": 0.0002801485057274603, - "loss": 0.4354, - "step": 994 - }, - { - "epoch": 0.12, - "learning_rate": 0.00028018932122929254, - "loss": 0.4778, - "step": 995 - }, - { - "epoch": 0.12, - "learning_rate": 0.00028023009573111603, - "loss": 0.4823, - "step": 996 - }, - { - "epoch": 0.12, - "learning_rate": 0.00028027082931521887, - "loss": 0.4464, - "step": 997 - }, - { - "epoch": 0.12, - "learning_rate": 0.00028031152206364155, - "loss": 0.4378, - "step": 998 - }, - { - "epoch": 0.12, - "learning_rate": 0.0002803521740581782, - "loss": 0.4672, - "step": 999 - }, - { - "epoch": 0.12, - "learning_rate": 0.0002803927853803773, - "loss": 0.4508, - "step": 1000 - }, - { - "epoch": 0.12, - "learning_rate": 0.000280433356111543, - "loss": 0.4725, - "step": 1001 - }, - { - "epoch": 0.12, - "learning_rate": 0.00028047388633273566, - "loss": 0.4427, - "step": 1002 - }, - { - "epoch": 0.12, - "learning_rate": 0.0002805143761247734, - "loss": 0.4477, - "step": 1003 - }, - { - "epoch": 0.12, - "learning_rate": 0.00028055482556823235, - "loss": 0.4439, - "step": 1004 - }, - { - "epoch": 0.12, - "learning_rate": 0.00028059523474344833, - "loss": 0.4221, - "step": 1005 - }, - { - "epoch": 0.12, - "learning_rate": 0.0002806356037305172, - "loss": 0.4773, - "step": 1006 - }, - { - "epoch": 0.12, - "learning_rate": 0.00028067593260929625, - "loss": 0.4427, - "step": 1007 - }, - { - "epoch": 0.12, - "learning_rate": 0.0002807162214594049, - "loss": 0.4335, - "step": 1008 - }, - { - "epoch": 0.12, - "learning_rate": 0.00028075647036022576, - "loss": 0.4286, - "step": 1009 - }, - { - "epoch": 0.12, - "learning_rate": 0.00028079667939090555, - "loss": 0.4457, - "step": 1010 - }, - { - "epoch": 0.12, - "learning_rate": 0.00028083684863035606, - "loss": 0.4359, - "step": 1011 - }, - { - "epoch": 0.12, - "learning_rate": 0.0002808769781572549, - "loss": 0.4594, - "step": 1012 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002809170680500466, - "loss": 0.4462, - "step": 1013 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028095711838694367, - "loss": 0.4552, - "step": 1014 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028099712924592706, - "loss": 0.4474, - "step": 1015 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028103710070474753, - "loss": 0.475, - "step": 1016 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002810770328409263, - "loss": 0.4435, - "step": 1017 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028111692573175605, - "loss": 0.4257, - "step": 1018 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028115677945430185, - "loss": 0.47, - "step": 1019 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028119659408540185, - "loss": 0.4352, - "step": 1020 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002812363697016685, - "loss": 0.4268, - "step": 1021 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028127610637948916, - "loss": 0.4404, - "step": 1022 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002813158041950269, - "loss": 0.4361, - "step": 1023 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028135546322422195, - "loss": 0.445, - "step": 1024 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002813950835427918, - "loss": 0.4548, - "step": 1025 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028143466522623255, - "loss": 0.4391, - "step": 1026 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028147420834981975, - "loss": 0.4662, - "step": 1027 - }, - { - "epoch": 0.13, - "learning_rate": 0.000281513712988609, - "loss": 0.4569, - "step": 1028 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002815531792174372, - "loss": 0.4372, - "step": 1029 - }, - { - "epoch": 0.13, - "learning_rate": 0.000281592607110923, - "loss": 0.4373, - "step": 1030 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002816319967434677, - "loss": 0.4343, - "step": 1031 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028167134818925656, - "loss": 0.4371, - "step": 1032 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002817106615222591, - "loss": 0.4253, - "step": 1033 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002817499368162299, - "loss": 0.4398, - "step": 1034 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028178917414471016, - "loss": 0.4409, - "step": 1035 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002818283735810276, - "loss": 0.4495, - "step": 1036 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028186753519829783, - "loss": 0.44, - "step": 1037 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002819066590694251, - "loss": 0.4381, - "step": 1038 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028194574526710294, - "loss": 0.4385, - "step": 1039 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028198479386381533, - "loss": 0.4337, - "step": 1040 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002820238049318369, - "loss": 0.4654, - "step": 1041 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028206277854323435, - "loss": 0.4396, - "step": 1042 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002821017147698669, - "loss": 0.4554, - "step": 1043 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028214061368338726, - "loss": 0.4491, - "step": 1044 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002821794753552423, - "loss": 0.4397, - "step": 1045 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002822182998566738, - "loss": 0.4367, - "step": 1046 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002822570872587194, - "loss": 0.4498, - "step": 1047 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028229583763221327, - "loss": 0.4135, - "step": 1048 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002823345510477869, - "loss": 0.4354, - "step": 1049 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028237322757586987, - "loss": 0.4622, - "step": 1050 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002824118672866907, - "loss": 0.4132, - "step": 1051 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002824504702502774, - "loss": 0.4522, - "step": 1052 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028248903653645845, - "loss": 0.4507, - "step": 1053 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002825275662148636, - "loss": 0.4423, - "step": 1054 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028256605935492434, - "loss": 0.4654, - "step": 1055 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028260451602587486, - "loss": 0.4284, - "step": 1056 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028264293629675274, - "loss": 0.4347, - "step": 1057 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028268132023639986, - "loss": 0.4303, - "step": 1058 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002827196679134628, - "loss": 0.4349, - "step": 1059 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028275797939639376, - "loss": 0.4323, - "step": 1060 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002827962547534515, - "loss": 0.4448, - "step": 1061 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002828344940527016, - "loss": 0.452, - "step": 1062 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002828726973620178, - "loss": 0.431, - "step": 1063 - }, - { - "epoch": 0.13, - "learning_rate": 0.000282910864749082, - "loss": 0.4316, - "step": 1064 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028294899628138556, - "loss": 0.4349, - "step": 1065 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002829870920262298, - "loss": 0.4357, - "step": 1066 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002830251520507267, - "loss": 0.4238, - "step": 1067 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002830631764217997, - "loss": 0.4184, - "step": 1068 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002831011652061842, - "loss": 0.4372, - "step": 1069 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028313911847042847, - "loss": 0.4529, - "step": 1070 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002831770362808945, - "loss": 0.4528, - "step": 1071 - }, - { - "epoch": 0.13, - "learning_rate": 0.000283214918703758, - "loss": 0.4502, - "step": 1072 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028325276580501, - "loss": 0.4133, - "step": 1073 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028329057765045693, - "loss": 0.4732, - "step": 1074 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028332835430572154, - "loss": 0.4525, - "step": 1075 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002833660958362436, - "loss": 0.4437, - "step": 1076 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028340380230728023, - "loss": 0.4451, - "step": 1077 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002834414737839072, - "loss": 0.4206, - "step": 1078 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028347911033101906, - "loss": 0.4239, - "step": 1079 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002835167120133301, - "loss": 0.4328, - "step": 1080 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002835542788953749, - "loss": 0.4375, - "step": 1081 - }, - { - "epoch": 0.13, - "learning_rate": 0.000283591811041509, - "loss": 0.4013, - "step": 1082 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002836293085159097, - "loss": 0.4219, - "step": 1083 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002836667713825764, - "loss": 0.4245, - "step": 1084 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002837041997053316, - "loss": 0.4432, - "step": 1085 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002837415935478215, - "loss": 0.4285, - "step": 1086 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002837789529735164, - "loss": 0.4089, - "step": 1087 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002838162780457115, - "loss": 0.4151, - "step": 1088 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028385356882752776, - "loss": 0.4158, - "step": 1089 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002838908253819121, - "loss": 0.435, - "step": 1090 - }, - { - "epoch": 0.13, - "learning_rate": 0.00028392804777163834, - "loss": 0.4442, - "step": 1091 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002839652360593079, - "loss": 0.4437, - "step": 1092 - }, - { - "epoch": 0.13, - "learning_rate": 0.0002840023903073501, - "loss": 0.413, - "step": 1093 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002840395105780231, - "loss": 0.4253, - "step": 1094 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028407659693341434, - "loss": 0.4242, - "step": 1095 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002841136494354414, - "loss": 0.4234, - "step": 1096 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028415066814585217, - "loss": 0.435, - "step": 1097 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028418765312622604, - "loss": 0.4406, - "step": 1098 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002842246044379741, - "loss": 0.4301, - "step": 1099 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028426152214233984, - "loss": 0.4188, - "step": 1100 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028429840630039984, - "loss": 0.4165, - "step": 1101 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028433525697306434, - "loss": 0.4324, - "step": 1102 - }, - { - "epoch": 0.14, - "learning_rate": 0.000284372074221078, - "loss": 0.4151, - "step": 1103 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002844088581050198, - "loss": 0.428, - "step": 1104 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002844456086853049, - "loss": 0.4288, - "step": 1105 - }, - { - "epoch": 0.14, - "learning_rate": 0.000284482326022184, - "loss": 0.4379, - "step": 1106 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028451901017574464, - "loss": 0.4254, - "step": 1107 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028455566120591156, - "loss": 0.4088, - "step": 1108 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002845922791724473, - "loss": 0.4341, - "step": 1109 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002846288641349528, - "loss": 0.4112, - "step": 1110 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028466541615286816, - "loss": 0.417, - "step": 1111 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028470193528547276, - "loss": 0.4248, - "step": 1112 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002847384215918864, - "loss": 0.4153, - "step": 1113 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028477487513106934, - "loss": 0.418, - "step": 1114 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002848112959618233, - "loss": 0.4307, - "step": 1115 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028484768414279186, - "loss": 0.4327, - "step": 1116 - }, - { - "epoch": 0.14, - "learning_rate": 0.000284884039732461, - "loss": 0.419, - "step": 1117 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028492036278915964, - "loss": 0.4232, - "step": 1118 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002849566533710602, - "loss": 0.4347, - "step": 1119 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028499291153617957, - "loss": 0.4151, - "step": 1120 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028502913734237875, - "loss": 0.4013, - "step": 1121 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002850653308473644, - "loss": 0.4161, - "step": 1122 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002851014921086888, - "loss": 0.435, - "step": 1123 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002851376211837506, - "loss": 0.4295, - "step": 1124 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002851737181297951, - "loss": 0.4049, - "step": 1125 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028520978300391537, - "loss": 0.4101, - "step": 1126 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002852458158630522, - "loss": 0.448, - "step": 1127 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002852818167639949, - "loss": 0.4397, - "step": 1128 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002853177857633818, - "loss": 0.4431, - "step": 1129 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002853537229177009, - "loss": 0.445, - "step": 1130 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028538962828329034, - "loss": 0.418, - "step": 1131 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002854255019163386, - "loss": 0.4224, - "step": 1132 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028546134387288555, - "loss": 0.4042, - "step": 1133 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002854971542088227, - "loss": 0.4482, - "step": 1134 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028553293297989377, - "loss": 0.4411, - "step": 1135 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002855686802416952, - "loss": 0.439, - "step": 1136 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002856043960496767, - "loss": 0.4373, - "step": 1137 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028564008045914156, - "loss": 0.4082, - "step": 1138 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002856757335252476, - "loss": 0.4283, - "step": 1139 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028571135530300725, - "loss": 0.443, - "step": 1140 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002857469458472883, - "loss": 0.4361, - "step": 1141 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002857825052128144, - "loss": 0.4223, - "step": 1142 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028581803345416535, - "loss": 0.4295, - "step": 1143 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002858535306257779, - "loss": 0.4249, - "step": 1144 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028588899678194603, - "loss": 0.417, - "step": 1145 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002859244319768215, - "loss": 0.4172, - "step": 1146 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002859598362644146, - "loss": 0.4155, - "step": 1147 - }, - { - "epoch": 0.14, - "learning_rate": 0.000285995209698594, - "loss": 0.4198, - "step": 1148 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002860305523330881, - "loss": 0.4313, - "step": 1149 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028606586422148485, - "loss": 0.4431, - "step": 1150 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002861011454172324, - "loss": 0.4321, - "step": 1151 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028613639597363977, - "loss": 0.4517, - "step": 1152 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002861716159438772, - "loss": 0.4283, - "step": 1153 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028620680538097676, - "loss": 0.4147, - "step": 1154 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002862419643378325, - "loss": 0.4289, - "step": 1155 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002862770928672011, - "loss": 0.4238, - "step": 1156 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028631219102170273, - "loss": 0.4273, - "step": 1157 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002863472588538208, - "loss": 0.437, - "step": 1158 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028638229641590317, - "loss": 0.4259, - "step": 1159 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028641730376016195, - "loss": 0.4251, - "step": 1160 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002864522809386744, - "loss": 0.4035, - "step": 1161 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002864872280033833, - "loss": 0.4217, - "step": 1162 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028652214500609735, - "loss": 0.4223, - "step": 1163 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028655703199849164, - "loss": 0.4182, - "step": 1164 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002865918890321082, - "loss": 0.4135, - "step": 1165 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028662671615835636, - "loss": 0.4309, - "step": 1166 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028666151342851315, - "loss": 0.4178, - "step": 1167 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028669628089372405, - "loss": 0.4305, - "step": 1168 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028673101860500293, - "loss": 0.4157, - "step": 1169 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028676572661323315, - "loss": 0.4465, - "step": 1170 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028680040496916734, - "loss": 0.4187, - "step": 1171 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002868350537234283, - "loss": 0.4345, - "step": 1172 - }, - { - "epoch": 0.14, - "learning_rate": 0.0002868696729265094, - "loss": 0.4374, - "step": 1173 - }, - { - "epoch": 0.14, - "learning_rate": 0.00028690426262877473, - "loss": 0.4243, - "step": 1174 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002869388228804599, - "loss": 0.4277, - "step": 1175 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002869733537316721, - "loss": 0.4294, - "step": 1176 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002870078552323911, - "loss": 0.419, - "step": 1177 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028704232743246894, - "loss": 0.4083, - "step": 1178 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028707677038163114, - "loss": 0.4224, - "step": 1179 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002871111841294763, - "loss": 0.4012, - "step": 1180 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028714556872547745, - "loss": 0.4168, - "step": 1181 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028717992421898166, - "loss": 0.4354, - "step": 1182 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028721425065921094, - "loss": 0.4218, - "step": 1183 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028724854809526247, - "loss": 0.4259, - "step": 1184 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002872828165761092, - "loss": 0.4198, - "step": 1185 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002873170561506001, - "loss": 0.4346, - "step": 1186 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028735126686746046, - "loss": 0.4267, - "step": 1187 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028738544877529267, - "loss": 0.4052, - "step": 1188 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002874196019225764, - "loss": 0.421, - "step": 1189 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028745372635766907, - "loss": 0.4341, - "step": 1190 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002874878221288062, - "loss": 0.4097, - "step": 1191 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028752188928410187, - "loss": 0.4228, - "step": 1192 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028755592787154896, - "loss": 0.4103, - "step": 1193 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028758993793902006, - "loss": 0.4027, - "step": 1194 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028762391953426723, - "loss": 0.4021, - "step": 1195 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028765787270492284, - "loss": 0.4121, - "step": 1196 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002876917974984998, - "loss": 0.4247, - "step": 1197 - }, - { - "epoch": 0.15, - "learning_rate": 0.000287725693962392, - "loss": 0.4336, - "step": 1198 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028775956214387464, - "loss": 0.4094, - "step": 1199 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002877934020901048, - "loss": 0.4035, - "step": 1200 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028782721384812155, - "loss": 0.4052, - "step": 1201 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028786099746484664, - "loss": 0.4194, - "step": 1202 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028789475298708476, - "loss": 0.4016, - "step": 1203 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002879284804615238, - "loss": 0.4198, - "step": 1204 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002879621799347356, - "loss": 0.4219, - "step": 1205 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028799585145317585, - "loss": 0.4131, - "step": 1206 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002880294950631848, - "loss": 0.4335, - "step": 1207 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002880631108109877, - "loss": 0.4195, - "step": 1208 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002880966987426949, - "loss": 0.4251, - "step": 1209 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002881302589043024, - "loss": 0.414, - "step": 1210 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028816379134169234, - "loss": 0.4108, - "step": 1211 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028819729610063307, - "loss": 0.4066, - "step": 1212 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002882307732267798, - "loss": 0.3976, - "step": 1213 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002882642227656748, - "loss": 0.4034, - "step": 1214 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028829764476274793, - "loss": 0.4188, - "step": 1215 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002883310392633169, - "loss": 0.4071, - "step": 1216 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028836440631258757, - "loss": 0.4347, - "step": 1217 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028839774595565453, - "loss": 0.4123, - "step": 1218 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002884310582375013, - "loss": 0.4125, - "step": 1219 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028846434320300074, - "loss": 0.3997, - "step": 1220 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028849760089691537, - "loss": 0.416, - "step": 1221 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002885308313638979, - "loss": 0.4419, - "step": 1222 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028856403464849127, - "loss": 0.4248, - "step": 1223 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002885972107951294, - "loss": 0.4011, - "step": 1224 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028863035984813713, - "loss": 0.3929, - "step": 1225 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002886634818517311, - "loss": 0.4197, - "step": 1226 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028869657685001943, - "loss": 0.4145, - "step": 1227 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028872964488700273, - "loss": 0.4254, - "step": 1228 - }, - { - "epoch": 0.15, - "learning_rate": 0.000288762686006574, - "loss": 0.4012, - "step": 1229 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002887957002525193, - "loss": 0.4222, - "step": 1230 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002888286876685177, - "loss": 0.4054, - "step": 1231 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002888616482981421, - "loss": 0.3961, - "step": 1232 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028889458218485923, - "loss": 0.4081, - "step": 1233 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028892748937203006, - "loss": 0.4152, - "step": 1234 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002889603699029103, - "loss": 0.4197, - "step": 1235 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028899322382065047, - "loss": 0.4201, - "step": 1236 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002890260511682966, - "loss": 0.419, - "step": 1237 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002890588519887902, - "loss": 0.4207, - "step": 1238 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002890916263249689, - "loss": 0.4354, - "step": 1239 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028912437421956655, - "loss": 0.4028, - "step": 1240 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002891570957152136, - "loss": 0.441, - "step": 1241 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002891897908544377, - "loss": 0.4152, - "step": 1242 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028922245967966353, - "loss": 0.42, - "step": 1243 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028925510223321363, - "loss": 0.4421, - "step": 1244 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028928771855730854, - "loss": 0.4381, - "step": 1245 - }, - { - "epoch": 0.15, - "learning_rate": 0.000289320308694067, - "loss": 0.4262, - "step": 1246 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028935287268550626, - "loss": 0.4056, - "step": 1247 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002893854105735428, - "loss": 0.4079, - "step": 1248 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028941792239999225, - "loss": 0.4065, - "step": 1249 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002894504082065698, - "loss": 0.3951, - "step": 1250 - }, - { - "epoch": 0.15, - "learning_rate": 0.00028948286803489063, - "loss": 0.4268, - "step": 1251 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002895153019264701, - "loss": 0.4085, - "step": 1252 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002895477099227242, - "loss": 0.3843, - "step": 1253 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002895800920649698, - "loss": 0.4219, - "step": 1254 - }, - { - "epoch": 0.15, - "learning_rate": 0.0002896124483944249, - "loss": 0.4259, - "step": 1255 - }, - { - "epoch": 0.16, - "learning_rate": 0.00028964477895220903, - "loss": 0.3958, - "step": 1256 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002896770837793436, - "loss": 0.4136, - "step": 1257 - }, - { - "epoch": 0.16, - "learning_rate": 0.00028970936291675207, - "loss": 0.3929, - "step": 1258 - }, - { - "epoch": 0.16, - "learning_rate": 0.00028974161640526043, - "loss": 0.4131, - "step": 1259 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002897738442855974, - "loss": 0.3992, - "step": 1260 - }, - { - "epoch": 0.16, - "learning_rate": 0.00028980604659839467, - "loss": 0.3999, - "step": 1261 - }, - { - "epoch": 0.16, - "learning_rate": 0.00028983822338418745, - "loss": 0.4006, - "step": 1262 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002898703746834146, - "loss": 0.3978, - "step": 1263 - }, - { - "epoch": 0.16, - "learning_rate": 0.00028990250053641893, - "loss": 0.4036, - "step": 1264 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002899346009834474, - "loss": 0.4395, - "step": 1265 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002899666760646518, - "loss": 0.3984, - "step": 1266 - }, - { - "epoch": 0.16, - "learning_rate": 0.00028999872582008873, - "loss": 0.4199, - "step": 1267 - }, - { - "epoch": 0.16, - "learning_rate": 0.00029003075028971993, - "loss": 0.4175, - "step": 1268 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002900627495134127, - "loss": 0.4037, - "step": 1269 - }, - { - "epoch": 0.16, - "learning_rate": 0.00029009472353094004, - "loss": 0.3978, - "step": 1270 - }, - { - "epoch": 0.16, - "learning_rate": 0.000290126672381981, - "loss": 0.4215, - "step": 1271 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002901585961061213, - "loss": 0.4192, - "step": 1272 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002901904947428529, - "loss": 0.4099, - "step": 1273 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002902223683315752, - "loss": 0.4089, - "step": 1274 - }, - { - "epoch": 0.16, - "learning_rate": 0.00029025421691159436, - "loss": 0.433, - "step": 1275 - }, - { - "epoch": 0.16, - "learning_rate": 0.00029028604052212456, - "loss": 0.3959, - "step": 1276 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002903178392022875, - "loss": 0.4198, - "step": 1277 - }, - { - "epoch": 0.16, - "learning_rate": 0.000290349612991113, - "loss": 0.3913, - "step": 1278 - }, - { - "epoch": 0.16, - "learning_rate": 0.00029038136192753973, - "loss": 0.4089, - "step": 1279 - }, - { - "epoch": 0.16, - "learning_rate": 0.00029041308605041446, - "loss": 0.4092, - "step": 1280 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002904447853984933, - "loss": 0.4129, - "step": 1281 - }, - { - "epoch": 0.16, - "learning_rate": 0.00029047646001044165, - "loss": 0.4264, - "step": 1282 - }, - { - "epoch": 0.16, - "learning_rate": 0.00029050810992483435, - "loss": 0.4333, - "step": 1283 - }, - { - "epoch": 0.16, - "learning_rate": 0.00029053973518015604, - "loss": 0.3712, - "step": 1284 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002905713358148016, - "loss": 0.414, - "step": 1285 - }, - { - "epoch": 0.16, - "learning_rate": 0.00029060291186707614, - "loss": 0.4007, - "step": 1286 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002906344633751957, - "loss": 0.4022, - "step": 1287 - }, - { - "epoch": 0.16, - "learning_rate": 0.00029066599037728713, - "loss": 0.4143, - "step": 1288 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002906974929113883, - "loss": 0.4098, - "step": 1289 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002907289710154491, - "loss": 0.3874, - "step": 1290 - }, - { - "epoch": 0.16, - "learning_rate": 0.00029076042472733066, - "loss": 0.4096, - "step": 1291 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002907918540848065, - "loss": 0.4048, - "step": 1292 - }, - { - "epoch": 0.16, - "learning_rate": 0.00029082325912556227, - "loss": 0.3939, - "step": 1293 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002908546398871964, - "loss": 0.4247, - "step": 1294 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002908859964072201, - "loss": 0.4229, - "step": 1295 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002909173287230576, - "loss": 0.4163, - "step": 1296 - }, - { - "epoch": 0.16, - "learning_rate": 0.00029094863687204677, - "loss": 0.3905, - "step": 1297 - }, - { - "epoch": 0.16, - "learning_rate": 0.00029097992089143886, - "loss": 0.3996, - "step": 1298 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002910111808183994, - "loss": 0.4143, - "step": 1299 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002910424166900078, - "loss": 0.3859, - "step": 1300 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002910736285432581, - "loss": 0.409, - "step": 1301 - }, - { - "epoch": 0.16, - "learning_rate": 0.00029110481641505913, - "loss": 0.4267, - "step": 1302 - }, - { - "epoch": 0.16, - "learning_rate": 0.00029113598034223446, - "loss": 0.4228, - "step": 1303 - }, - { - "epoch": 0.16, - "learning_rate": 0.00029116712036152326, - "loss": 0.4146, - "step": 1304 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002911982365095798, - "loss": 0.4272, - "step": 1305 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002912293288229745, - "loss": 0.4149, - "step": 1306 - }, - { - "epoch": 0.16, - "learning_rate": 0.00029126039733819354, - "loss": 0.4107, - "step": 1307 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002912914420916396, - "loss": 0.4193, - "step": 1308 - }, - { - "epoch": 0.16, - "learning_rate": 0.00029132246311963173, - "loss": 0.4086, - "step": 1309 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002913534604584058, - "loss": 0.3951, - "step": 1310 - }, - { - "epoch": 0.16, - "learning_rate": 0.00029138443414411476, - "loss": 0.4005, - "step": 1311 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002914153842128289, - "loss": 0.3949, - "step": 1312 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002914463107005361, - "loss": 0.3896, - "step": 1313 - }, - { - "epoch": 0.16, - "learning_rate": 0.00029147721364314186, - "loss": 0.4093, - "step": 1314 - }, - { - "epoch": 0.16, - "learning_rate": 0.00029150809307646987, - "loss": 0.3913, - "step": 1315 - }, - { - "epoch": 0.16, - "learning_rate": 0.00029153894903626216, - "loss": 0.3845, - "step": 1316 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002915697815581791, - "loss": 0.4197, - "step": 1317 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002916005906778002, - "loss": 0.4223, - "step": 1318 - }, - { - "epoch": 0.16, - "learning_rate": 0.00029163137643062375, - "loss": 0.402, - "step": 1319 - }, - { - "epoch": 0.16, - "learning_rate": 0.00029166213885206736, - "loss": 0.3909, - "step": 1320 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002916928779774683, - "loss": 0.4095, - "step": 1321 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002917235938420835, - "loss": 0.4122, - "step": 1322 - }, - { - "epoch": 0.16, - "learning_rate": 0.00029175428648109, - "loss": 0.3877, - "step": 1323 - }, - { - "epoch": 0.16, - "learning_rate": 0.000291784955929585, - "loss": 0.4214, - "step": 1324 - }, - { - "epoch": 0.16, - "learning_rate": 0.00029181560222258626, - "loss": 0.3903, - "step": 1325 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002918462253950324, - "loss": 0.3975, - "step": 1326 - }, - { - "epoch": 0.16, - "learning_rate": 0.00029187682548178275, - "loss": 0.4114, - "step": 1327 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002919074025176182, - "loss": 0.4036, - "step": 1328 - }, - { - "epoch": 0.16, - "learning_rate": 0.00029193795653724083, - "loss": 0.447, - "step": 1329 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002919684875752745, - "loss": 0.4123, - "step": 1330 - }, - { - "epoch": 0.16, - "learning_rate": 0.000291998995666265, - "loss": 0.4008, - "step": 1331 - }, - { - "epoch": 0.16, - "learning_rate": 0.00029202948084468034, - "loss": 0.4227, - "step": 1332 - }, - { - "epoch": 0.16, - "learning_rate": 0.00029205994314491086, - "loss": 0.3873, - "step": 1333 - }, - { - "epoch": 0.16, - "learning_rate": 0.00029209038260126946, - "loss": 0.4191, - "step": 1334 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002921207992479922, - "loss": 0.4063, - "step": 1335 - }, - { - "epoch": 0.16, - "learning_rate": 0.0002921511931192378, - "loss": 0.3946, - "step": 1336 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002921815642490888, - "loss": 0.3948, - "step": 1337 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029221191267155076, - "loss": 0.3975, - "step": 1338 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002922422384205535, - "loss": 0.411, - "step": 1339 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002922725415299505, - "loss": 0.3987, - "step": 1340 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029230282203351963, - "loss": 0.3787, - "step": 1341 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029233307996496334, - "loss": 0.4065, - "step": 1342 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002923633153579085, - "loss": 0.4009, - "step": 1343 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029239352824590704, - "loss": 0.4095, - "step": 1344 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002924237186624361, - "loss": 0.3925, - "step": 1345 - }, - { - "epoch": 0.17, - "learning_rate": 0.000292453886640898, - "loss": 0.4035, - "step": 1346 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029248403221462076, - "loss": 0.3853, - "step": 1347 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029251415541685827, - "loss": 0.3953, - "step": 1348 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029254425628079015, - "loss": 0.4087, - "step": 1349 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002925743348395226, - "loss": 0.4123, - "step": 1350 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029260439112608813, - "loss": 0.397, - "step": 1351 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002926344251734459, - "loss": 0.4088, - "step": 1352 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029266443701448183, - "loss": 0.3997, - "step": 1353 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029269442668200936, - "loss": 0.3984, - "step": 1354 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002927243942087689, - "loss": 0.3946, - "step": 1355 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029275433962742844, - "loss": 0.4056, - "step": 1356 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002927842629705839, - "loss": 0.4312, - "step": 1357 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002928141642707589, - "loss": 0.4103, - "step": 1358 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002928440435604055, - "loss": 0.3861, - "step": 1359 - }, - { - "epoch": 0.17, - "learning_rate": 0.000292873900871904, - "loss": 0.4058, - "step": 1360 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002929037362375634, - "loss": 0.4124, - "step": 1361 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002929335496896213, - "loss": 0.3969, - "step": 1362 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029296334126024454, - "loss": 0.4099, - "step": 1363 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002929931109815291, - "loss": 0.4255, - "step": 1364 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002930228588855004, - "loss": 0.3973, - "step": 1365 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002930525850041135, - "loss": 0.379, - "step": 1366 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002930822893692533, - "loss": 0.4217, - "step": 1367 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002931119720127347, - "loss": 0.4188, - "step": 1368 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029314163296630303, - "loss": 0.3913, - "step": 1369 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002931712722616339, - "loss": 0.3771, - "step": 1370 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002932008899303336, - "loss": 0.4103, - "step": 1371 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029323048600393936, - "loss": 0.4002, - "step": 1372 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002932600605139195, - "loss": 0.4103, - "step": 1373 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002932896134916735, - "loss": 0.3923, - "step": 1374 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029331914496853235, - "loss": 0.4122, - "step": 1375 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029334865497575877, - "loss": 0.4051, - "step": 1376 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002933781435445472, - "loss": 0.4063, - "step": 1377 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002934076107060243, - "loss": 0.3856, - "step": 1378 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002934370564912489, - "loss": 0.3986, - "step": 1379 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002934664809312123, - "loss": 0.3982, - "step": 1380 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029349588405683854, - "loss": 0.3904, - "step": 1381 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002935252658989843, - "loss": 0.3968, - "step": 1382 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029355462648843954, - "loss": 0.4029, - "step": 1383 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002935839658559273, - "loss": 0.4061, - "step": 1384 - }, - { - "epoch": 0.17, - "learning_rate": 0.000293613284032104, - "loss": 0.3938, - "step": 1385 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029364258104755994, - "loss": 0.3904, - "step": 1386 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029367185693281894, - "loss": 0.3844, - "step": 1387 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029370111171833906, - "loss": 0.3925, - "step": 1388 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029373034543451234, - "loss": 0.4025, - "step": 1389 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029375955811166527, - "loss": 0.3691, - "step": 1390 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029378874978005907, - "loss": 0.405, - "step": 1391 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002938179204698895, - "loss": 0.3786, - "step": 1392 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002938470702112873, - "loss": 0.4088, - "step": 1393 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029387619903431853, - "loss": 0.3951, - "step": 1394 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029390530696898437, - "loss": 0.3766, - "step": 1395 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029393439404522156, - "loss": 0.4063, - "step": 1396 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002939634602929026, - "loss": 0.4103, - "step": 1397 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029399250574183575, - "loss": 0.3641, - "step": 1398 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029402153042176537, - "loss": 0.3992, - "step": 1399 - }, - { - "epoch": 0.17, - "learning_rate": 0.000294050534362372, - "loss": 0.3915, - "step": 1400 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002940795175932729, - "loss": 0.392, - "step": 1401 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002941084801440215, - "loss": 0.416, - "step": 1402 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002941374220441083, - "loss": 0.3898, - "step": 1403 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029416634332296067, - "loss": 0.395, - "step": 1404 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002941952440099431, - "loss": 0.3934, - "step": 1405 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029422412413435746, - "loss": 0.3995, - "step": 1406 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002942529837254431, - "loss": 0.4109, - "step": 1407 - }, - { - "epoch": 0.17, - "learning_rate": 0.000294281822812377, - "loss": 0.3856, - "step": 1408 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029431064142427415, - "loss": 0.38, - "step": 1409 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002943394395901874, - "loss": 0.3953, - "step": 1410 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029436821733910785, - "loss": 0.4023, - "step": 1411 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029439697469996494, - "loss": 0.3733, - "step": 1412 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002944257117016269, - "loss": 0.4034, - "step": 1413 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029445442837290034, - "loss": 0.4289, - "step": 1414 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002944831247425311, - "loss": 0.3891, - "step": 1415 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029451180083920383, - "loss": 0.3989, - "step": 1416 - }, - { - "epoch": 0.17, - "learning_rate": 0.00029454045669154264, - "loss": 0.3937, - "step": 1417 - }, - { - "epoch": 0.17, - "learning_rate": 0.0002945690923281109, - "loss": 0.388, - "step": 1418 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029459770777741167, - "loss": 0.3827, - "step": 1419 - }, - { - "epoch": 0.18, - "learning_rate": 0.0002946263030678877, - "loss": 0.3864, - "step": 1420 - }, - { - "epoch": 0.18, - "learning_rate": 0.0002946548782279218, - "loss": 0.3858, - "step": 1421 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029468343328583675, - "loss": 0.3848, - "step": 1422 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029471196826989554, - "loss": 0.4107, - "step": 1423 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029474048320830186, - "loss": 0.3984, - "step": 1424 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029476897812919975, - "loss": 0.4014, - "step": 1425 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029479745306067406, - "loss": 0.4054, - "step": 1426 - }, - { - "epoch": 0.18, - "learning_rate": 0.0002948259080307507, - "loss": 0.4088, - "step": 1427 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029485434306739664, - "loss": 0.4074, - "step": 1428 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029488275819851997, - "loss": 0.408, - "step": 1429 - }, - { - "epoch": 0.18, - "learning_rate": 0.0002949111534519704, - "loss": 0.4015, - "step": 1430 - }, - { - "epoch": 0.18, - "learning_rate": 0.0002949395288555391, - "loss": 0.3958, - "step": 1431 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029496788443695915, - "loss": 0.3994, - "step": 1432 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029499622022390536, - "loss": 0.3893, - "step": 1433 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029502453624399475, - "loss": 0.4179, - "step": 1434 - }, - { - "epoch": 0.18, - "learning_rate": 0.0002950528325247866, - "loss": 0.4039, - "step": 1435 - }, - { - "epoch": 0.18, - "learning_rate": 0.0002950811090937824, - "loss": 0.3834, - "step": 1436 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029510936597842654, - "loss": 0.3876, - "step": 1437 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029513760320610584, - "loss": 0.3968, - "step": 1438 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029516582080415014, - "loss": 0.3919, - "step": 1439 - }, - { - "epoch": 0.18, - "learning_rate": 0.0002951940187998323, - "loss": 0.4216, - "step": 1440 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029522219722036833, - "loss": 0.387, - "step": 1441 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029525035609291773, - "loss": 0.4042, - "step": 1442 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029527849544458336, - "loss": 0.4045, - "step": 1443 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029530661530241184, - "loss": 0.4041, - "step": 1444 - }, - { - "epoch": 0.18, - "learning_rate": 0.0002953347156933936, - "loss": 0.395, - "step": 1445 - }, - { - "epoch": 0.18, - "learning_rate": 0.0002953627966444631, - "loss": 0.3833, - "step": 1446 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029539085818249884, - "loss": 0.4019, - "step": 1447 - }, - { - "epoch": 0.18, - "learning_rate": 0.0002954189003343237, - "loss": 0.3956, - "step": 1448 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029544692312670495, - "loss": 0.3998, - "step": 1449 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029547492658635446, - "loss": 0.3721, - "step": 1450 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029550291073992895, - "loss": 0.3684, - "step": 1451 - }, - { - "epoch": 0.18, - "learning_rate": 0.0002955308756140299, - "loss": 0.4065, - "step": 1452 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029555882123520405, - "loss": 0.3755, - "step": 1453 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029558674762994306, - "loss": 0.3818, - "step": 1454 - }, - { - "epoch": 0.18, - "learning_rate": 0.0002956146548246842, - "loss": 0.3799, - "step": 1455 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029564254284581006, - "loss": 0.3982, - "step": 1456 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029567041171964914, - "loss": 0.3943, - "step": 1457 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029569826147247545, - "loss": 0.4118, - "step": 1458 - }, - { - "epoch": 0.18, - "learning_rate": 0.0002957260921305092, - "loss": 0.4061, - "step": 1459 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029575390371991655, - "loss": 0.393, - "step": 1460 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029578169626681, - "loss": 0.3929, - "step": 1461 - }, - { - "epoch": 0.18, - "learning_rate": 0.0002958094697972483, - "loss": 0.4101, - "step": 1462 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029583722433723707, - "loss": 0.3943, - "step": 1463 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029586495991272826, - "loss": 0.3806, - "step": 1464 - }, - { - "epoch": 0.18, - "learning_rate": 0.0002958926765496208, - "loss": 0.3953, - "step": 1465 - }, - { - "epoch": 0.18, - "learning_rate": 0.0002959203742737607, - "loss": 0.3975, - "step": 1466 - }, - { - "epoch": 0.18, - "learning_rate": 0.000295948053110941, - "loss": 0.3964, - "step": 1467 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029597571308690205, - "loss": 0.4083, - "step": 1468 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029600335422733147, - "loss": 0.3816, - "step": 1469 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029603097655786465, - "loss": 0.4047, - "step": 1470 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029605858010408454, - "loss": 0.3799, - "step": 1471 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029608616489152197, - "loss": 0.3929, - "step": 1472 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029611373094565587, - "loss": 0.3759, - "step": 1473 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029614127829191304, - "loss": 0.3866, - "step": 1474 - }, - { - "epoch": 0.18, - "learning_rate": 0.0002961688069556688, - "loss": 0.3982, - "step": 1475 - }, - { - "epoch": 0.18, - "learning_rate": 0.0002961963169622468, - "loss": 0.4022, - "step": 1476 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029622380833691913, - "loss": 0.4045, - "step": 1477 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029625128110490664, - "loss": 0.3937, - "step": 1478 - }, - { - "epoch": 0.18, - "learning_rate": 0.0002962787352913791, - "loss": 0.4042, - "step": 1479 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029630617092145503, - "loss": 0.4106, - "step": 1480 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029633358802020227, - "loss": 0.404, - "step": 1481 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029636098661263774, - "loss": 0.3709, - "step": 1482 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029638836672372785, - "loss": 0.4147, - "step": 1483 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029641572837838854, - "loss": 0.3771, - "step": 1484 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029644307160148523, - "loss": 0.4171, - "step": 1485 - }, - { - "epoch": 0.18, - "learning_rate": 0.0002964703964178332, - "loss": 0.3946, - "step": 1486 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029649770285219767, - "loss": 0.378, - "step": 1487 - }, - { - "epoch": 0.18, - "learning_rate": 0.000296524990929294, - "loss": 0.377, - "step": 1488 - }, - { - "epoch": 0.18, - "learning_rate": 0.0002965522606737877, - "loss": 0.4076, - "step": 1489 - }, - { - "epoch": 0.18, - "learning_rate": 0.0002965795121102943, - "loss": 0.3847, - "step": 1490 - }, - { - "epoch": 0.18, - "learning_rate": 0.0002966067452633803, - "loss": 0.3909, - "step": 1491 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029663396015756243, - "loss": 0.3895, - "step": 1492 - }, - { - "epoch": 0.18, - "learning_rate": 0.0002966611568173082, - "loss": 0.3933, - "step": 1493 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029668833526703606, - "loss": 0.3992, - "step": 1494 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029671549553111535, - "loss": 0.4125, - "step": 1495 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029674263763386656, - "loss": 0.3881, - "step": 1496 - }, - { - "epoch": 0.18, - "learning_rate": 0.0002967697615995616, - "loss": 0.3984, - "step": 1497 - }, - { - "epoch": 0.18, - "learning_rate": 0.0002967968674524233, - "loss": 0.4045, - "step": 1498 - }, - { - "epoch": 0.18, - "learning_rate": 0.00029682395521662643, - "loss": 0.3982, - "step": 1499 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029685102491629726, - "loss": 0.3913, - "step": 1500 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002968780765755138, - "loss": 0.3992, - "step": 1501 - }, - { - "epoch": 0.19, - "learning_rate": 0.000296905110218306, - "loss": 0.3741, - "step": 1502 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029693212586865574, - "loss": 0.4102, - "step": 1503 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029695912355049705, - "loss": 0.3841, - "step": 1504 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029698610328771633, - "loss": 0.3757, - "step": 1505 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029701306510415237, - "loss": 0.3639, - "step": 1506 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002970400090235965, - "loss": 0.4082, - "step": 1507 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002970669350697925, - "loss": 0.3987, - "step": 1508 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002970938432664372, - "loss": 0.3799, - "step": 1509 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002971207336371802, - "loss": 0.4006, - "step": 1510 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029714760620562416, - "loss": 0.4136, - "step": 1511 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029717446099532485, - "loss": 0.3948, - "step": 1512 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002972012980297914, - "loss": 0.3818, - "step": 1513 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029722811733248636, - "loss": 0.3888, - "step": 1514 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002972549189268256, - "loss": 0.3878, - "step": 1515 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029728170283617884, - "loss": 0.3943, - "step": 1516 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002973084690838695, - "loss": 0.3892, - "step": 1517 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029733521769317487, - "loss": 0.3961, - "step": 1518 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002973619486873264, - "loss": 0.3915, - "step": 1519 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029738866208950946, - "loss": 0.3961, - "step": 1520 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002974153579228637, - "loss": 0.3748, - "step": 1521 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002974420362104833, - "loss": 0.3856, - "step": 1522 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029746869697541684, - "loss": 0.3967, - "step": 1523 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002974953402406675, - "loss": 0.4067, - "step": 1524 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029752196602919324, - "loss": 0.4166, - "step": 1525 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002975485743639069, - "loss": 0.3976, - "step": 1526 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002975751652676761, - "loss": 0.4076, - "step": 1527 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002976017387633237, - "loss": 0.3809, - "step": 1528 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002976282948736278, - "loss": 0.4054, - "step": 1529 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002976548336213219, - "loss": 0.3897, - "step": 1530 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002976813550290946, - "loss": 0.4101, - "step": 1531 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029770785911959033, - "loss": 0.3959, - "step": 1532 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029773434591540913, - "loss": 0.3828, - "step": 1533 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029776081543910686, - "loss": 0.3968, - "step": 1534 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002977872677131952, - "loss": 0.3771, - "step": 1535 - }, - { - "epoch": 0.19, - "learning_rate": 0.000297813702760142, - "loss": 0.3566, - "step": 1536 - }, - { - "epoch": 0.19, - "learning_rate": 0.000297840120602371, - "loss": 0.3954, - "step": 1537 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002978665212622623, - "loss": 0.3871, - "step": 1538 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002978929047621526, - "loss": 0.4112, - "step": 1539 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029791927112433463, - "loss": 0.3885, - "step": 1540 - }, - { - "epoch": 0.19, - "learning_rate": 0.000297945620371058, - "loss": 0.4028, - "step": 1541 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029797195252452904, - "loss": 0.3684, - "step": 1542 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002979982676069107, - "loss": 0.3796, - "step": 1543 - }, - { - "epoch": 0.19, - "learning_rate": 0.000298024565640323, - "loss": 0.3783, - "step": 1544 - }, - { - "epoch": 0.19, - "learning_rate": 0.000298050846646843, - "loss": 0.3914, - "step": 1545 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002980771106485047, - "loss": 0.3971, - "step": 1546 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029810335766729967, - "loss": 0.389, - "step": 1547 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002981295877251766, - "loss": 0.3809, - "step": 1548 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002981558008440418, - "loss": 0.3857, - "step": 1549 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029818199704575906, - "loss": 0.3941, - "step": 1550 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029820817635214995, - "loss": 0.3848, - "step": 1551 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029823433878499385, - "loss": 0.3798, - "step": 1552 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002982604843660279, - "loss": 0.3834, - "step": 1553 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002982866131169476, - "loss": 0.3982, - "step": 1554 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002983127250594062, - "loss": 0.382, - "step": 1555 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029833882021501536, - "loss": 0.3891, - "step": 1556 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002983648986053451, - "loss": 0.3836, - "step": 1557 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029839096025192387, - "loss": 0.3822, - "step": 1558 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029841700517623876, - "loss": 0.4034, - "step": 1559 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029844303339973536, - "loss": 0.3979, - "step": 1560 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002984690449438181, - "loss": 0.3823, - "step": 1561 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002984950398298503, - "loss": 0.3798, - "step": 1562 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029852101807915433, - "loss": 0.4015, - "step": 1563 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002985469797130116, - "loss": 0.3894, - "step": 1564 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002985729247526626, - "loss": 0.412, - "step": 1565 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002985988532193073, - "loss": 0.3975, - "step": 1566 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029862476513410494, - "loss": 0.3965, - "step": 1567 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002986506605181743, - "loss": 0.3869, - "step": 1568 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002986765393925938, - "loss": 0.411, - "step": 1569 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029870240177840154, - "loss": 0.4026, - "step": 1570 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029872824769659544, - "loss": 0.3831, - "step": 1571 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002987540771681333, - "loss": 0.3936, - "step": 1572 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029877989021393294, - "loss": 0.3723, - "step": 1573 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002988056868548724, - "loss": 0.3849, - "step": 1574 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002988314671117899, - "loss": 0.3705, - "step": 1575 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002988572310054838, - "loss": 0.3841, - "step": 1576 - }, - { - "epoch": 0.19, - "learning_rate": 0.0002988829785567132, - "loss": 0.3811, - "step": 1577 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029890870978619734, - "loss": 0.3779, - "step": 1578 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029893442471461655, - "loss": 0.386, - "step": 1579 - }, - { - "epoch": 0.19, - "learning_rate": 0.00029896012336261144, - "loss": 0.3835, - "step": 1580 - }, - { - "epoch": 0.2, - "learning_rate": 0.0002989858057507836, - "loss": 0.3733, - "step": 1581 - }, - { - "epoch": 0.2, - "learning_rate": 0.0002990114718996957, - "loss": 0.3588, - "step": 1582 - }, - { - "epoch": 0.2, - "learning_rate": 0.00029903712182987127, - "loss": 0.375, - "step": 1583 - }, - { - "epoch": 0.2, - "learning_rate": 0.0002990627555617949, - "loss": 0.3711, - "step": 1584 - }, - { - "epoch": 0.2, - "learning_rate": 0.00029908837311591244, - "loss": 0.3673, - "step": 1585 - }, - { - "epoch": 0.2, - "learning_rate": 0.0002991139745126313, - "loss": 0.3886, - "step": 1586 - }, - { - "epoch": 0.2, - "learning_rate": 0.0002991395597723199, - "loss": 0.4131, - "step": 1587 - }, - { - "epoch": 0.2, - "learning_rate": 0.0002991651289153084, - "loss": 0.3958, - "step": 1588 - }, - { - "epoch": 0.2, - "learning_rate": 0.0002991906819618886, - "loss": 0.3816, - "step": 1589 - }, - { - "epoch": 0.2, - "learning_rate": 0.00029921621893231384, - "loss": 0.3853, - "step": 1590 - }, - { - "epoch": 0.2, - "learning_rate": 0.0002992417398467993, - "loss": 0.3926, - "step": 1591 - }, - { - "epoch": 0.2, - "learning_rate": 0.00029926724472552227, - "loss": 0.3768, - "step": 1592 - }, - { - "epoch": 0.2, - "learning_rate": 0.0002992927335886217, - "loss": 0.3807, - "step": 1593 - }, - { - "epoch": 0.2, - "learning_rate": 0.00029931820645619884, - "loss": 0.3819, - "step": 1594 - }, - { - "epoch": 0.2, - "learning_rate": 0.00029934366334831707, - "loss": 0.3733, - "step": 1595 - }, - { - "epoch": 0.2, - "learning_rate": 0.000299369104285002, - "loss": 0.3735, - "step": 1596 - }, - { - "epoch": 0.2, - "learning_rate": 0.0002993945292862417, - "loss": 0.3842, - "step": 1597 - }, - { - "epoch": 0.2, - "learning_rate": 0.0002994199383719866, - "loss": 0.3988, - "step": 1598 - }, - { - "epoch": 0.2, - "learning_rate": 0.0002994453315621498, - "loss": 0.3906, - "step": 1599 - }, - { - "epoch": 0.2, - "learning_rate": 0.00029947070887660697, - "loss": 0.4013, - "step": 1600 - }, - { - "epoch": 0.2, - "learning_rate": 0.0002994960703351965, - "loss": 0.3779, - "step": 1601 - }, - { - "epoch": 0.2, - "learning_rate": 0.0002995214159577197, - "loss": 0.3927, - "step": 1602 - }, - { - "epoch": 0.2, - "learning_rate": 0.00029954674576394076, - "loss": 0.3865, - "step": 1603 - }, - { - "epoch": 0.2, - "learning_rate": 0.00029957205977358697, - "loss": 0.3761, - "step": 1604 - }, - { - "epoch": 0.2, - "learning_rate": 0.00029959735800634855, - "loss": 0.3946, - "step": 1605 - }, - { - "epoch": 0.2, - "learning_rate": 0.0002996226404818791, - "loss": 0.3883, - "step": 1606 - }, - { - "epoch": 0.2, - "learning_rate": 0.0002996479072197955, - "loss": 0.3751, - "step": 1607 - }, - { - "epoch": 0.2, - "learning_rate": 0.000299673158239678, - "loss": 0.3919, - "step": 1608 - }, - { - "epoch": 0.2, - "learning_rate": 0.0002996983935610703, - "loss": 0.3835, - "step": 1609 - }, - { - "epoch": 0.2, - "learning_rate": 0.00029972361320347964, - "loss": 0.3794, - "step": 1610 - }, - { - "epoch": 0.2, - "learning_rate": 0.00029974881718637696, - "loss": 0.3848, - "step": 1611 - }, - { - "epoch": 0.2, - "learning_rate": 0.00029977400552919705, - "loss": 0.3829, - "step": 1612 - }, - { - "epoch": 0.2, - "learning_rate": 0.00029979917825133845, - "loss": 0.3756, - "step": 1613 - }, - { - "epoch": 0.2, - "learning_rate": 0.0002998243353721636, - "loss": 0.3674, - "step": 1614 - }, - { - "epoch": 0.2, - "learning_rate": 0.00029984947691099895, - "loss": 0.3789, - "step": 1615 - }, - { - "epoch": 0.2, - "learning_rate": 0.0002998746028871353, - "loss": 0.3816, - "step": 1616 - }, - { - "epoch": 0.2, - "learning_rate": 0.0002998997133198272, - "loss": 0.3798, - "step": 1617 - }, - { - "epoch": 0.2, - "learning_rate": 0.00029992480822829394, - "loss": 0.4015, - "step": 1618 - }, - { - "epoch": 0.2, - "learning_rate": 0.000299949887631719, - "loss": 0.3917, - "step": 1619 - }, - { - "epoch": 0.2, - "learning_rate": 0.00029997495154925015, - "loss": 0.3913, - "step": 1620 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3836, - "step": 1621 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3818, - "step": 1622 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3878, - "step": 1623 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3727, - "step": 1624 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3784, - "step": 1625 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3917, - "step": 1626 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3948, - "step": 1627 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.391, - "step": 1628 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3967, - "step": 1629 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3973, - "step": 1630 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3712, - "step": 1631 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.373, - "step": 1632 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3804, - "step": 1633 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3919, - "step": 1634 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.396, - "step": 1635 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3678, - "step": 1636 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3932, - "step": 1637 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3854, - "step": 1638 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3774, - "step": 1639 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3839, - "step": 1640 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3897, - "step": 1641 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3915, - "step": 1642 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3892, - "step": 1643 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3849, - "step": 1644 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3854, - "step": 1645 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3879, - "step": 1646 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3826, - "step": 1647 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3811, - "step": 1648 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3958, - "step": 1649 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.399, - "step": 1650 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3772, - "step": 1651 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3891, - "step": 1652 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3832, - "step": 1653 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3797, - "step": 1654 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3962, - "step": 1655 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3617, - "step": 1656 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3921, - "step": 1657 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3768, - "step": 1658 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3874, - "step": 1659 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.4, - "step": 1660 - }, - { - "epoch": 0.2, - "learning_rate": 0.0003, - "loss": 0.3806, - "step": 1661 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3784, - "step": 1662 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.367, - "step": 1663 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3901, - "step": 1664 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3912, - "step": 1665 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3705, - "step": 1666 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3737, - "step": 1667 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3766, - "step": 1668 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.4019, - "step": 1669 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3496, - "step": 1670 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.423, - "step": 1671 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3821, - "step": 1672 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3623, - "step": 1673 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3625, - "step": 1674 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3671, - "step": 1675 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3794, - "step": 1676 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3688, - "step": 1677 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3806, - "step": 1678 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3682, - "step": 1679 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3709, - "step": 1680 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3865, - "step": 1681 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.399, - "step": 1682 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3929, - "step": 1683 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3872, - "step": 1684 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3776, - "step": 1685 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.377, - "step": 1686 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.4038, - "step": 1687 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3742, - "step": 1688 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3836, - "step": 1689 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3762, - "step": 1690 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3961, - "step": 1691 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3787, - "step": 1692 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.383, - "step": 1693 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3954, - "step": 1694 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3837, - "step": 1695 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.4015, - "step": 1696 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3883, - "step": 1697 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3722, - "step": 1698 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3808, - "step": 1699 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3513, - "step": 1700 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3699, - "step": 1701 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3779, - "step": 1702 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3847, - "step": 1703 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3874, - "step": 1704 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3818, - "step": 1705 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3645, - "step": 1706 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3842, - "step": 1707 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3874, - "step": 1708 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3691, - "step": 1709 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3713, - "step": 1710 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3868, - "step": 1711 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3797, - "step": 1712 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3745, - "step": 1713 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3931, - "step": 1714 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3795, - "step": 1715 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3895, - "step": 1716 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3705, - "step": 1717 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.365, - "step": 1718 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3814, - "step": 1719 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3782, - "step": 1720 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3857, - "step": 1721 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3818, - "step": 1722 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.39, - "step": 1723 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3957, - "step": 1724 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.388, - "step": 1725 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3803, - "step": 1726 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3847, - "step": 1727 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.362, - "step": 1728 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3848, - "step": 1729 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3684, - "step": 1730 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3652, - "step": 1731 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3815, - "step": 1732 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.4103, - "step": 1733 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3828, - "step": 1734 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3897, - "step": 1735 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3821, - "step": 1736 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3716, - "step": 1737 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3895, - "step": 1738 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3731, - "step": 1739 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.388, - "step": 1740 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3671, - "step": 1741 - }, - { - "epoch": 0.21, - "learning_rate": 0.0003, - "loss": 0.3597, - "step": 1742 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3581, - "step": 1743 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.346, - "step": 1744 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3796, - "step": 1745 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3963, - "step": 1746 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3653, - "step": 1747 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3742, - "step": 1748 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.383, - "step": 1749 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3967, - "step": 1750 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3841, - "step": 1751 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3673, - "step": 1752 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.397, - "step": 1753 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3784, - "step": 1754 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3669, - "step": 1755 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3831, - "step": 1756 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3739, - "step": 1757 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.396, - "step": 1758 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3599, - "step": 1759 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3773, - "step": 1760 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3551, - "step": 1761 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3606, - "step": 1762 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3828, - "step": 1763 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3731, - "step": 1764 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3886, - "step": 1765 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3661, - "step": 1766 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3818, - "step": 1767 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3785, - "step": 1768 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3509, - "step": 1769 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3711, - "step": 1770 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3678, - "step": 1771 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3561, - "step": 1772 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3801, - "step": 1773 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3797, - "step": 1774 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3817, - "step": 1775 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3805, - "step": 1776 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3797, - "step": 1777 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.4055, - "step": 1778 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3811, - "step": 1779 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3727, - "step": 1780 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.402, - "step": 1781 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.393, - "step": 1782 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3682, - "step": 1783 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3748, - "step": 1784 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.385, - "step": 1785 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3697, - "step": 1786 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3706, - "step": 1787 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3734, - "step": 1788 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3637, - "step": 1789 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3495, - "step": 1790 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3768, - "step": 1791 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.387, - "step": 1792 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3711, - "step": 1793 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3651, - "step": 1794 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3811, - "step": 1795 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3763, - "step": 1796 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3659, - "step": 1797 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3639, - "step": 1798 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3685, - "step": 1799 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3894, - "step": 1800 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3775, - "step": 1801 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3858, - "step": 1802 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3696, - "step": 1803 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3545, - "step": 1804 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3746, - "step": 1805 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3668, - "step": 1806 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3709, - "step": 1807 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3575, - "step": 1808 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3565, - "step": 1809 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3841, - "step": 1810 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3612, - "step": 1811 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3638, - "step": 1812 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3753, - "step": 1813 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3872, - "step": 1814 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3632, - "step": 1815 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3868, - "step": 1816 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3815, - "step": 1817 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3691, - "step": 1818 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3891, - "step": 1819 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3553, - "step": 1820 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3788, - "step": 1821 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3933, - "step": 1822 - }, - { - "epoch": 0.22, - "learning_rate": 0.0003, - "loss": 0.3626, - "step": 1823 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3724, - "step": 1824 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3629, - "step": 1825 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3752, - "step": 1826 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3702, - "step": 1827 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3808, - "step": 1828 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.369, - "step": 1829 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3874, - "step": 1830 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3682, - "step": 1831 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3776, - "step": 1832 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3724, - "step": 1833 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3642, - "step": 1834 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3883, - "step": 1835 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3618, - "step": 1836 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3739, - "step": 1837 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.353, - "step": 1838 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.383, - "step": 1839 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3779, - "step": 1840 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.367, - "step": 1841 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3651, - "step": 1842 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3807, - "step": 1843 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3806, - "step": 1844 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3606, - "step": 1845 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3738, - "step": 1846 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3567, - "step": 1847 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.362, - "step": 1848 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3683, - "step": 1849 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3891, - "step": 1850 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3867, - "step": 1851 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.359, - "step": 1852 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3754, - "step": 1853 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.369, - "step": 1854 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.4012, - "step": 1855 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3845, - "step": 1856 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3747, - "step": 1857 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3802, - "step": 1858 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3864, - "step": 1859 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3428, - "step": 1860 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3784, - "step": 1861 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3685, - "step": 1862 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3652, - "step": 1863 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3728, - "step": 1864 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3845, - "step": 1865 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.388, - "step": 1866 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3751, - "step": 1867 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3773, - "step": 1868 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3718, - "step": 1869 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3967, - "step": 1870 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3864, - "step": 1871 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3702, - "step": 1872 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3648, - "step": 1873 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3736, - "step": 1874 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3679, - "step": 1875 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3474, - "step": 1876 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3713, - "step": 1877 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.394, - "step": 1878 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3784, - "step": 1879 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3619, - "step": 1880 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3699, - "step": 1881 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.372, - "step": 1882 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3755, - "step": 1883 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3915, - "step": 1884 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3947, - "step": 1885 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3802, - "step": 1886 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3601, - "step": 1887 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3747, - "step": 1888 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3933, - "step": 1889 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.361, - "step": 1890 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3675, - "step": 1891 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3752, - "step": 1892 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3728, - "step": 1893 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3617, - "step": 1894 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.38, - "step": 1895 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3867, - "step": 1896 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.384, - "step": 1897 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3423, - "step": 1898 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3879, - "step": 1899 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3667, - "step": 1900 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3712, - "step": 1901 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3849, - "step": 1902 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3673, - "step": 1903 - }, - { - "epoch": 0.23, - "learning_rate": 0.0003, - "loss": 0.3619, - "step": 1904 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3785, - "step": 1905 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3792, - "step": 1906 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3674, - "step": 1907 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3658, - "step": 1908 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3725, - "step": 1909 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.38, - "step": 1910 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3764, - "step": 1911 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.381, - "step": 1912 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3685, - "step": 1913 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3607, - "step": 1914 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3746, - "step": 1915 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3802, - "step": 1916 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.378, - "step": 1917 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3694, - "step": 1918 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3684, - "step": 1919 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3785, - "step": 1920 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3683, - "step": 1921 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.376, - "step": 1922 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3292, - "step": 1923 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3762, - "step": 1924 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.368, - "step": 1925 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3668, - "step": 1926 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3518, - "step": 1927 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.363, - "step": 1928 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3903, - "step": 1929 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3625, - "step": 1930 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3604, - "step": 1931 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3545, - "step": 1932 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3807, - "step": 1933 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3584, - "step": 1934 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3567, - "step": 1935 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3813, - "step": 1936 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3721, - "step": 1937 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3667, - "step": 1938 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3771, - "step": 1939 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3831, - "step": 1940 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3715, - "step": 1941 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3451, - "step": 1942 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3563, - "step": 1943 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.369, - "step": 1944 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3694, - "step": 1945 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3513, - "step": 1946 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3449, - "step": 1947 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3731, - "step": 1948 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.368, - "step": 1949 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3719, - "step": 1950 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3702, - "step": 1951 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3676, - "step": 1952 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.383, - "step": 1953 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3507, - "step": 1954 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3595, - "step": 1955 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3725, - "step": 1956 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3706, - "step": 1957 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3487, - "step": 1958 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3758, - "step": 1959 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3656, - "step": 1960 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3511, - "step": 1961 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.378, - "step": 1962 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3793, - "step": 1963 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3592, - "step": 1964 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3624, - "step": 1965 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3644, - "step": 1966 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3685, - "step": 1967 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3453, - "step": 1968 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.366, - "step": 1969 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3854, - "step": 1970 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3476, - "step": 1971 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3497, - "step": 1972 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3527, - "step": 1973 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3757, - "step": 1974 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3583, - "step": 1975 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3599, - "step": 1976 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3462, - "step": 1977 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3754, - "step": 1978 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3804, - "step": 1979 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3747, - "step": 1980 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.35, - "step": 1981 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3685, - "step": 1982 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3567, - "step": 1983 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3769, - "step": 1984 - }, - { - "epoch": 0.24, - "learning_rate": 0.0003, - "loss": 0.3647, - "step": 1985 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3707, - "step": 1986 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3654, - "step": 1987 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3606, - "step": 1988 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.392, - "step": 1989 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3629, - "step": 1990 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3607, - "step": 1991 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3735, - "step": 1992 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3475, - "step": 1993 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3691, - "step": 1994 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3489, - "step": 1995 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3726, - "step": 1996 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3724, - "step": 1997 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3385, - "step": 1998 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3638, - "step": 1999 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3748, - "step": 2000 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.368, - "step": 2001 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3706, - "step": 2002 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3755, - "step": 2003 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3488, - "step": 2004 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3588, - "step": 2005 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3767, - "step": 2006 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.359, - "step": 2007 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3639, - "step": 2008 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3784, - "step": 2009 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3556, - "step": 2010 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3706, - "step": 2011 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3615, - "step": 2012 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3497, - "step": 2013 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3772, - "step": 2014 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3495, - "step": 2015 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3748, - "step": 2016 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.35, - "step": 2017 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3617, - "step": 2018 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3552, - "step": 2019 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3438, - "step": 2020 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3624, - "step": 2021 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3621, - "step": 2022 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3621, - "step": 2023 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3508, - "step": 2024 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3675, - "step": 2025 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3597, - "step": 2026 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.382, - "step": 2027 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3497, - "step": 2028 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.36, - "step": 2029 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3723, - "step": 2030 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3667, - "step": 2031 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3703, - "step": 2032 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3514, - "step": 2033 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3389, - "step": 2034 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3586, - "step": 2035 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3676, - "step": 2036 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.346, - "step": 2037 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3786, - "step": 2038 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3523, - "step": 2039 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3437, - "step": 2040 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3756, - "step": 2041 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3663, - "step": 2042 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.362, - "step": 2043 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3678, - "step": 2044 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.36, - "step": 2045 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3563, - "step": 2046 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3452, - "step": 2047 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3485, - "step": 2048 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3768, - "step": 2049 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3452, - "step": 2050 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3538, - "step": 2051 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3592, - "step": 2052 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3673, - "step": 2053 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3483, - "step": 2054 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3602, - "step": 2055 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3723, - "step": 2056 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3396, - "step": 2057 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3426, - "step": 2058 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3684, - "step": 2059 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3816, - "step": 2060 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3439, - "step": 2061 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3681, - "step": 2062 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3605, - "step": 2063 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3705, - "step": 2064 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3477, - "step": 2065 - }, - { - "epoch": 0.25, - "learning_rate": 0.0003, - "loss": 0.3626, - "step": 2066 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3602, - "step": 2067 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3444, - "step": 2068 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3562, - "step": 2069 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3565, - "step": 2070 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3564, - "step": 2071 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3551, - "step": 2072 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3509, - "step": 2073 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3642, - "step": 2074 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3599, - "step": 2075 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3731, - "step": 2076 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3675, - "step": 2077 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3424, - "step": 2078 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3507, - "step": 2079 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3552, - "step": 2080 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3604, - "step": 2081 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3464, - "step": 2082 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3623, - "step": 2083 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3578, - "step": 2084 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3507, - "step": 2085 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3508, - "step": 2086 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3512, - "step": 2087 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3593, - "step": 2088 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3821, - "step": 2089 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3516, - "step": 2090 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3547, - "step": 2091 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3452, - "step": 2092 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3512, - "step": 2093 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3504, - "step": 2094 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3518, - "step": 2095 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3608, - "step": 2096 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3615, - "step": 2097 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3551, - "step": 2098 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3904, - "step": 2099 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3477, - "step": 2100 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.36, - "step": 2101 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3408, - "step": 2102 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3447, - "step": 2103 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3674, - "step": 2104 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3516, - "step": 2105 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3543, - "step": 2106 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3566, - "step": 2107 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3497, - "step": 2108 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.365, - "step": 2109 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3419, - "step": 2110 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3405, - "step": 2111 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3509, - "step": 2112 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3631, - "step": 2113 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3447, - "step": 2114 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.345, - "step": 2115 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3681, - "step": 2116 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3728, - "step": 2117 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3559, - "step": 2118 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3481, - "step": 2119 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3551, - "step": 2120 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3397, - "step": 2121 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.349, - "step": 2122 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3364, - "step": 2123 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3672, - "step": 2124 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3369, - "step": 2125 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3446, - "step": 2126 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3477, - "step": 2127 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3486, - "step": 2128 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3395, - "step": 2129 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3596, - "step": 2130 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.348, - "step": 2131 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3523, - "step": 2132 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3351, - "step": 2133 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3439, - "step": 2134 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3578, - "step": 2135 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3557, - "step": 2136 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3787, - "step": 2137 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3458, - "step": 2138 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3427, - "step": 2139 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3635, - "step": 2140 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3704, - "step": 2141 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3565, - "step": 2142 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3768, - "step": 2143 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3334, - "step": 2144 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3363, - "step": 2145 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3178, - "step": 2146 - }, - { - "epoch": 0.26, - "learning_rate": 0.0003, - "loss": 0.3632, - "step": 2147 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3426, - "step": 2148 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3454, - "step": 2149 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3553, - "step": 2150 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3577, - "step": 2151 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3503, - "step": 2152 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3466, - "step": 2153 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3492, - "step": 2154 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3496, - "step": 2155 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3514, - "step": 2156 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3529, - "step": 2157 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3583, - "step": 2158 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3361, - "step": 2159 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3586, - "step": 2160 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3285, - "step": 2161 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3474, - "step": 2162 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3592, - "step": 2163 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3352, - "step": 2164 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3284, - "step": 2165 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3563, - "step": 2166 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.338, - "step": 2167 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3601, - "step": 2168 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3635, - "step": 2169 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3438, - "step": 2170 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.366, - "step": 2171 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3499, - "step": 2172 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3489, - "step": 2173 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3467, - "step": 2174 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3435, - "step": 2175 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3582, - "step": 2176 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3312, - "step": 2177 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3465, - "step": 2178 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3383, - "step": 2179 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3453, - "step": 2180 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3633, - "step": 2181 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3316, - "step": 2182 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3634, - "step": 2183 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3549, - "step": 2184 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3486, - "step": 2185 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3554, - "step": 2186 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.347, - "step": 2187 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3577, - "step": 2188 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3513, - "step": 2189 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3572, - "step": 2190 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.359, - "step": 2191 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.341, - "step": 2192 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3554, - "step": 2193 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3385, - "step": 2194 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3638, - "step": 2195 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3317, - "step": 2196 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3506, - "step": 2197 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3528, - "step": 2198 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.33, - "step": 2199 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3557, - "step": 2200 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3507, - "step": 2201 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3562, - "step": 2202 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3452, - "step": 2203 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3638, - "step": 2204 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3487, - "step": 2205 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3603, - "step": 2206 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3641, - "step": 2207 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3649, - "step": 2208 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3509, - "step": 2209 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3473, - "step": 2210 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3525, - "step": 2211 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3502, - "step": 2212 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3449, - "step": 2213 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3654, - "step": 2214 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3496, - "step": 2215 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3505, - "step": 2216 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3438, - "step": 2217 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3474, - "step": 2218 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3449, - "step": 2219 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3432, - "step": 2220 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.341, - "step": 2221 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3637, - "step": 2222 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3276, - "step": 2223 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3462, - "step": 2224 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3366, - "step": 2225 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.343, - "step": 2226 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3367, - "step": 2227 - }, - { - "epoch": 0.27, - "learning_rate": 0.0003, - "loss": 0.3596, - "step": 2228 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3564, - "step": 2229 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3352, - "step": 2230 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3511, - "step": 2231 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3362, - "step": 2232 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3626, - "step": 2233 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3487, - "step": 2234 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.339, - "step": 2235 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3265, - "step": 2236 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3383, - "step": 2237 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3548, - "step": 2238 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3785, - "step": 2239 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3469, - "step": 2240 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3502, - "step": 2241 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3549, - "step": 2242 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3498, - "step": 2243 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3415, - "step": 2244 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3683, - "step": 2245 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3605, - "step": 2246 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3449, - "step": 2247 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3414, - "step": 2248 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3537, - "step": 2249 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.345, - "step": 2250 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3427, - "step": 2251 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3548, - "step": 2252 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3554, - "step": 2253 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3458, - "step": 2254 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3437, - "step": 2255 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3561, - "step": 2256 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3421, - "step": 2257 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3295, - "step": 2258 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3445, - "step": 2259 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3366, - "step": 2260 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3484, - "step": 2261 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3331, - "step": 2262 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3543, - "step": 2263 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3168, - "step": 2264 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3404, - "step": 2265 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3501, - "step": 2266 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3378, - "step": 2267 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3472, - "step": 2268 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3454, - "step": 2269 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3462, - "step": 2270 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3489, - "step": 2271 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3543, - "step": 2272 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3664, - "step": 2273 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3501, - "step": 2274 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3474, - "step": 2275 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3442, - "step": 2276 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3361, - "step": 2277 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3381, - "step": 2278 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3562, - "step": 2279 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3674, - "step": 2280 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3552, - "step": 2281 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3666, - "step": 2282 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3518, - "step": 2283 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3576, - "step": 2284 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3434, - "step": 2285 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3335, - "step": 2286 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3421, - "step": 2287 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3492, - "step": 2288 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3232, - "step": 2289 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3409, - "step": 2290 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3501, - "step": 2291 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3558, - "step": 2292 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3462, - "step": 2293 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3262, - "step": 2294 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3545, - "step": 2295 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.342, - "step": 2296 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3626, - "step": 2297 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3555, - "step": 2298 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3457, - "step": 2299 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3411, - "step": 2300 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3484, - "step": 2301 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3264, - "step": 2302 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.325, - "step": 2303 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.335, - "step": 2304 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3517, - "step": 2305 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3497, - "step": 2306 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3446, - "step": 2307 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.338, - "step": 2308 - }, - { - "epoch": 0.28, - "learning_rate": 0.0003, - "loss": 0.3481, - "step": 2309 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3323, - "step": 2310 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3536, - "step": 2311 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3472, - "step": 2312 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3549, - "step": 2313 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3378, - "step": 2314 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3371, - "step": 2315 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3425, - "step": 2316 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3261, - "step": 2317 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3268, - "step": 2318 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3489, - "step": 2319 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3355, - "step": 2320 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3463, - "step": 2321 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3551, - "step": 2322 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3396, - "step": 2323 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3573, - "step": 2324 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.356, - "step": 2325 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3509, - "step": 2326 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3412, - "step": 2327 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.338, - "step": 2328 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.342, - "step": 2329 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3597, - "step": 2330 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3547, - "step": 2331 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3293, - "step": 2332 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.342, - "step": 2333 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.346, - "step": 2334 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3422, - "step": 2335 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.339, - "step": 2336 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3539, - "step": 2337 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3484, - "step": 2338 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3628, - "step": 2339 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3214, - "step": 2340 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3363, - "step": 2341 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3434, - "step": 2342 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3435, - "step": 2343 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3371, - "step": 2344 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3435, - "step": 2345 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3506, - "step": 2346 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3376, - "step": 2347 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3556, - "step": 2348 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3249, - "step": 2349 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3515, - "step": 2350 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3296, - "step": 2351 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3336, - "step": 2352 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.363, - "step": 2353 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3522, - "step": 2354 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3405, - "step": 2355 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3628, - "step": 2356 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.352, - "step": 2357 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3253, - "step": 2358 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3463, - "step": 2359 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3209, - "step": 2360 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3477, - "step": 2361 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3222, - "step": 2362 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3383, - "step": 2363 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3289, - "step": 2364 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3438, - "step": 2365 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3375, - "step": 2366 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3455, - "step": 2367 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3725, - "step": 2368 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3355, - "step": 2369 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3441, - "step": 2370 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3301, - "step": 2371 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3505, - "step": 2372 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3282, - "step": 2373 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.335, - "step": 2374 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3667, - "step": 2375 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3494, - "step": 2376 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3324, - "step": 2377 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3536, - "step": 2378 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3525, - "step": 2379 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3416, - "step": 2380 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.341, - "step": 2381 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.346, - "step": 2382 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3365, - "step": 2383 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3495, - "step": 2384 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3473, - "step": 2385 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3423, - "step": 2386 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3185, - "step": 2387 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3524, - "step": 2388 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.3297, - "step": 2389 - }, - { - "epoch": 0.29, - "learning_rate": 0.0003, - "loss": 0.343, - "step": 2390 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3256, - "step": 2391 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3439, - "step": 2392 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.347, - "step": 2393 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3338, - "step": 2394 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.347, - "step": 2395 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3449, - "step": 2396 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.343, - "step": 2397 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3366, - "step": 2398 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3771, - "step": 2399 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.337, - "step": 2400 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3451, - "step": 2401 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3323, - "step": 2402 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3309, - "step": 2403 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3416, - "step": 2404 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.317, - "step": 2405 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3509, - "step": 2406 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3358, - "step": 2407 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3591, - "step": 2408 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3329, - "step": 2409 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3369, - "step": 2410 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3413, - "step": 2411 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3548, - "step": 2412 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3288, - "step": 2413 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3449, - "step": 2414 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3416, - "step": 2415 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.326, - "step": 2416 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3264, - "step": 2417 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.345, - "step": 2418 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3468, - "step": 2419 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3351, - "step": 2420 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3333, - "step": 2421 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3281, - "step": 2422 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3398, - "step": 2423 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3413, - "step": 2424 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3323, - "step": 2425 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3614, - "step": 2426 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3362, - "step": 2427 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3447, - "step": 2428 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3447, - "step": 2429 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3315, - "step": 2430 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3157, - "step": 2431 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3376, - "step": 2432 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3506, - "step": 2433 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3231, - "step": 2434 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3191, - "step": 2435 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3451, - "step": 2436 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3432, - "step": 2437 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3387, - "step": 2438 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3335, - "step": 2439 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3503, - "step": 2440 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3477, - "step": 2441 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3312, - "step": 2442 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3308, - "step": 2443 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3387, - "step": 2444 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3393, - "step": 2445 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3313, - "step": 2446 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3514, - "step": 2447 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.349, - "step": 2448 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3431, - "step": 2449 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3395, - "step": 2450 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.312, - "step": 2451 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3599, - "step": 2452 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3256, - "step": 2453 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3452, - "step": 2454 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3354, - "step": 2455 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3246, - "step": 2456 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.333, - "step": 2457 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3167, - "step": 2458 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3309, - "step": 2459 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3478, - "step": 2460 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3371, - "step": 2461 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3425, - "step": 2462 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3608, - "step": 2463 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3436, - "step": 2464 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3283, - "step": 2465 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3217, - "step": 2466 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3281, - "step": 2467 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3336, - "step": 2468 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3372, - "step": 2469 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3573, - "step": 2470 - }, - { - "epoch": 0.3, - "learning_rate": 0.0003, - "loss": 0.3392, - "step": 2471 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3375, - "step": 2472 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3403, - "step": 2473 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3378, - "step": 2474 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3473, - "step": 2475 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3213, - "step": 2476 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3428, - "step": 2477 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3397, - "step": 2478 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3338, - "step": 2479 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3449, - "step": 2480 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3145, - "step": 2481 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3345, - "step": 2482 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.33, - "step": 2483 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3632, - "step": 2484 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3508, - "step": 2485 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.331, - "step": 2486 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.32, - "step": 2487 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3395, - "step": 2488 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3391, - "step": 2489 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3413, - "step": 2490 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3341, - "step": 2491 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3413, - "step": 2492 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3202, - "step": 2493 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3391, - "step": 2494 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3304, - "step": 2495 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3564, - "step": 2496 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3397, - "step": 2497 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3316, - "step": 2498 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3581, - "step": 2499 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3286, - "step": 2500 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3469, - "step": 2501 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3203, - "step": 2502 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.332, - "step": 2503 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3442, - "step": 2504 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3385, - "step": 2505 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3238, - "step": 2506 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3294, - "step": 2507 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3613, - "step": 2508 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.336, - "step": 2509 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3183, - "step": 2510 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3431, - "step": 2511 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3385, - "step": 2512 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3347, - "step": 2513 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3416, - "step": 2514 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.335, - "step": 2515 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3243, - "step": 2516 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3289, - "step": 2517 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3539, - "step": 2518 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3494, - "step": 2519 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.336, - "step": 2520 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.345, - "step": 2521 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3446, - "step": 2522 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3538, - "step": 2523 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3269, - "step": 2524 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3435, - "step": 2525 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3358, - "step": 2526 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.332, - "step": 2527 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3238, - "step": 2528 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3495, - "step": 2529 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3356, - "step": 2530 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.332, - "step": 2531 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3358, - "step": 2532 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3325, - "step": 2533 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3555, - "step": 2534 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3543, - "step": 2535 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3381, - "step": 2536 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3333, - "step": 2537 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3508, - "step": 2538 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.318, - "step": 2539 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3651, - "step": 2540 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3321, - "step": 2541 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3147, - "step": 2542 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.341, - "step": 2543 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3328, - "step": 2544 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.335, - "step": 2545 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3446, - "step": 2546 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3437, - "step": 2547 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3441, - "step": 2548 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3574, - "step": 2549 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3351, - "step": 2550 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.3173, - "step": 2551 - }, - { - "epoch": 0.31, - "learning_rate": 0.0003, - "loss": 0.338, - "step": 2552 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3312, - "step": 2553 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3312, - "step": 2554 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3251, - "step": 2555 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3325, - "step": 2556 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3174, - "step": 2557 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3403, - "step": 2558 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.347, - "step": 2559 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.338, - "step": 2560 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3267, - "step": 2561 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3326, - "step": 2562 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3319, - "step": 2563 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3323, - "step": 2564 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3429, - "step": 2565 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3389, - "step": 2566 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3492, - "step": 2567 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3136, - "step": 2568 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3307, - "step": 2569 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3303, - "step": 2570 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3339, - "step": 2571 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3512, - "step": 2572 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3171, - "step": 2573 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3216, - "step": 2574 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3239, - "step": 2575 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3404, - "step": 2576 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3208, - "step": 2577 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3279, - "step": 2578 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3434, - "step": 2579 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3225, - "step": 2580 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3317, - "step": 2581 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3363, - "step": 2582 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3231, - "step": 2583 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3268, - "step": 2584 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3383, - "step": 2585 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.334, - "step": 2586 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.32, - "step": 2587 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3299, - "step": 2588 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3381, - "step": 2589 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3422, - "step": 2590 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3485, - "step": 2591 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3376, - "step": 2592 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3474, - "step": 2593 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3197, - "step": 2594 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3242, - "step": 2595 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3272, - "step": 2596 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3398, - "step": 2597 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3391, - "step": 2598 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3345, - "step": 2599 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.324, - "step": 2600 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3255, - "step": 2601 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3367, - "step": 2602 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3289, - "step": 2603 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3327, - "step": 2604 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3176, - "step": 2605 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3268, - "step": 2606 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3326, - "step": 2607 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3551, - "step": 2608 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3193, - "step": 2609 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3358, - "step": 2610 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.342, - "step": 2611 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3384, - "step": 2612 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3292, - "step": 2613 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3341, - "step": 2614 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3513, - "step": 2615 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3228, - "step": 2616 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3387, - "step": 2617 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3206, - "step": 2618 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3323, - "step": 2619 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3315, - "step": 2620 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3255, - "step": 2621 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3478, - "step": 2622 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3245, - "step": 2623 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3282, - "step": 2624 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3375, - "step": 2625 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3104, - "step": 2626 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3384, - "step": 2627 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.326, - "step": 2628 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3256, - "step": 2629 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3405, - "step": 2630 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.333, - "step": 2631 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3165, - "step": 2632 - }, - { - "epoch": 0.32, - "learning_rate": 0.0003, - "loss": 0.3365, - "step": 2633 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3143, - "step": 2634 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.329, - "step": 2635 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3222, - "step": 2636 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3272, - "step": 2637 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3426, - "step": 2638 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3302, - "step": 2639 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3306, - "step": 2640 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3374, - "step": 2641 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3231, - "step": 2642 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3269, - "step": 2643 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3299, - "step": 2644 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3371, - "step": 2645 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3279, - "step": 2646 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.345, - "step": 2647 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3309, - "step": 2648 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3149, - "step": 2649 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3384, - "step": 2650 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3223, - "step": 2651 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3401, - "step": 2652 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3352, - "step": 2653 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3442, - "step": 2654 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3252, - "step": 2655 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3348, - "step": 2656 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3455, - "step": 2657 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3417, - "step": 2658 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3255, - "step": 2659 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3198, - "step": 2660 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3184, - "step": 2661 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3186, - "step": 2662 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3095, - "step": 2663 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3362, - "step": 2664 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3296, - "step": 2665 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3396, - "step": 2666 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3239, - "step": 2667 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3096, - "step": 2668 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3557, - "step": 2669 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3314, - "step": 2670 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3172, - "step": 2671 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3313, - "step": 2672 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3469, - "step": 2673 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3177, - "step": 2674 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3309, - "step": 2675 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3432, - "step": 2676 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3409, - "step": 2677 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3259, - "step": 2678 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3086, - "step": 2679 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3273, - "step": 2680 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3518, - "step": 2681 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3421, - "step": 2682 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3388, - "step": 2683 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3321, - "step": 2684 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3339, - "step": 2685 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3295, - "step": 2686 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3386, - "step": 2687 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3444, - "step": 2688 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3302, - "step": 2689 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3368, - "step": 2690 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3141, - "step": 2691 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3231, - "step": 2692 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3301, - "step": 2693 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3193, - "step": 2694 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3363, - "step": 2695 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3498, - "step": 2696 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3238, - "step": 2697 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3264, - "step": 2698 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.324, - "step": 2699 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3269, - "step": 2700 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3327, - "step": 2701 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3407, - "step": 2702 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3311, - "step": 2703 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3261, - "step": 2704 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3483, - "step": 2705 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3249, - "step": 2706 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3512, - "step": 2707 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3358, - "step": 2708 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3303, - "step": 2709 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3216, - "step": 2710 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3392, - "step": 2711 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3278, - "step": 2712 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3279, - "step": 2713 - }, - { - "epoch": 0.33, - "learning_rate": 0.0003, - "loss": 0.3149, - "step": 2714 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3209, - "step": 2715 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.316, - "step": 2716 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3299, - "step": 2717 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3313, - "step": 2718 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3325, - "step": 2719 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3409, - "step": 2720 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3168, - "step": 2721 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3406, - "step": 2722 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3399, - "step": 2723 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3421, - "step": 2724 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3469, - "step": 2725 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3272, - "step": 2726 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3167, - "step": 2727 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3503, - "step": 2728 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3421, - "step": 2729 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3272, - "step": 2730 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3221, - "step": 2731 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3095, - "step": 2732 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3339, - "step": 2733 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3329, - "step": 2734 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3347, - "step": 2735 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3142, - "step": 2736 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3363, - "step": 2737 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3287, - "step": 2738 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3296, - "step": 2739 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3355, - "step": 2740 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3439, - "step": 2741 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3215, - "step": 2742 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3372, - "step": 2743 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3219, - "step": 2744 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.336, - "step": 2745 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3107, - "step": 2746 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3371, - "step": 2747 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3286, - "step": 2748 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3184, - "step": 2749 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.332, - "step": 2750 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3474, - "step": 2751 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3131, - "step": 2752 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3223, - "step": 2753 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3352, - "step": 2754 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3295, - "step": 2755 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3336, - "step": 2756 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.34, - "step": 2757 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3332, - "step": 2758 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3303, - "step": 2759 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3111, - "step": 2760 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3313, - "step": 2761 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3221, - "step": 2762 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.336, - "step": 2763 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3261, - "step": 2764 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3179, - "step": 2765 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3404, - "step": 2766 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3414, - "step": 2767 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3381, - "step": 2768 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3258, - "step": 2769 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3307, - "step": 2770 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3184, - "step": 2771 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3419, - "step": 2772 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3198, - "step": 2773 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3206, - "step": 2774 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.333, - "step": 2775 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3163, - "step": 2776 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3343, - "step": 2777 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3302, - "step": 2778 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3258, - "step": 2779 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3263, - "step": 2780 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3275, - "step": 2781 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.329, - "step": 2782 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.323, - "step": 2783 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3376, - "step": 2784 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.317, - "step": 2785 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3413, - "step": 2786 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3243, - "step": 2787 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3249, - "step": 2788 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.325, - "step": 2789 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3425, - "step": 2790 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3415, - "step": 2791 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3525, - "step": 2792 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3272, - "step": 2793 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3231, - "step": 2794 - }, - { - "epoch": 0.34, - "learning_rate": 0.0003, - "loss": 0.3278, - "step": 2795 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3184, - "step": 2796 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3246, - "step": 2797 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3304, - "step": 2798 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3317, - "step": 2799 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3236, - "step": 2800 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3114, - "step": 2801 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3357, - "step": 2802 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3438, - "step": 2803 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3233, - "step": 2804 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3336, - "step": 2805 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3118, - "step": 2806 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3236, - "step": 2807 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.339, - "step": 2808 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3153, - "step": 2809 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3291, - "step": 2810 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3307, - "step": 2811 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3289, - "step": 2812 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3193, - "step": 2813 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3271, - "step": 2814 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3256, - "step": 2815 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.321, - "step": 2816 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3047, - "step": 2817 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3197, - "step": 2818 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3272, - "step": 2819 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3277, - "step": 2820 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3175, - "step": 2821 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3257, - "step": 2822 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3415, - "step": 2823 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3407, - "step": 2824 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3341, - "step": 2825 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3416, - "step": 2826 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3391, - "step": 2827 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3199, - "step": 2828 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3205, - "step": 2829 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3159, - "step": 2830 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3151, - "step": 2831 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3383, - "step": 2832 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3469, - "step": 2833 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.32, - "step": 2834 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3376, - "step": 2835 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3351, - "step": 2836 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3337, - "step": 2837 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3402, - "step": 2838 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3223, - "step": 2839 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3496, - "step": 2840 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3263, - "step": 2841 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.331, - "step": 2842 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3263, - "step": 2843 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.317, - "step": 2844 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3313, - "step": 2845 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3108, - "step": 2846 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3317, - "step": 2847 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3294, - "step": 2848 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3448, - "step": 2849 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3321, - "step": 2850 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3324, - "step": 2851 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3229, - "step": 2852 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3175, - "step": 2853 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3137, - "step": 2854 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3472, - "step": 2855 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.333, - "step": 2856 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3335, - "step": 2857 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.335, - "step": 2858 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3371, - "step": 2859 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3254, - "step": 2860 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3219, - "step": 2861 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3398, - "step": 2862 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3094, - "step": 2863 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3206, - "step": 2864 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3177, - "step": 2865 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3018, - "step": 2866 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3174, - "step": 2867 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.325, - "step": 2868 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3274, - "step": 2869 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.2992, - "step": 2870 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3185, - "step": 2871 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3081, - "step": 2872 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3153, - "step": 2873 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3257, - "step": 2874 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3466, - "step": 2875 - }, - { - "epoch": 0.35, - "learning_rate": 0.0003, - "loss": 0.3304, - "step": 2876 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3301, - "step": 2877 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3235, - "step": 2878 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3469, - "step": 2879 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3237, - "step": 2880 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3556, - "step": 2881 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3111, - "step": 2882 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.321, - "step": 2883 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.325, - "step": 2884 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3181, - "step": 2885 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3438, - "step": 2886 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3293, - "step": 2887 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3319, - "step": 2888 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3269, - "step": 2889 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3282, - "step": 2890 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3055, - "step": 2891 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3202, - "step": 2892 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3192, - "step": 2893 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3404, - "step": 2894 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3225, - "step": 2895 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3391, - "step": 2896 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3122, - "step": 2897 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3403, - "step": 2898 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3397, - "step": 2899 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3311, - "step": 2900 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3193, - "step": 2901 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3068, - "step": 2902 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3022, - "step": 2903 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3396, - "step": 2904 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.326, - "step": 2905 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3323, - "step": 2906 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3258, - "step": 2907 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3045, - "step": 2908 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3123, - "step": 2909 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3126, - "step": 2910 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3229, - "step": 2911 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3084, - "step": 2912 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3122, - "step": 2913 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3183, - "step": 2914 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3231, - "step": 2915 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3156, - "step": 2916 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3438, - "step": 2917 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3331, - "step": 2918 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3375, - "step": 2919 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3171, - "step": 2920 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3059, - "step": 2921 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3207, - "step": 2922 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3218, - "step": 2923 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3344, - "step": 2924 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3115, - "step": 2925 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3091, - "step": 2926 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3244, - "step": 2927 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3161, - "step": 2928 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3392, - "step": 2929 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3321, - "step": 2930 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3175, - "step": 2931 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3256, - "step": 2932 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3152, - "step": 2933 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3073, - "step": 2934 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3055, - "step": 2935 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3323, - "step": 2936 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3072, - "step": 2937 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3322, - "step": 2938 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3184, - "step": 2939 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3316, - "step": 2940 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.315, - "step": 2941 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3342, - "step": 2942 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3186, - "step": 2943 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3258, - "step": 2944 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3213, - "step": 2945 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3356, - "step": 2946 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3168, - "step": 2947 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3296, - "step": 2948 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3135, - "step": 2949 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3138, - "step": 2950 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3157, - "step": 2951 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3254, - "step": 2952 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3281, - "step": 2953 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3262, - "step": 2954 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3062, - "step": 2955 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.3056, - "step": 2956 - }, - { - "epoch": 0.36, - "learning_rate": 0.0003, - "loss": 0.2901, - "step": 2957 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3551, - "step": 2958 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3154, - "step": 2959 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3358, - "step": 2960 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3232, - "step": 2961 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3411, - "step": 2962 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.327, - "step": 2963 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3312, - "step": 2964 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3265, - "step": 2965 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3125, - "step": 2966 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3044, - "step": 2967 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3292, - "step": 2968 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3406, - "step": 2969 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3306, - "step": 2970 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3071, - "step": 2971 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3278, - "step": 2972 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3134, - "step": 2973 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3011, - "step": 2974 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3197, - "step": 2975 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3209, - "step": 2976 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.328, - "step": 2977 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3276, - "step": 2978 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3026, - "step": 2979 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3262, - "step": 2980 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3305, - "step": 2981 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3199, - "step": 2982 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3447, - "step": 2983 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3114, - "step": 2984 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3079, - "step": 2985 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3106, - "step": 2986 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3318, - "step": 2987 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3048, - "step": 2988 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3277, - "step": 2989 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3329, - "step": 2990 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3365, - "step": 2991 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3175, - "step": 2992 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3274, - "step": 2993 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3082, - "step": 2994 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3236, - "step": 2995 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3271, - "step": 2996 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3138, - "step": 2997 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3222, - "step": 2998 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3163, - "step": 2999 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3093, - "step": 3000 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3134, - "step": 3001 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3245, - "step": 3002 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3121, - "step": 3003 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3121, - "step": 3004 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3266, - "step": 3005 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3294, - "step": 3006 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3053, - "step": 3007 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3185, - "step": 3008 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3424, - "step": 3009 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3164, - "step": 3010 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3064, - "step": 3011 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.346, - "step": 3012 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3257, - "step": 3013 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3162, - "step": 3014 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3221, - "step": 3015 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3303, - "step": 3016 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3149, - "step": 3017 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3156, - "step": 3018 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3276, - "step": 3019 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3149, - "step": 3020 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3109, - "step": 3021 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3075, - "step": 3022 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.2905, - "step": 3023 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3119, - "step": 3024 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3046, - "step": 3025 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3085, - "step": 3026 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.2997, - "step": 3027 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.314, - "step": 3028 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3206, - "step": 3029 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3141, - "step": 3030 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3369, - "step": 3031 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3332, - "step": 3032 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.326, - "step": 3033 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3183, - "step": 3034 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3158, - "step": 3035 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3208, - "step": 3036 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3102, - "step": 3037 - }, - { - "epoch": 0.37, - "learning_rate": 0.0003, - "loss": 0.3252, - "step": 3038 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3422, - "step": 3039 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3282, - "step": 3040 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3259, - "step": 3041 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3134, - "step": 3042 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3411, - "step": 3043 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3352, - "step": 3044 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3446, - "step": 3045 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3147, - "step": 3046 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3341, - "step": 3047 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3093, - "step": 3048 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.31, - "step": 3049 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3353, - "step": 3050 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3413, - "step": 3051 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3204, - "step": 3052 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3203, - "step": 3053 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3143, - "step": 3054 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3313, - "step": 3055 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3131, - "step": 3056 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3245, - "step": 3057 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3477, - "step": 3058 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3285, - "step": 3059 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3319, - "step": 3060 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3138, - "step": 3061 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3107, - "step": 3062 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3195, - "step": 3063 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.305, - "step": 3064 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3216, - "step": 3065 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3036, - "step": 3066 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3063, - "step": 3067 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3092, - "step": 3068 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3288, - "step": 3069 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3122, - "step": 3070 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3348, - "step": 3071 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3241, - "step": 3072 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3269, - "step": 3073 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3424, - "step": 3074 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3077, - "step": 3075 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3152, - "step": 3076 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3302, - "step": 3077 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3212, - "step": 3078 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3264, - "step": 3079 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3489, - "step": 3080 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3137, - "step": 3081 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3092, - "step": 3082 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3231, - "step": 3083 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3268, - "step": 3084 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3152, - "step": 3085 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3328, - "step": 3086 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3337, - "step": 3087 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3066, - "step": 3088 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3226, - "step": 3089 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3087, - "step": 3090 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3174, - "step": 3091 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.304, - "step": 3092 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3174, - "step": 3093 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.309, - "step": 3094 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3197, - "step": 3095 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3389, - "step": 3096 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3344, - "step": 3097 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3002, - "step": 3098 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.2929, - "step": 3099 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3161, - "step": 3100 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3284, - "step": 3101 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3172, - "step": 3102 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3245, - "step": 3103 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3161, - "step": 3104 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3085, - "step": 3105 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3176, - "step": 3106 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3032, - "step": 3107 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.307, - "step": 3108 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.306, - "step": 3109 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3288, - "step": 3110 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3171, - "step": 3111 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3176, - "step": 3112 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3052, - "step": 3113 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3187, - "step": 3114 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3156, - "step": 3115 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3317, - "step": 3116 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.2987, - "step": 3117 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.3047, - "step": 3118 - }, - { - "epoch": 0.38, - "learning_rate": 0.0003, - "loss": 0.2929, - "step": 3119 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3074, - "step": 3120 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3088, - "step": 3121 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3247, - "step": 3122 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3173, - "step": 3123 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3134, - "step": 3124 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3041, - "step": 3125 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3104, - "step": 3126 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3073, - "step": 3127 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3158, - "step": 3128 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.291, - "step": 3129 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3152, - "step": 3130 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3033, - "step": 3131 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3091, - "step": 3132 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3128, - "step": 3133 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3092, - "step": 3134 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.298, - "step": 3135 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.2992, - "step": 3136 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3241, - "step": 3137 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.309, - "step": 3138 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3223, - "step": 3139 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3115, - "step": 3140 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3192, - "step": 3141 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3275, - "step": 3142 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3229, - "step": 3143 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3369, - "step": 3144 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3025, - "step": 3145 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3, - "step": 3146 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.319, - "step": 3147 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3118, - "step": 3148 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3213, - "step": 3149 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3164, - "step": 3150 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3283, - "step": 3151 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3318, - "step": 3152 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3231, - "step": 3153 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3077, - "step": 3154 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3291, - "step": 3155 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3105, - "step": 3156 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3057, - "step": 3157 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3215, - "step": 3158 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3233, - "step": 3159 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3044, - "step": 3160 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.304, - "step": 3161 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3267, - "step": 3162 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.2964, - "step": 3163 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3444, - "step": 3164 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3102, - "step": 3165 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3273, - "step": 3166 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3106, - "step": 3167 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3008, - "step": 3168 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.304, - "step": 3169 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3264, - "step": 3170 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3283, - "step": 3171 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3077, - "step": 3172 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3076, - "step": 3173 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3134, - "step": 3174 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3016, - "step": 3175 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3006, - "step": 3176 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3158, - "step": 3177 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3038, - "step": 3178 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3132, - "step": 3179 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3141, - "step": 3180 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.2942, - "step": 3181 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3155, - "step": 3182 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.308, - "step": 3183 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3241, - "step": 3184 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3178, - "step": 3185 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3227, - "step": 3186 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3161, - "step": 3187 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3266, - "step": 3188 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.325, - "step": 3189 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3001, - "step": 3190 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3193, - "step": 3191 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3216, - "step": 3192 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3142, - "step": 3193 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3138, - "step": 3194 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3021, - "step": 3195 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.2959, - "step": 3196 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3063, - "step": 3197 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3213, - "step": 3198 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3082, - "step": 3199 - }, - { - "epoch": 0.39, - "learning_rate": 0.0003, - "loss": 0.3166, - "step": 3200 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3089, - "step": 3201 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3232, - "step": 3202 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3253, - "step": 3203 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3118, - "step": 3204 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3093, - "step": 3205 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3321, - "step": 3206 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3186, - "step": 3207 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3226, - "step": 3208 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.322, - "step": 3209 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.2964, - "step": 3210 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3388, - "step": 3211 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3087, - "step": 3212 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3291, - "step": 3213 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3185, - "step": 3214 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3153, - "step": 3215 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3183, - "step": 3216 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3262, - "step": 3217 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3043, - "step": 3218 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3196, - "step": 3219 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3162, - "step": 3220 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3156, - "step": 3221 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3119, - "step": 3222 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3228, - "step": 3223 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3016, - "step": 3224 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3086, - "step": 3225 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.333, - "step": 3226 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3185, - "step": 3227 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3177, - "step": 3228 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3118, - "step": 3229 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3266, - "step": 3230 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3006, - "step": 3231 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3248, - "step": 3232 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3142, - "step": 3233 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.312, - "step": 3234 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.311, - "step": 3235 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3091, - "step": 3236 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3263, - "step": 3237 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3102, - "step": 3238 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3396, - "step": 3239 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3264, - "step": 3240 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3127, - "step": 3241 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.293, - "step": 3242 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3296, - "step": 3243 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3188, - "step": 3244 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3007, - "step": 3245 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3086, - "step": 3246 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3139, - "step": 3247 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3255, - "step": 3248 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3076, - "step": 3249 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.319, - "step": 3250 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3128, - "step": 3251 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3225, - "step": 3252 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.2995, - "step": 3253 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3089, - "step": 3254 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3013, - "step": 3255 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3065, - "step": 3256 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3149, - "step": 3257 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3256, - "step": 3258 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3082, - "step": 3259 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3187, - "step": 3260 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3164, - "step": 3261 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3125, - "step": 3262 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3214, - "step": 3263 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3186, - "step": 3264 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.2881, - "step": 3265 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3174, - "step": 3266 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3308, - "step": 3267 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3152, - "step": 3268 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3187, - "step": 3269 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3195, - "step": 3270 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3059, - "step": 3271 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3213, - "step": 3272 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3271, - "step": 3273 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3085, - "step": 3274 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3067, - "step": 3275 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3149, - "step": 3276 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3015, - "step": 3277 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3166, - "step": 3278 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3341, - "step": 3279 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.3041, - "step": 3280 - }, - { - "epoch": 0.4, - "learning_rate": 0.0003, - "loss": 0.296, - "step": 3281 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.2973, - "step": 3282 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3036, - "step": 3283 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3186, - "step": 3284 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3063, - "step": 3285 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3099, - "step": 3286 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3176, - "step": 3287 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3204, - "step": 3288 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3128, - "step": 3289 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3201, - "step": 3290 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3142, - "step": 3291 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3256, - "step": 3292 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3017, - "step": 3293 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.306, - "step": 3294 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3142, - "step": 3295 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3265, - "step": 3296 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3034, - "step": 3297 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3262, - "step": 3298 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.322, - "step": 3299 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3241, - "step": 3300 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3146, - "step": 3301 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3176, - "step": 3302 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3233, - "step": 3303 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3152, - "step": 3304 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3119, - "step": 3305 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.32, - "step": 3306 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.2907, - "step": 3307 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3167, - "step": 3308 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3112, - "step": 3309 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3118, - "step": 3310 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3039, - "step": 3311 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3217, - "step": 3312 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3088, - "step": 3313 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3085, - "step": 3314 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3094, - "step": 3315 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3283, - "step": 3316 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3055, - "step": 3317 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3046, - "step": 3318 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.2946, - "step": 3319 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.29, - "step": 3320 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3127, - "step": 3321 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3081, - "step": 3322 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3057, - "step": 3323 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.335, - "step": 3324 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3131, - "step": 3325 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3201, - "step": 3326 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3192, - "step": 3327 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.2968, - "step": 3328 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3026, - "step": 3329 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3092, - "step": 3330 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3136, - "step": 3331 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3158, - "step": 3332 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3112, - "step": 3333 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3138, - "step": 3334 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3042, - "step": 3335 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.2963, - "step": 3336 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.313, - "step": 3337 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3103, - "step": 3338 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3227, - "step": 3339 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3227, - "step": 3340 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.314, - "step": 3341 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3341, - "step": 3342 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3141, - "step": 3343 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.2989, - "step": 3344 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.2844, - "step": 3345 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.2967, - "step": 3346 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3007, - "step": 3347 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3215, - "step": 3348 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3273, - "step": 3349 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3015, - "step": 3350 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.2947, - "step": 3351 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3023, - "step": 3352 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3038, - "step": 3353 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3146, - "step": 3354 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3121, - "step": 3355 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3129, - "step": 3356 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3127, - "step": 3357 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3102, - "step": 3358 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3153, - "step": 3359 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3023, - "step": 3360 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.3164, - "step": 3361 - }, - { - "epoch": 0.41, - "learning_rate": 0.0003, - "loss": 0.2959, - "step": 3362 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.2981, - "step": 3363 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3006, - "step": 3364 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3157, - "step": 3365 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3215, - "step": 3366 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3089, - "step": 3367 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3312, - "step": 3368 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.302, - "step": 3369 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3071, - "step": 3370 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3083, - "step": 3371 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3052, - "step": 3372 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.325, - "step": 3373 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.2984, - "step": 3374 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3034, - "step": 3375 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.318, - "step": 3376 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3137, - "step": 3377 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3229, - "step": 3378 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3094, - "step": 3379 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3238, - "step": 3380 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3058, - "step": 3381 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3132, - "step": 3382 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3187, - "step": 3383 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.2916, - "step": 3384 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3132, - "step": 3385 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.2964, - "step": 3386 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.316, - "step": 3387 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3127, - "step": 3388 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3141, - "step": 3389 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.2796, - "step": 3390 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.2965, - "step": 3391 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.306, - "step": 3392 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3313, - "step": 3393 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3045, - "step": 3394 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3036, - "step": 3395 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3092, - "step": 3396 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3063, - "step": 3397 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3009, - "step": 3398 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3065, - "step": 3399 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.2909, - "step": 3400 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3152, - "step": 3401 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.2941, - "step": 3402 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3061, - "step": 3403 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3099, - "step": 3404 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3056, - "step": 3405 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3112, - "step": 3406 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3194, - "step": 3407 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3176, - "step": 3408 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3041, - "step": 3409 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3211, - "step": 3410 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3266, - "step": 3411 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3069, - "step": 3412 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.299, - "step": 3413 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3057, - "step": 3414 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3337, - "step": 3415 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3178, - "step": 3416 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3116, - "step": 3417 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3229, - "step": 3418 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3331, - "step": 3419 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3029, - "step": 3420 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3199, - "step": 3421 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3081, - "step": 3422 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3127, - "step": 3423 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3148, - "step": 3424 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3036, - "step": 3425 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3277, - "step": 3426 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3267, - "step": 3427 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3165, - "step": 3428 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3102, - "step": 3429 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3096, - "step": 3430 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3187, - "step": 3431 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3045, - "step": 3432 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3147, - "step": 3433 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3032, - "step": 3434 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.306, - "step": 3435 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3286, - "step": 3436 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3128, - "step": 3437 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3284, - "step": 3438 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3051, - "step": 3439 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3096, - "step": 3440 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3041, - "step": 3441 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3358, - "step": 3442 - }, - { - "epoch": 0.42, - "learning_rate": 0.0003, - "loss": 0.3117, - "step": 3443 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.2964, - "step": 3444 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3085, - "step": 3445 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3218, - "step": 3446 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.2988, - "step": 3447 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.2938, - "step": 3448 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.2929, - "step": 3449 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3221, - "step": 3450 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3099, - "step": 3451 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3286, - "step": 3452 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3222, - "step": 3453 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.306, - "step": 3454 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3012, - "step": 3455 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3038, - "step": 3456 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.2928, - "step": 3457 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3079, - "step": 3458 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3173, - "step": 3459 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3012, - "step": 3460 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3216, - "step": 3461 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3179, - "step": 3462 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.2991, - "step": 3463 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.295, - "step": 3464 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3178, - "step": 3465 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3004, - "step": 3466 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3217, - "step": 3467 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3352, - "step": 3468 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3085, - "step": 3469 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.311, - "step": 3470 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.2958, - "step": 3471 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3087, - "step": 3472 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.2913, - "step": 3473 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3183, - "step": 3474 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.296, - "step": 3475 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.2956, - "step": 3476 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3088, - "step": 3477 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3135, - "step": 3478 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.313, - "step": 3479 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3002, - "step": 3480 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3059, - "step": 3481 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3197, - "step": 3482 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3308, - "step": 3483 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3212, - "step": 3484 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.2971, - "step": 3485 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3111, - "step": 3486 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.2907, - "step": 3487 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.2917, - "step": 3488 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.309, - "step": 3489 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3234, - "step": 3490 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.31, - "step": 3491 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.2937, - "step": 3492 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.2983, - "step": 3493 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3053, - "step": 3494 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3185, - "step": 3495 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3084, - "step": 3496 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.304, - "step": 3497 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3051, - "step": 3498 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.2829, - "step": 3499 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.316, - "step": 3500 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3076, - "step": 3501 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3381, - "step": 3502 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3193, - "step": 3503 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.2867, - "step": 3504 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3026, - "step": 3505 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3045, - "step": 3506 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3002, - "step": 3507 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.2921, - "step": 3508 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3257, - "step": 3509 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3176, - "step": 3510 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3307, - "step": 3511 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3253, - "step": 3512 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3077, - "step": 3513 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.316, - "step": 3514 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3073, - "step": 3515 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3169, - "step": 3516 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3121, - "step": 3517 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3092, - "step": 3518 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3046, - "step": 3519 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3244, - "step": 3520 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3181, - "step": 3521 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3003, - "step": 3522 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3216, - "step": 3523 - }, - { - "epoch": 0.43, - "learning_rate": 0.0003, - "loss": 0.3066, - "step": 3524 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3171, - "step": 3525 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.2936, - "step": 3526 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.307, - "step": 3527 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.307, - "step": 3528 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3043, - "step": 3529 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.306, - "step": 3530 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.308, - "step": 3531 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3149, - "step": 3532 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3034, - "step": 3533 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.2965, - "step": 3534 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3034, - "step": 3535 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.2826, - "step": 3536 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3131, - "step": 3537 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3249, - "step": 3538 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3049, - "step": 3539 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3176, - "step": 3540 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3078, - "step": 3541 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.2907, - "step": 3542 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3085, - "step": 3543 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.304, - "step": 3544 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.2962, - "step": 3545 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3057, - "step": 3546 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3207, - "step": 3547 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.298, - "step": 3548 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.2962, - "step": 3549 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.2846, - "step": 3550 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.2976, - "step": 3551 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3022, - "step": 3552 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.2878, - "step": 3553 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3038, - "step": 3554 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.2942, - "step": 3555 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3187, - "step": 3556 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3169, - "step": 3557 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3061, - "step": 3558 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.2896, - "step": 3559 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3111, - "step": 3560 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3004, - "step": 3561 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3097, - "step": 3562 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.2898, - "step": 3563 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3058, - "step": 3564 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.307, - "step": 3565 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3103, - "step": 3566 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3111, - "step": 3567 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3083, - "step": 3568 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.322, - "step": 3569 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.318, - "step": 3570 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3082, - "step": 3571 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.31, - "step": 3572 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3228, - "step": 3573 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3029, - "step": 3574 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3155, - "step": 3575 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3018, - "step": 3576 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3131, - "step": 3577 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3117, - "step": 3578 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3056, - "step": 3579 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3025, - "step": 3580 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.318, - "step": 3581 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.31, - "step": 3582 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.32, - "step": 3583 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.31, - "step": 3584 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3057, - "step": 3585 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.2994, - "step": 3586 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3138, - "step": 3587 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.2956, - "step": 3588 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3091, - "step": 3589 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3022, - "step": 3590 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3182, - "step": 3591 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.312, - "step": 3592 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3034, - "step": 3593 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3349, - "step": 3594 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3242, - "step": 3595 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.2911, - "step": 3596 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.304, - "step": 3597 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3257, - "step": 3598 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.307, - "step": 3599 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3207, - "step": 3600 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3174, - "step": 3601 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.318, - "step": 3602 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.316, - "step": 3603 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.2942, - "step": 3604 - }, - { - "epoch": 0.44, - "learning_rate": 0.0003, - "loss": 0.3177, - "step": 3605 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3071, - "step": 3606 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3085, - "step": 3607 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3067, - "step": 3608 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3213, - "step": 3609 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3104, - "step": 3610 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.2951, - "step": 3611 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3127, - "step": 3612 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3047, - "step": 3613 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3122, - "step": 3614 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3005, - "step": 3615 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.2958, - "step": 3616 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3151, - "step": 3617 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.2908, - "step": 3618 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3204, - "step": 3619 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.2957, - "step": 3620 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3002, - "step": 3621 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3016, - "step": 3622 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3127, - "step": 3623 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3029, - "step": 3624 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.2853, - "step": 3625 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3174, - "step": 3626 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3048, - "step": 3627 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.2966, - "step": 3628 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3236, - "step": 3629 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.2872, - "step": 3630 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.2924, - "step": 3631 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.29, - "step": 3632 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3028, - "step": 3633 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3021, - "step": 3634 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3005, - "step": 3635 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3001, - "step": 3636 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3103, - "step": 3637 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.2964, - "step": 3638 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3072, - "step": 3639 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3063, - "step": 3640 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3116, - "step": 3641 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3004, - "step": 3642 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.287, - "step": 3643 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3071, - "step": 3644 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3052, - "step": 3645 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3118, - "step": 3646 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3081, - "step": 3647 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3052, - "step": 3648 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.2928, - "step": 3649 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3123, - "step": 3650 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3066, - "step": 3651 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.2926, - "step": 3652 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.2879, - "step": 3653 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.311, - "step": 3654 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3033, - "step": 3655 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3207, - "step": 3656 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.2955, - "step": 3657 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3053, - "step": 3658 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.2886, - "step": 3659 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3129, - "step": 3660 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.299, - "step": 3661 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.2931, - "step": 3662 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.325, - "step": 3663 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.2935, - "step": 3664 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.2829, - "step": 3665 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.302, - "step": 3666 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3134, - "step": 3667 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3114, - "step": 3668 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3143, - "step": 3669 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3051, - "step": 3670 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3165, - "step": 3671 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3075, - "step": 3672 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3038, - "step": 3673 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.308, - "step": 3674 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3231, - "step": 3675 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3246, - "step": 3676 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.2883, - "step": 3677 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.308, - "step": 3678 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3125, - "step": 3679 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3144, - "step": 3680 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3146, - "step": 3681 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.2821, - "step": 3682 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.2995, - "step": 3683 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.2906, - "step": 3684 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3036, - "step": 3685 - }, - { - "epoch": 0.45, - "learning_rate": 0.0003, - "loss": 0.3059, - "step": 3686 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.2883, - "step": 3687 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3459, - "step": 3688 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3054, - "step": 3689 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3004, - "step": 3690 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3186, - "step": 3691 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.2977, - "step": 3692 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3212, - "step": 3693 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.2976, - "step": 3694 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.2847, - "step": 3695 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.2952, - "step": 3696 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.312, - "step": 3697 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3086, - "step": 3698 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.2995, - "step": 3699 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3086, - "step": 3700 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.303, - "step": 3701 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3088, - "step": 3702 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.2889, - "step": 3703 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3223, - "step": 3704 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3057, - "step": 3705 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3078, - "step": 3706 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.2969, - "step": 3707 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3327, - "step": 3708 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3084, - "step": 3709 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3251, - "step": 3710 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3078, - "step": 3711 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3088, - "step": 3712 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3133, - "step": 3713 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.2915, - "step": 3714 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.2965, - "step": 3715 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3173, - "step": 3716 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3066, - "step": 3717 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.2958, - "step": 3718 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.2847, - "step": 3719 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3131, - "step": 3720 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3126, - "step": 3721 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.303, - "step": 3722 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3066, - "step": 3723 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3214, - "step": 3724 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3111, - "step": 3725 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.2964, - "step": 3726 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.2907, - "step": 3727 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.2928, - "step": 3728 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3206, - "step": 3729 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.2942, - "step": 3730 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3053, - "step": 3731 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.2892, - "step": 3732 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3028, - "step": 3733 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3155, - "step": 3734 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3077, - "step": 3735 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.2917, - "step": 3736 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.2957, - "step": 3737 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3071, - "step": 3738 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.2947, - "step": 3739 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3213, - "step": 3740 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.2936, - "step": 3741 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3254, - "step": 3742 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3211, - "step": 3743 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3071, - "step": 3744 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3087, - "step": 3745 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.2901, - "step": 3746 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3065, - "step": 3747 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3131, - "step": 3748 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3065, - "step": 3749 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.2952, - "step": 3750 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3135, - "step": 3751 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.2976, - "step": 3752 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.2958, - "step": 3753 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.307, - "step": 3754 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.2947, - "step": 3755 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3092, - "step": 3756 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3004, - "step": 3757 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.2891, - "step": 3758 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3041, - "step": 3759 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.2745, - "step": 3760 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.2973, - "step": 3761 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.2993, - "step": 3762 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.2983, - "step": 3763 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3079, - "step": 3764 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3081, - "step": 3765 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.2842, - "step": 3766 - }, - { - "epoch": 0.46, - "learning_rate": 0.0003, - "loss": 0.3007, - "step": 3767 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3043, - "step": 3768 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2942, - "step": 3769 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2907, - "step": 3770 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3041, - "step": 3771 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3181, - "step": 3772 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.305, - "step": 3773 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.296, - "step": 3774 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3116, - "step": 3775 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3104, - "step": 3776 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2923, - "step": 3777 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2965, - "step": 3778 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2827, - "step": 3779 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3032, - "step": 3780 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2974, - "step": 3781 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3036, - "step": 3782 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.304, - "step": 3783 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3124, - "step": 3784 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2947, - "step": 3785 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2914, - "step": 3786 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2902, - "step": 3787 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3204, - "step": 3788 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2979, - "step": 3789 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3033, - "step": 3790 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2976, - "step": 3791 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3047, - "step": 3792 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2935, - "step": 3793 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3177, - "step": 3794 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2869, - "step": 3795 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.286, - "step": 3796 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3097, - "step": 3797 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3033, - "step": 3798 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2806, - "step": 3799 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3112, - "step": 3800 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3218, - "step": 3801 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2861, - "step": 3802 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3092, - "step": 3803 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2918, - "step": 3804 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2856, - "step": 3805 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3063, - "step": 3806 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3009, - "step": 3807 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2927, - "step": 3808 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3147, - "step": 3809 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2798, - "step": 3810 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3114, - "step": 3811 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2953, - "step": 3812 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2952, - "step": 3813 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.307, - "step": 3814 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2916, - "step": 3815 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2835, - "step": 3816 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3095, - "step": 3817 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2904, - "step": 3818 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3009, - "step": 3819 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2955, - "step": 3820 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2871, - "step": 3821 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.29, - "step": 3822 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3046, - "step": 3823 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3057, - "step": 3824 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3062, - "step": 3825 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.302, - "step": 3826 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3011, - "step": 3827 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.313, - "step": 3828 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3132, - "step": 3829 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2808, - "step": 3830 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2965, - "step": 3831 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3307, - "step": 3832 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3032, - "step": 3833 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2995, - "step": 3834 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3054, - "step": 3835 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2998, - "step": 3836 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2992, - "step": 3837 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2877, - "step": 3838 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2998, - "step": 3839 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2997, - "step": 3840 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2967, - "step": 3841 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3135, - "step": 3842 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3128, - "step": 3843 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2906, - "step": 3844 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.3065, - "step": 3845 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2787, - "step": 3846 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.2939, - "step": 3847 - }, - { - "epoch": 0.47, - "learning_rate": 0.0003, - "loss": 0.315, - "step": 3848 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.286, - "step": 3849 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2833, - "step": 3850 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2953, - "step": 3851 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3134, - "step": 3852 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2971, - "step": 3853 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2896, - "step": 3854 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3053, - "step": 3855 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2905, - "step": 3856 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2957, - "step": 3857 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3057, - "step": 3858 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3051, - "step": 3859 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3033, - "step": 3860 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2891, - "step": 3861 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2985, - "step": 3862 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3114, - "step": 3863 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3062, - "step": 3864 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2955, - "step": 3865 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2956, - "step": 3866 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3076, - "step": 3867 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2852, - "step": 3868 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2978, - "step": 3869 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2979, - "step": 3870 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3059, - "step": 3871 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3041, - "step": 3872 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2971, - "step": 3873 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3021, - "step": 3874 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3289, - "step": 3875 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3029, - "step": 3876 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2987, - "step": 3877 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3139, - "step": 3878 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2965, - "step": 3879 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3096, - "step": 3880 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3056, - "step": 3881 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3064, - "step": 3882 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2883, - "step": 3883 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.296, - "step": 3884 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2964, - "step": 3885 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3049, - "step": 3886 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2836, - "step": 3887 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3027, - "step": 3888 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3037, - "step": 3889 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3037, - "step": 3890 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2947, - "step": 3891 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2888, - "step": 3892 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3003, - "step": 3893 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2857, - "step": 3894 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2925, - "step": 3895 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3167, - "step": 3896 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2937, - "step": 3897 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2904, - "step": 3898 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2938, - "step": 3899 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3042, - "step": 3900 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2903, - "step": 3901 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3149, - "step": 3902 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2957, - "step": 3903 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.275, - "step": 3904 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2863, - "step": 3905 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2979, - "step": 3906 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2906, - "step": 3907 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3005, - "step": 3908 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.313, - "step": 3909 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3113, - "step": 3910 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.308, - "step": 3911 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.302, - "step": 3912 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3121, - "step": 3913 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2993, - "step": 3914 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3235, - "step": 3915 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2959, - "step": 3916 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2895, - "step": 3917 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3076, - "step": 3918 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2947, - "step": 3919 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.2946, - "step": 3920 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3058, - "step": 3921 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.31, - "step": 3922 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3072, - "step": 3923 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3117, - "step": 3924 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3141, - "step": 3925 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.299, - "step": 3926 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.3073, - "step": 3927 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.293, - "step": 3928 - }, - { - "epoch": 0.48, - "learning_rate": 0.0003, - "loss": 0.287, - "step": 3929 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2856, - "step": 3930 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2893, - "step": 3931 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2949, - "step": 3932 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2946, - "step": 3933 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3108, - "step": 3934 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2835, - "step": 3935 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3228, - "step": 3936 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3161, - "step": 3937 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2772, - "step": 3938 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2942, - "step": 3939 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3155, - "step": 3940 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3139, - "step": 3941 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3051, - "step": 3942 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3065, - "step": 3943 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3018, - "step": 3944 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3054, - "step": 3945 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3004, - "step": 3946 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2942, - "step": 3947 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2926, - "step": 3948 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3013, - "step": 3949 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2981, - "step": 3950 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2776, - "step": 3951 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2972, - "step": 3952 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2937, - "step": 3953 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2859, - "step": 3954 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3133, - "step": 3955 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.283, - "step": 3956 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2856, - "step": 3957 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3078, - "step": 3958 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.309, - "step": 3959 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3062, - "step": 3960 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2875, - "step": 3961 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3188, - "step": 3962 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3033, - "step": 3963 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2985, - "step": 3964 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2793, - "step": 3965 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3061, - "step": 3966 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2955, - "step": 3967 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2795, - "step": 3968 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2977, - "step": 3969 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2986, - "step": 3970 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3028, - "step": 3971 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.292, - "step": 3972 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2746, - "step": 3973 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2998, - "step": 3974 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2951, - "step": 3975 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2923, - "step": 3976 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3002, - "step": 3977 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3108, - "step": 3978 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3047, - "step": 3979 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2806, - "step": 3980 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2953, - "step": 3981 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3052, - "step": 3982 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3055, - "step": 3983 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2875, - "step": 3984 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3055, - "step": 3985 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3059, - "step": 3986 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3004, - "step": 3987 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2981, - "step": 3988 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2932, - "step": 3989 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2751, - "step": 3990 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3162, - "step": 3991 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2991, - "step": 3992 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2933, - "step": 3993 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3106, - "step": 3994 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3023, - "step": 3995 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3009, - "step": 3996 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2969, - "step": 3997 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2884, - "step": 3998 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.313, - "step": 3999 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2953, - "step": 4000 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2897, - "step": 4001 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3117, - "step": 4002 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3107, - "step": 4003 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2964, - "step": 4004 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2862, - "step": 4005 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2783, - "step": 4006 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3227, - "step": 4007 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2979, - "step": 4008 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.3051, - "step": 4009 - }, - { - "epoch": 0.49, - "learning_rate": 0.0003, - "loss": 0.2905, - "step": 4010 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2962, - "step": 4011 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2938, - "step": 4012 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2838, - "step": 4013 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.3038, - "step": 4014 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2841, - "step": 4015 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2927, - "step": 4016 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2947, - "step": 4017 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2894, - "step": 4018 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2761, - "step": 4019 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2822, - "step": 4020 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.305, - "step": 4021 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.3073, - "step": 4022 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2936, - "step": 4023 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2928, - "step": 4024 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.3002, - "step": 4025 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.295, - "step": 4026 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.3056, - "step": 4027 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2944, - "step": 4028 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.284, - "step": 4029 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2961, - "step": 4030 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.293, - "step": 4031 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2863, - "step": 4032 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2964, - "step": 4033 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2911, - "step": 4034 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2882, - "step": 4035 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2729, - "step": 4036 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2876, - "step": 4037 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2945, - "step": 4038 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.3055, - "step": 4039 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.3009, - "step": 4040 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.3115, - "step": 4041 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.3126, - "step": 4042 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.3024, - "step": 4043 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2761, - "step": 4044 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.3217, - "step": 4045 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2863, - "step": 4046 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.3196, - "step": 4047 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.3123, - "step": 4048 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2911, - "step": 4049 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2846, - "step": 4050 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2962, - "step": 4051 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2819, - "step": 4052 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2869, - "step": 4053 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2888, - "step": 4054 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2889, - "step": 4055 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.3051, - "step": 4056 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2906, - "step": 4057 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.3199, - "step": 4058 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2912, - "step": 4059 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2983, - "step": 4060 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.3058, - "step": 4061 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.3101, - "step": 4062 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.3005, - "step": 4063 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2881, - "step": 4064 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2953, - "step": 4065 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.288, - "step": 4066 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.3063, - "step": 4067 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2966, - "step": 4068 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2965, - "step": 4069 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.3057, - "step": 4070 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.294, - "step": 4071 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.289, - "step": 4072 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2862, - "step": 4073 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.3014, - "step": 4074 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.3113, - "step": 4075 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2897, - "step": 4076 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2831, - "step": 4077 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2907, - "step": 4078 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2968, - "step": 4079 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2946, - "step": 4080 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.3082, - "step": 4081 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2985, - "step": 4082 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2861, - "step": 4083 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2943, - "step": 4084 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.3017, - "step": 4085 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.3023, - "step": 4086 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2927, - "step": 4087 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.3008, - "step": 4088 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.302, - "step": 4089 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.2869, - "step": 4090 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.3042, - "step": 4091 - }, - { - "epoch": 0.5, - "learning_rate": 0.0003, - "loss": 0.3109, - "step": 4092 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2875, - "step": 4093 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2978, - "step": 4094 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2863, - "step": 4095 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.3046, - "step": 4096 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.3034, - "step": 4097 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2858, - "step": 4098 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.295, - "step": 4099 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.3059, - "step": 4100 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2965, - "step": 4101 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.3225, - "step": 4102 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.3176, - "step": 4103 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2911, - "step": 4104 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.3165, - "step": 4105 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.3113, - "step": 4106 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2935, - "step": 4107 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2999, - "step": 4108 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2845, - "step": 4109 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2933, - "step": 4110 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2935, - "step": 4111 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2702, - "step": 4112 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2852, - "step": 4113 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.3202, - "step": 4114 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2934, - "step": 4115 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.294, - "step": 4116 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2989, - "step": 4117 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2885, - "step": 4118 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2915, - "step": 4119 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2972, - "step": 4120 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2837, - "step": 4121 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2918, - "step": 4122 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2675, - "step": 4123 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2924, - "step": 4124 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2888, - "step": 4125 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.3157, - "step": 4126 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.3016, - "step": 4127 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2953, - "step": 4128 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.307, - "step": 4129 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.304, - "step": 4130 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2932, - "step": 4131 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2874, - "step": 4132 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.3012, - "step": 4133 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2897, - "step": 4134 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.3074, - "step": 4135 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2864, - "step": 4136 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.3018, - "step": 4137 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2975, - "step": 4138 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2911, - "step": 4139 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2832, - "step": 4140 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2891, - "step": 4141 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2998, - "step": 4142 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2928, - "step": 4143 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2951, - "step": 4144 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2951, - "step": 4145 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2906, - "step": 4146 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.3025, - "step": 4147 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2928, - "step": 4148 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2971, - "step": 4149 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.3052, - "step": 4150 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2838, - "step": 4151 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2734, - "step": 4152 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2887, - "step": 4153 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2981, - "step": 4154 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.3072, - "step": 4155 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2922, - "step": 4156 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2995, - "step": 4157 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2862, - "step": 4158 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2622, - "step": 4159 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2907, - "step": 4160 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2872, - "step": 4161 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2894, - "step": 4162 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2899, - "step": 4163 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.3022, - "step": 4164 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2766, - "step": 4165 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2859, - "step": 4166 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2987, - "step": 4167 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2858, - "step": 4168 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2836, - "step": 4169 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2898, - "step": 4170 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.3016, - "step": 4171 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2962, - "step": 4172 - }, - { - "epoch": 0.51, - "learning_rate": 0.0003, - "loss": 0.2929, - "step": 4173 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2893, - "step": 4174 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.296, - "step": 4175 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.294, - "step": 4176 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2903, - "step": 4177 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.303, - "step": 4178 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2988, - "step": 4179 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2953, - "step": 4180 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.3027, - "step": 4181 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2839, - "step": 4182 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2747, - "step": 4183 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.3116, - "step": 4184 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2795, - "step": 4185 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2926, - "step": 4186 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.3066, - "step": 4187 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.3009, - "step": 4188 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2856, - "step": 4189 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2856, - "step": 4190 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2943, - "step": 4191 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2994, - "step": 4192 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2964, - "step": 4193 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2992, - "step": 4194 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2981, - "step": 4195 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2998, - "step": 4196 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2998, - "step": 4197 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2893, - "step": 4198 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.3133, - "step": 4199 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2827, - "step": 4200 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.291, - "step": 4201 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2904, - "step": 4202 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.3065, - "step": 4203 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.308, - "step": 4204 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.3061, - "step": 4205 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.291, - "step": 4206 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.315, - "step": 4207 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.3022, - "step": 4208 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2926, - "step": 4209 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2875, - "step": 4210 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.3122, - "step": 4211 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2851, - "step": 4212 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.299, - "step": 4213 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2746, - "step": 4214 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2847, - "step": 4215 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.3119, - "step": 4216 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.3089, - "step": 4217 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2847, - "step": 4218 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.3038, - "step": 4219 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2911, - "step": 4220 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.3058, - "step": 4221 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2908, - "step": 4222 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.3131, - "step": 4223 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.3059, - "step": 4224 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2807, - "step": 4225 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.3031, - "step": 4226 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2888, - "step": 4227 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.29, - "step": 4228 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2932, - "step": 4229 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.3005, - "step": 4230 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.3076, - "step": 4231 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2946, - "step": 4232 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2913, - "step": 4233 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2889, - "step": 4234 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2955, - "step": 4235 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.3009, - "step": 4236 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.287, - "step": 4237 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2787, - "step": 4238 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2974, - "step": 4239 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2781, - "step": 4240 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2986, - "step": 4241 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2888, - "step": 4242 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2852, - "step": 4243 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2946, - "step": 4244 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2975, - "step": 4245 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2863, - "step": 4246 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.299, - "step": 4247 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.3011, - "step": 4248 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2804, - "step": 4249 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2884, - "step": 4250 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2805, - "step": 4251 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.3023, - "step": 4252 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2846, - "step": 4253 - }, - { - "epoch": 0.52, - "learning_rate": 0.0003, - "loss": 0.2826, - "step": 4254 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2945, - "step": 4255 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.3011, - "step": 4256 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2974, - "step": 4257 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.3074, - "step": 4258 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.3037, - "step": 4259 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.3004, - "step": 4260 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2995, - "step": 4261 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2893, - "step": 4262 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2824, - "step": 4263 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2757, - "step": 4264 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2907, - "step": 4265 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2995, - "step": 4266 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.3068, - "step": 4267 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.287, - "step": 4268 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2985, - "step": 4269 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.3036, - "step": 4270 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2906, - "step": 4271 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2755, - "step": 4272 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2889, - "step": 4273 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.29, - "step": 4274 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2848, - "step": 4275 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2798, - "step": 4276 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.3174, - "step": 4277 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2974, - "step": 4278 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.3046, - "step": 4279 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2849, - "step": 4280 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.3009, - "step": 4281 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.298, - "step": 4282 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2946, - "step": 4283 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2795, - "step": 4284 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2841, - "step": 4285 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2636, - "step": 4286 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2904, - "step": 4287 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2865, - "step": 4288 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.293, - "step": 4289 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.296, - "step": 4290 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.302, - "step": 4291 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2999, - "step": 4292 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.3163, - "step": 4293 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2779, - "step": 4294 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2978, - "step": 4295 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2971, - "step": 4296 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.289, - "step": 4297 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2845, - "step": 4298 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2808, - "step": 4299 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2871, - "step": 4300 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2993, - "step": 4301 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.267, - "step": 4302 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.3013, - "step": 4303 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2888, - "step": 4304 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2971, - "step": 4305 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2918, - "step": 4306 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2919, - "step": 4307 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2922, - "step": 4308 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2851, - "step": 4309 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.294, - "step": 4310 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2866, - "step": 4311 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2879, - "step": 4312 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2783, - "step": 4313 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2884, - "step": 4314 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2805, - "step": 4315 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.3071, - "step": 4316 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2967, - "step": 4317 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2812, - "step": 4318 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.3064, - "step": 4319 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2785, - "step": 4320 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2885, - "step": 4321 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.3174, - "step": 4322 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2906, - "step": 4323 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2951, - "step": 4324 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2875, - "step": 4325 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2859, - "step": 4326 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2939, - "step": 4327 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2767, - "step": 4328 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2881, - "step": 4329 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2891, - "step": 4330 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.299, - "step": 4331 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2821, - "step": 4332 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2887, - "step": 4333 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2957, - "step": 4334 - }, - { - "epoch": 0.53, - "learning_rate": 0.0003, - "loss": 0.2917, - "step": 4335 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2866, - "step": 4336 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2953, - "step": 4337 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2941, - "step": 4338 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2891, - "step": 4339 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2942, - "step": 4340 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.3065, - "step": 4341 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2959, - "step": 4342 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2713, - "step": 4343 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2948, - "step": 4344 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.291, - "step": 4345 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.3072, - "step": 4346 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2893, - "step": 4347 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2927, - "step": 4348 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2773, - "step": 4349 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2764, - "step": 4350 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.3007, - "step": 4351 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2757, - "step": 4352 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.3109, - "step": 4353 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2798, - "step": 4354 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.292, - "step": 4355 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.3161, - "step": 4356 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2815, - "step": 4357 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2928, - "step": 4358 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2881, - "step": 4359 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2908, - "step": 4360 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2786, - "step": 4361 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2868, - "step": 4362 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2948, - "step": 4363 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2951, - "step": 4364 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2972, - "step": 4365 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2885, - "step": 4366 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2964, - "step": 4367 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2984, - "step": 4368 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.3094, - "step": 4369 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2783, - "step": 4370 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2848, - "step": 4371 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2698, - "step": 4372 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2966, - "step": 4373 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.301, - "step": 4374 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2878, - "step": 4375 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.3002, - "step": 4376 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2932, - "step": 4377 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2751, - "step": 4378 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2907, - "step": 4379 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.3023, - "step": 4380 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.3036, - "step": 4381 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2764, - "step": 4382 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2722, - "step": 4383 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.282, - "step": 4384 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2831, - "step": 4385 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2971, - "step": 4386 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2727, - "step": 4387 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.3039, - "step": 4388 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2813, - "step": 4389 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2915, - "step": 4390 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2968, - "step": 4391 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2946, - "step": 4392 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2932, - "step": 4393 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2721, - "step": 4394 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2929, - "step": 4395 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2765, - "step": 4396 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2878, - "step": 4397 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2887, - "step": 4398 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.282, - "step": 4399 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2938, - "step": 4400 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2813, - "step": 4401 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2788, - "step": 4402 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2874, - "step": 4403 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2933, - "step": 4404 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.283, - "step": 4405 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2806, - "step": 4406 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2904, - "step": 4407 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2757, - "step": 4408 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2989, - "step": 4409 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2715, - "step": 4410 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2833, - "step": 4411 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.3046, - "step": 4412 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2989, - "step": 4413 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2826, - "step": 4414 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2816, - "step": 4415 - }, - { - "epoch": 0.54, - "learning_rate": 0.0003, - "loss": 0.2856, - "step": 4416 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.276, - "step": 4417 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2875, - "step": 4418 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2913, - "step": 4419 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2938, - "step": 4420 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.3132, - "step": 4421 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.3025, - "step": 4422 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2808, - "step": 4423 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2932, - "step": 4424 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2943, - "step": 4425 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2944, - "step": 4426 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.3005, - "step": 4427 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.3014, - "step": 4428 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2923, - "step": 4429 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2762, - "step": 4430 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.296, - "step": 4431 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2971, - "step": 4432 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2949, - "step": 4433 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2922, - "step": 4434 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2762, - "step": 4435 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.3049, - "step": 4436 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.3117, - "step": 4437 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2981, - "step": 4438 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.3011, - "step": 4439 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.3099, - "step": 4440 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2797, - "step": 4441 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2898, - "step": 4442 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.287, - "step": 4443 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2931, - "step": 4444 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2799, - "step": 4445 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.3005, - "step": 4446 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.3013, - "step": 4447 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.305, - "step": 4448 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2743, - "step": 4449 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2691, - "step": 4450 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2788, - "step": 4451 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2806, - "step": 4452 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2936, - "step": 4453 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2927, - "step": 4454 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.273, - "step": 4455 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2759, - "step": 4456 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2945, - "step": 4457 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2954, - "step": 4458 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2774, - "step": 4459 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2838, - "step": 4460 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2893, - "step": 4461 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2821, - "step": 4462 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.3118, - "step": 4463 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2934, - "step": 4464 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2716, - "step": 4465 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2868, - "step": 4466 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2955, - "step": 4467 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2807, - "step": 4468 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2909, - "step": 4469 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.291, - "step": 4470 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2948, - "step": 4471 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2928, - "step": 4472 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2744, - "step": 4473 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2768, - "step": 4474 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.293, - "step": 4475 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2842, - "step": 4476 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.3014, - "step": 4477 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2894, - "step": 4478 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2733, - "step": 4479 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2915, - "step": 4480 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.3079, - "step": 4481 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2848, - "step": 4482 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.3142, - "step": 4483 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.3016, - "step": 4484 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2958, - "step": 4485 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2753, - "step": 4486 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2655, - "step": 4487 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2868, - "step": 4488 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2864, - "step": 4489 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2848, - "step": 4490 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.3097, - "step": 4491 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2858, - "step": 4492 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2857, - "step": 4493 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2772, - "step": 4494 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2928, - "step": 4495 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.2893, - "step": 4496 - }, - { - "epoch": 0.55, - "learning_rate": 0.0003, - "loss": 0.286, - "step": 4497 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.3057, - "step": 4498 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.3021, - "step": 4499 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2896, - "step": 4500 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2851, - "step": 4501 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2641, - "step": 4502 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2884, - "step": 4503 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.3005, - "step": 4504 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.284, - "step": 4505 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2737, - "step": 4506 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.293, - "step": 4507 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2941, - "step": 4508 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2916, - "step": 4509 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2699, - "step": 4510 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2834, - "step": 4511 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.3026, - "step": 4512 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.3019, - "step": 4513 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.3103, - "step": 4514 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2908, - "step": 4515 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.3041, - "step": 4516 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.3084, - "step": 4517 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2753, - "step": 4518 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.3016, - "step": 4519 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2819, - "step": 4520 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.3029, - "step": 4521 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2896, - "step": 4522 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2763, - "step": 4523 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2973, - "step": 4524 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2869, - "step": 4525 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.3126, - "step": 4526 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2814, - "step": 4527 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2842, - "step": 4528 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.3049, - "step": 4529 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.29, - "step": 4530 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2913, - "step": 4531 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.287, - "step": 4532 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2857, - "step": 4533 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2706, - "step": 4534 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2855, - "step": 4535 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2827, - "step": 4536 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2994, - "step": 4537 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.3055, - "step": 4538 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2995, - "step": 4539 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2832, - "step": 4540 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2976, - "step": 4541 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.299, - "step": 4542 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2811, - "step": 4543 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2818, - "step": 4544 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2833, - "step": 4545 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2808, - "step": 4546 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.3082, - "step": 4547 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2897, - "step": 4548 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2869, - "step": 4549 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2979, - "step": 4550 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2717, - "step": 4551 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2791, - "step": 4552 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.284, - "step": 4553 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.291, - "step": 4554 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2903, - "step": 4555 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2951, - "step": 4556 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2896, - "step": 4557 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2965, - "step": 4558 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2779, - "step": 4559 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2846, - "step": 4560 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2868, - "step": 4561 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2826, - "step": 4562 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2999, - "step": 4563 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2953, - "step": 4564 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2902, - "step": 4565 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2623, - "step": 4566 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2722, - "step": 4567 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2929, - "step": 4568 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2901, - "step": 4569 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2852, - "step": 4570 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.296, - "step": 4571 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2558, - "step": 4572 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.314, - "step": 4573 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2951, - "step": 4574 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2829, - "step": 4575 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2884, - "step": 4576 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2824, - "step": 4577 - }, - { - "epoch": 0.56, - "learning_rate": 0.0003, - "loss": 0.2776, - "step": 4578 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2915, - "step": 4579 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.292, - "step": 4580 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.288, - "step": 4581 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2788, - "step": 4582 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.302, - "step": 4583 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2859, - "step": 4584 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2779, - "step": 4585 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2863, - "step": 4586 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2902, - "step": 4587 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.276, - "step": 4588 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2949, - "step": 4589 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2695, - "step": 4590 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2798, - "step": 4591 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2795, - "step": 4592 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2603, - "step": 4593 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2853, - "step": 4594 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2983, - "step": 4595 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.278, - "step": 4596 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2948, - "step": 4597 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2935, - "step": 4598 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.299, - "step": 4599 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2785, - "step": 4600 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2775, - "step": 4601 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2816, - "step": 4602 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2859, - "step": 4603 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2847, - "step": 4604 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2692, - "step": 4605 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2972, - "step": 4606 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2913, - "step": 4607 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2808, - "step": 4608 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2769, - "step": 4609 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.3019, - "step": 4610 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2899, - "step": 4611 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.3053, - "step": 4612 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.298, - "step": 4613 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2805, - "step": 4614 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2773, - "step": 4615 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2816, - "step": 4616 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2929, - "step": 4617 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2764, - "step": 4618 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2913, - "step": 4619 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.3014, - "step": 4620 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.3053, - "step": 4621 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2859, - "step": 4622 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2831, - "step": 4623 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2924, - "step": 4624 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2945, - "step": 4625 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.3, - "step": 4626 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2981, - "step": 4627 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2926, - "step": 4628 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2762, - "step": 4629 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2837, - "step": 4630 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2811, - "step": 4631 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2938, - "step": 4632 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2928, - "step": 4633 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2983, - "step": 4634 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2916, - "step": 4635 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2757, - "step": 4636 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.3034, - "step": 4637 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2803, - "step": 4638 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2843, - "step": 4639 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2969, - "step": 4640 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2724, - "step": 4641 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2925, - "step": 4642 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2968, - "step": 4643 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.3006, - "step": 4644 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2918, - "step": 4645 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2928, - "step": 4646 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.303, - "step": 4647 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2865, - "step": 4648 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.267, - "step": 4649 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2684, - "step": 4650 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.3046, - "step": 4651 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2911, - "step": 4652 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2873, - "step": 4653 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2902, - "step": 4654 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2952, - "step": 4655 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2759, - "step": 4656 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2741, - "step": 4657 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2969, - "step": 4658 - }, - { - "epoch": 0.57, - "learning_rate": 0.0003, - "loss": 0.2976, - "step": 4659 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2864, - "step": 4660 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2933, - "step": 4661 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.286, - "step": 4662 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.301, - "step": 4663 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.3005, - "step": 4664 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2907, - "step": 4665 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.305, - "step": 4666 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2859, - "step": 4667 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2911, - "step": 4668 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.285, - "step": 4669 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2786, - "step": 4670 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2891, - "step": 4671 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2753, - "step": 4672 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2804, - "step": 4673 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.277, - "step": 4674 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2932, - "step": 4675 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2853, - "step": 4676 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2865, - "step": 4677 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2737, - "step": 4678 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2957, - "step": 4679 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2758, - "step": 4680 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2787, - "step": 4681 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2996, - "step": 4682 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2953, - "step": 4683 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2762, - "step": 4684 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2885, - "step": 4685 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2918, - "step": 4686 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2892, - "step": 4687 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2902, - "step": 4688 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2916, - "step": 4689 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2778, - "step": 4690 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2812, - "step": 4691 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2898, - "step": 4692 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2794, - "step": 4693 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2773, - "step": 4694 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.294, - "step": 4695 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2808, - "step": 4696 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2915, - "step": 4697 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2744, - "step": 4698 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2886, - "step": 4699 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2856, - "step": 4700 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2959, - "step": 4701 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.271, - "step": 4702 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.3025, - "step": 4703 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.3071, - "step": 4704 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2962, - "step": 4705 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2861, - "step": 4706 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2942, - "step": 4707 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2888, - "step": 4708 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2747, - "step": 4709 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.3045, - "step": 4710 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2801, - "step": 4711 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2803, - "step": 4712 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.3096, - "step": 4713 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2909, - "step": 4714 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2879, - "step": 4715 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.3019, - "step": 4716 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2904, - "step": 4717 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2826, - "step": 4718 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.285, - "step": 4719 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2989, - "step": 4720 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2963, - "step": 4721 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2987, - "step": 4722 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2863, - "step": 4723 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2727, - "step": 4724 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2756, - "step": 4725 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.276, - "step": 4726 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2994, - "step": 4727 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2995, - "step": 4728 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2904, - "step": 4729 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2865, - "step": 4730 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2835, - "step": 4731 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2899, - "step": 4732 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2713, - "step": 4733 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2866, - "step": 4734 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2969, - "step": 4735 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2885, - "step": 4736 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.284, - "step": 4737 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2833, - "step": 4738 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2816, - "step": 4739 - }, - { - "epoch": 0.58, - "learning_rate": 0.0003, - "loss": 0.2963, - "step": 4740 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2674, - "step": 4741 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.3015, - "step": 4742 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2887, - "step": 4743 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.273, - "step": 4744 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2839, - "step": 4745 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2888, - "step": 4746 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2939, - "step": 4747 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2724, - "step": 4748 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.311, - "step": 4749 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2913, - "step": 4750 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.269, - "step": 4751 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2859, - "step": 4752 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2833, - "step": 4753 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2963, - "step": 4754 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2916, - "step": 4755 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2908, - "step": 4756 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2651, - "step": 4757 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2911, - "step": 4758 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2963, - "step": 4759 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2822, - "step": 4760 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.28, - "step": 4761 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2808, - "step": 4762 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.3002, - "step": 4763 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2963, - "step": 4764 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2766, - "step": 4765 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2724, - "step": 4766 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2835, - "step": 4767 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2739, - "step": 4768 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2824, - "step": 4769 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2856, - "step": 4770 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2821, - "step": 4771 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.3012, - "step": 4772 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2983, - "step": 4773 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2964, - "step": 4774 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2683, - "step": 4775 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2829, - "step": 4776 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2807, - "step": 4777 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2821, - "step": 4778 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2786, - "step": 4779 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2655, - "step": 4780 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2863, - "step": 4781 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2526, - "step": 4782 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2898, - "step": 4783 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2791, - "step": 4784 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2913, - "step": 4785 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2956, - "step": 4786 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2867, - "step": 4787 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.301, - "step": 4788 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2874, - "step": 4789 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2843, - "step": 4790 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2615, - "step": 4791 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2752, - "step": 4792 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2908, - "step": 4793 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2886, - "step": 4794 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2839, - "step": 4795 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2906, - "step": 4796 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2961, - "step": 4797 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2984, - "step": 4798 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2951, - "step": 4799 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.278, - "step": 4800 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.272, - "step": 4801 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2901, - "step": 4802 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2827, - "step": 4803 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2863, - "step": 4804 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.274, - "step": 4805 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2803, - "step": 4806 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2909, - "step": 4807 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.303, - "step": 4808 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2923, - "step": 4809 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.3041, - "step": 4810 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2772, - "step": 4811 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.282, - "step": 4812 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.3001, - "step": 4813 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2844, - "step": 4814 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2624, - "step": 4815 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.3082, - "step": 4816 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2887, - "step": 4817 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2795, - "step": 4818 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.3035, - "step": 4819 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2945, - "step": 4820 - }, - { - "epoch": 0.59, - "learning_rate": 0.0003, - "loss": 0.2875, - "step": 4821 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2632, - "step": 4822 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2763, - "step": 4823 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2869, - "step": 4824 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2846, - "step": 4825 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2868, - "step": 4826 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2687, - "step": 4827 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2963, - "step": 4828 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.3042, - "step": 4829 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2973, - "step": 4830 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2866, - "step": 4831 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2836, - "step": 4832 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2995, - "step": 4833 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2859, - "step": 4834 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.3016, - "step": 4835 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.3016, - "step": 4836 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2997, - "step": 4837 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2876, - "step": 4838 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2731, - "step": 4839 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.306, - "step": 4840 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2915, - "step": 4841 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2944, - "step": 4842 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2913, - "step": 4843 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2919, - "step": 4844 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2671, - "step": 4845 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.285, - "step": 4846 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2943, - "step": 4847 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2905, - "step": 4848 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2933, - "step": 4849 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2889, - "step": 4850 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2826, - "step": 4851 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.268, - "step": 4852 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2759, - "step": 4853 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2859, - "step": 4854 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2679, - "step": 4855 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2975, - "step": 4856 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.276, - "step": 4857 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2928, - "step": 4858 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2722, - "step": 4859 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2924, - "step": 4860 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.284, - "step": 4861 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2698, - "step": 4862 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2839, - "step": 4863 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2801, - "step": 4864 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2952, - "step": 4865 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.3003, - "step": 4866 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2854, - "step": 4867 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2937, - "step": 4868 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2798, - "step": 4869 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2786, - "step": 4870 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2726, - "step": 4871 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2788, - "step": 4872 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2925, - "step": 4873 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2807, - "step": 4874 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2876, - "step": 4875 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2808, - "step": 4876 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2902, - "step": 4877 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2987, - "step": 4878 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2865, - "step": 4879 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2669, - "step": 4880 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2935, - "step": 4881 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2823, - "step": 4882 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2805, - "step": 4883 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2814, - "step": 4884 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2845, - "step": 4885 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2747, - "step": 4886 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2765, - "step": 4887 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.291, - "step": 4888 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.291, - "step": 4889 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2937, - "step": 4890 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2839, - "step": 4891 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.264, - "step": 4892 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2883, - "step": 4893 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2933, - "step": 4894 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2838, - "step": 4895 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2902, - "step": 4896 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2954, - "step": 4897 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2925, - "step": 4898 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2654, - "step": 4899 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2805, - "step": 4900 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.284, - "step": 4901 - }, - { - "epoch": 0.6, - "learning_rate": 0.0003, - "loss": 0.2903, - "step": 4902 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2833, - "step": 4903 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.281, - "step": 4904 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2751, - "step": 4905 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2863, - "step": 4906 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2803, - "step": 4907 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.29, - "step": 4908 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2875, - "step": 4909 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2863, - "step": 4910 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2729, - "step": 4911 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2837, - "step": 4912 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2686, - "step": 4913 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2764, - "step": 4914 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2831, - "step": 4915 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.294, - "step": 4916 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2765, - "step": 4917 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2946, - "step": 4918 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2891, - "step": 4919 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2992, - "step": 4920 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.287, - "step": 4921 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2821, - "step": 4922 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2803, - "step": 4923 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.274, - "step": 4924 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2694, - "step": 4925 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2788, - "step": 4926 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2845, - "step": 4927 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2769, - "step": 4928 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2735, - "step": 4929 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2837, - "step": 4930 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.287, - "step": 4931 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.3014, - "step": 4932 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2676, - "step": 4933 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2823, - "step": 4934 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2638, - "step": 4935 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2949, - "step": 4936 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2917, - "step": 4937 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2767, - "step": 4938 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2597, - "step": 4939 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2995, - "step": 4940 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2852, - "step": 4941 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2887, - "step": 4942 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2875, - "step": 4943 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2774, - "step": 4944 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2899, - "step": 4945 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2755, - "step": 4946 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2977, - "step": 4947 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2837, - "step": 4948 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2907, - "step": 4949 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2769, - "step": 4950 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2915, - "step": 4951 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2773, - "step": 4952 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2853, - "step": 4953 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2893, - "step": 4954 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2845, - "step": 4955 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.3013, - "step": 4956 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2875, - "step": 4957 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2747, - "step": 4958 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.275, - "step": 4959 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2896, - "step": 4960 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2828, - "step": 4961 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2716, - "step": 4962 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.278, - "step": 4963 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.287, - "step": 4964 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2747, - "step": 4965 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2887, - "step": 4966 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2935, - "step": 4967 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2888, - "step": 4968 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2951, - "step": 4969 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.3038, - "step": 4970 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.3011, - "step": 4971 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2883, - "step": 4972 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.279, - "step": 4973 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.27, - "step": 4974 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2939, - "step": 4975 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2797, - "step": 4976 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2763, - "step": 4977 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2765, - "step": 4978 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2745, - "step": 4979 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2932, - "step": 4980 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2927, - "step": 4981 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2718, - "step": 4982 - }, - { - "epoch": 0.61, - "learning_rate": 0.0003, - "loss": 0.2945, - "step": 4983 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2841, - "step": 4984 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2866, - "step": 4985 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2716, - "step": 4986 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2898, - "step": 4987 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2635, - "step": 4988 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2844, - "step": 4989 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2677, - "step": 4990 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2706, - "step": 4991 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2743, - "step": 4992 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2954, - "step": 4993 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.288, - "step": 4994 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.276, - "step": 4995 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2687, - "step": 4996 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2854, - "step": 4997 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2755, - "step": 4998 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2736, - "step": 4999 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2845, - "step": 5000 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2855, - "step": 5001 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2763, - "step": 5002 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2958, - "step": 5003 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2939, - "step": 5004 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.3015, - "step": 5005 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.296, - "step": 5006 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2808, - "step": 5007 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2916, - "step": 5008 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2646, - "step": 5009 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2893, - "step": 5010 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2847, - "step": 5011 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2815, - "step": 5012 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2801, - "step": 5013 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2871, - "step": 5014 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2775, - "step": 5015 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2918, - "step": 5016 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.274, - "step": 5017 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2906, - "step": 5018 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2809, - "step": 5019 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2823, - "step": 5020 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2748, - "step": 5021 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.296, - "step": 5022 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2776, - "step": 5023 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2942, - "step": 5024 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2772, - "step": 5025 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2917, - "step": 5026 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.3103, - "step": 5027 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2984, - "step": 5028 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2907, - "step": 5029 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2753, - "step": 5030 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2717, - "step": 5031 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2795, - "step": 5032 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2844, - "step": 5033 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2799, - "step": 5034 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2769, - "step": 5035 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.295, - "step": 5036 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2774, - "step": 5037 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2675, - "step": 5038 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2828, - "step": 5039 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2737, - "step": 5040 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.297, - "step": 5041 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2926, - "step": 5042 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2875, - "step": 5043 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2921, - "step": 5044 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2748, - "step": 5045 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2825, - "step": 5046 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2846, - "step": 5047 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2705, - "step": 5048 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2904, - "step": 5049 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2699, - "step": 5050 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2666, - "step": 5051 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.3038, - "step": 5052 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.3012, - "step": 5053 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2577, - "step": 5054 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2816, - "step": 5055 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2826, - "step": 5056 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2715, - "step": 5057 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2815, - "step": 5058 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2771, - "step": 5059 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2951, - "step": 5060 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.276, - "step": 5061 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.284, - "step": 5062 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2782, - "step": 5063 - }, - { - "epoch": 0.62, - "learning_rate": 0.0003, - "loss": 0.2895, - "step": 5064 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2976, - "step": 5065 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.3017, - "step": 5066 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2912, - "step": 5067 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.276, - "step": 5068 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2906, - "step": 5069 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2727, - "step": 5070 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2572, - "step": 5071 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2839, - "step": 5072 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2855, - "step": 5073 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2768, - "step": 5074 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2808, - "step": 5075 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2554, - "step": 5076 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2762, - "step": 5077 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2939, - "step": 5078 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2852, - "step": 5079 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2901, - "step": 5080 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.279, - "step": 5081 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2884, - "step": 5082 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2933, - "step": 5083 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2945, - "step": 5084 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.3144, - "step": 5085 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2909, - "step": 5086 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2864, - "step": 5087 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2667, - "step": 5088 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2946, - "step": 5089 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2871, - "step": 5090 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.3071, - "step": 5091 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2739, - "step": 5092 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2838, - "step": 5093 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2923, - "step": 5094 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2911, - "step": 5095 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2688, - "step": 5096 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2701, - "step": 5097 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.292, - "step": 5098 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2657, - "step": 5099 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2746, - "step": 5100 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2815, - "step": 5101 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2693, - "step": 5102 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2941, - "step": 5103 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.273, - "step": 5104 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2907, - "step": 5105 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2812, - "step": 5106 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2955, - "step": 5107 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2781, - "step": 5108 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2906, - "step": 5109 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2683, - "step": 5110 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2897, - "step": 5111 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2857, - "step": 5112 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.292, - "step": 5113 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2826, - "step": 5114 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2906, - "step": 5115 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2817, - "step": 5116 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.295, - "step": 5117 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2905, - "step": 5118 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2863, - "step": 5119 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2832, - "step": 5120 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2758, - "step": 5121 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.286, - "step": 5122 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.288, - "step": 5123 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2855, - "step": 5124 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2758, - "step": 5125 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2901, - "step": 5126 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2783, - "step": 5127 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2969, - "step": 5128 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.276, - "step": 5129 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2824, - "step": 5130 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2913, - "step": 5131 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2765, - "step": 5132 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2617, - "step": 5133 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2823, - "step": 5134 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2735, - "step": 5135 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2682, - "step": 5136 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2793, - "step": 5137 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2916, - "step": 5138 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2896, - "step": 5139 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2571, - "step": 5140 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2869, - "step": 5141 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2633, - "step": 5142 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2887, - "step": 5143 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2713, - "step": 5144 - }, - { - "epoch": 0.63, - "learning_rate": 0.0003, - "loss": 0.2909, - "step": 5145 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2802, - "step": 5146 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2997, - "step": 5147 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.287, - "step": 5148 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2763, - "step": 5149 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2783, - "step": 5150 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2786, - "step": 5151 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2982, - "step": 5152 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2639, - "step": 5153 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.269, - "step": 5154 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.309, - "step": 5155 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2687, - "step": 5156 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.278, - "step": 5157 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2852, - "step": 5158 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2836, - "step": 5159 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2759, - "step": 5160 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2875, - "step": 5161 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2731, - "step": 5162 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2738, - "step": 5163 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2853, - "step": 5164 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2919, - "step": 5165 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2845, - "step": 5166 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2882, - "step": 5167 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2696, - "step": 5168 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2845, - "step": 5169 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2685, - "step": 5170 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2903, - "step": 5171 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2887, - "step": 5172 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2657, - "step": 5173 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.29, - "step": 5174 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2807, - "step": 5175 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2883, - "step": 5176 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2933, - "step": 5177 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2817, - "step": 5178 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.282, - "step": 5179 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2674, - "step": 5180 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2645, - "step": 5181 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2941, - "step": 5182 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.3027, - "step": 5183 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2738, - "step": 5184 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2952, - "step": 5185 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2666, - "step": 5186 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2852, - "step": 5187 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2814, - "step": 5188 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2979, - "step": 5189 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2843, - "step": 5190 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2729, - "step": 5191 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2694, - "step": 5192 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2825, - "step": 5193 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2744, - "step": 5194 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2839, - "step": 5195 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2869, - "step": 5196 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2964, - "step": 5197 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2607, - "step": 5198 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.272, - "step": 5199 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2811, - "step": 5200 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2707, - "step": 5201 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2899, - "step": 5202 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2777, - "step": 5203 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2747, - "step": 5204 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2766, - "step": 5205 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2812, - "step": 5206 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2748, - "step": 5207 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2695, - "step": 5208 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2766, - "step": 5209 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2879, - "step": 5210 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2786, - "step": 5211 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2801, - "step": 5212 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.29, - "step": 5213 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2884, - "step": 5214 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.3029, - "step": 5215 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2716, - "step": 5216 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2675, - "step": 5217 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2898, - "step": 5218 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2936, - "step": 5219 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2904, - "step": 5220 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2897, - "step": 5221 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2766, - "step": 5222 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2791, - "step": 5223 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.291, - "step": 5224 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2831, - "step": 5225 - }, - { - "epoch": 0.64, - "learning_rate": 0.0003, - "loss": 0.2745, - "step": 5226 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2756, - "step": 5227 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2756, - "step": 5228 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2611, - "step": 5229 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2759, - "step": 5230 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.28, - "step": 5231 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2695, - "step": 5232 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2893, - "step": 5233 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2846, - "step": 5234 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2731, - "step": 5235 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2901, - "step": 5236 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2572, - "step": 5237 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2595, - "step": 5238 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2774, - "step": 5239 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.274, - "step": 5240 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2853, - "step": 5241 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2878, - "step": 5242 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2796, - "step": 5243 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2737, - "step": 5244 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2931, - "step": 5245 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2776, - "step": 5246 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2862, - "step": 5247 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2678, - "step": 5248 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2751, - "step": 5249 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2807, - "step": 5250 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2887, - "step": 5251 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2779, - "step": 5252 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2771, - "step": 5253 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2872, - "step": 5254 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2721, - "step": 5255 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2873, - "step": 5256 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2772, - "step": 5257 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2828, - "step": 5258 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2661, - "step": 5259 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2733, - "step": 5260 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2798, - "step": 5261 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2825, - "step": 5262 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2819, - "step": 5263 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2858, - "step": 5264 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.287, - "step": 5265 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2757, - "step": 5266 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2788, - "step": 5267 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.3023, - "step": 5268 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2781, - "step": 5269 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2834, - "step": 5270 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2773, - "step": 5271 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2752, - "step": 5272 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2741, - "step": 5273 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2833, - "step": 5274 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.294, - "step": 5275 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2905, - "step": 5276 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.286, - "step": 5277 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2809, - "step": 5278 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2814, - "step": 5279 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.269, - "step": 5280 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.282, - "step": 5281 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.277, - "step": 5282 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2908, - "step": 5283 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2911, - "step": 5284 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2738, - "step": 5285 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2734, - "step": 5286 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2943, - "step": 5287 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2765, - "step": 5288 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2613, - "step": 5289 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.289, - "step": 5290 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2656, - "step": 5291 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2835, - "step": 5292 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2851, - "step": 5293 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2635, - "step": 5294 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2783, - "step": 5295 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2714, - "step": 5296 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2863, - "step": 5297 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2586, - "step": 5298 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2889, - "step": 5299 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2805, - "step": 5300 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2691, - "step": 5301 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2849, - "step": 5302 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2731, - "step": 5303 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2678, - "step": 5304 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2728, - "step": 5305 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2806, - "step": 5306 - }, - { - "epoch": 0.65, - "learning_rate": 0.0003, - "loss": 0.2884, - "step": 5307 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2922, - "step": 5308 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2862, - "step": 5309 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2983, - "step": 5310 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2937, - "step": 5311 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2751, - "step": 5312 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.275, - "step": 5313 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2652, - "step": 5314 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2772, - "step": 5315 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.265, - "step": 5316 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2711, - "step": 5317 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.269, - "step": 5318 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.27, - "step": 5319 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.266, - "step": 5320 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2548, - "step": 5321 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2752, - "step": 5322 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2752, - "step": 5323 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2703, - "step": 5324 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2648, - "step": 5325 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2832, - "step": 5326 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2782, - "step": 5327 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2817, - "step": 5328 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2727, - "step": 5329 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2896, - "step": 5330 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2868, - "step": 5331 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.287, - "step": 5332 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2847, - "step": 5333 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2767, - "step": 5334 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2917, - "step": 5335 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2626, - "step": 5336 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2831, - "step": 5337 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2652, - "step": 5338 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2818, - "step": 5339 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2711, - "step": 5340 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2811, - "step": 5341 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2651, - "step": 5342 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2957, - "step": 5343 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.3122, - "step": 5344 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2514, - "step": 5345 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2627, - "step": 5346 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2892, - "step": 5347 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2796, - "step": 5348 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2784, - "step": 5349 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2613, - "step": 5350 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2935, - "step": 5351 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2636, - "step": 5352 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2834, - "step": 5353 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2823, - "step": 5354 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2698, - "step": 5355 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2879, - "step": 5356 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.295, - "step": 5357 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2866, - "step": 5358 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2771, - "step": 5359 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2783, - "step": 5360 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2811, - "step": 5361 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2879, - "step": 5362 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2767, - "step": 5363 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2701, - "step": 5364 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2752, - "step": 5365 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2663, - "step": 5366 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2713, - "step": 5367 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2599, - "step": 5368 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2774, - "step": 5369 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2631, - "step": 5370 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2764, - "step": 5371 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2815, - "step": 5372 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2674, - "step": 5373 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2828, - "step": 5374 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2704, - "step": 5375 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2696, - "step": 5376 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2578, - "step": 5377 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2566, - "step": 5378 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2711, - "step": 5379 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2836, - "step": 5380 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2761, - "step": 5381 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2716, - "step": 5382 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2791, - "step": 5383 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.287, - "step": 5384 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2905, - "step": 5385 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2696, - "step": 5386 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.259, - "step": 5387 - }, - { - "epoch": 0.66, - "learning_rate": 0.0003, - "loss": 0.2759, - "step": 5388 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2995, - "step": 5389 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2923, - "step": 5390 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2765, - "step": 5391 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2937, - "step": 5392 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2847, - "step": 5393 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2725, - "step": 5394 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2779, - "step": 5395 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2664, - "step": 5396 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2928, - "step": 5397 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2889, - "step": 5398 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.269, - "step": 5399 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2731, - "step": 5400 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2656, - "step": 5401 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2793, - "step": 5402 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2727, - "step": 5403 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2632, - "step": 5404 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2711, - "step": 5405 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2775, - "step": 5406 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.271, - "step": 5407 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2687, - "step": 5408 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2898, - "step": 5409 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.266, - "step": 5410 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2717, - "step": 5411 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2794, - "step": 5412 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2754, - "step": 5413 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2955, - "step": 5414 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2948, - "step": 5415 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.296, - "step": 5416 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2899, - "step": 5417 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2926, - "step": 5418 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2817, - "step": 5419 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2799, - "step": 5420 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2813, - "step": 5421 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2928, - "step": 5422 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2838, - "step": 5423 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2736, - "step": 5424 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2716, - "step": 5425 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2709, - "step": 5426 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2942, - "step": 5427 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2764, - "step": 5428 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2751, - "step": 5429 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2739, - "step": 5430 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2868, - "step": 5431 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.278, - "step": 5432 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2875, - "step": 5433 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2829, - "step": 5434 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2567, - "step": 5435 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2751, - "step": 5436 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2811, - "step": 5437 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2618, - "step": 5438 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2811, - "step": 5439 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.276, - "step": 5440 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2814, - "step": 5441 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2843, - "step": 5442 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2826, - "step": 5443 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2826, - "step": 5444 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2687, - "step": 5445 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2632, - "step": 5446 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.265, - "step": 5447 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2837, - "step": 5448 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2761, - "step": 5449 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2626, - "step": 5450 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2646, - "step": 5451 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2955, - "step": 5452 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2591, - "step": 5453 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2887, - "step": 5454 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2743, - "step": 5455 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2598, - "step": 5456 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2689, - "step": 5457 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2777, - "step": 5458 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.288, - "step": 5459 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2781, - "step": 5460 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2891, - "step": 5461 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2921, - "step": 5462 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2759, - "step": 5463 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2587, - "step": 5464 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2769, - "step": 5465 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2715, - "step": 5466 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2829, - "step": 5467 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2845, - "step": 5468 - }, - { - "epoch": 0.67, - "learning_rate": 0.0003, - "loss": 0.2819, - "step": 5469 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2693, - "step": 5470 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2841, - "step": 5471 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2772, - "step": 5472 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2803, - "step": 5473 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2666, - "step": 5474 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2746, - "step": 5475 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2545, - "step": 5476 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2794, - "step": 5477 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2622, - "step": 5478 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2928, - "step": 5479 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2794, - "step": 5480 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2956, - "step": 5481 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.283, - "step": 5482 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2838, - "step": 5483 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2821, - "step": 5484 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2895, - "step": 5485 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2751, - "step": 5486 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2729, - "step": 5487 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2689, - "step": 5488 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.268, - "step": 5489 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2813, - "step": 5490 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2783, - "step": 5491 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2758, - "step": 5492 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2836, - "step": 5493 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2781, - "step": 5494 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2593, - "step": 5495 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.291, - "step": 5496 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2897, - "step": 5497 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2694, - "step": 5498 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2818, - "step": 5499 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2772, - "step": 5500 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2801, - "step": 5501 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2839, - "step": 5502 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.267, - "step": 5503 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.276, - "step": 5504 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2834, - "step": 5505 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2842, - "step": 5506 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2617, - "step": 5507 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.26, - "step": 5508 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2832, - "step": 5509 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2824, - "step": 5510 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2799, - "step": 5511 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2881, - "step": 5512 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.26, - "step": 5513 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2552, - "step": 5514 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2838, - "step": 5515 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2726, - "step": 5516 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2835, - "step": 5517 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2852, - "step": 5518 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2817, - "step": 5519 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2889, - "step": 5520 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2754, - "step": 5521 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2856, - "step": 5522 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2752, - "step": 5523 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2697, - "step": 5524 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2852, - "step": 5525 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.27, - "step": 5526 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2757, - "step": 5527 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2619, - "step": 5528 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2669, - "step": 5529 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2835, - "step": 5530 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.284, - "step": 5531 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.287, - "step": 5532 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2719, - "step": 5533 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.285, - "step": 5534 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.269, - "step": 5535 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2549, - "step": 5536 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2852, - "step": 5537 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2762, - "step": 5538 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2841, - "step": 5539 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.285, - "step": 5540 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2668, - "step": 5541 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2773, - "step": 5542 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2756, - "step": 5543 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2752, - "step": 5544 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.282, - "step": 5545 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2804, - "step": 5546 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2993, - "step": 5547 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.279, - "step": 5548 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.2838, - "step": 5549 - }, - { - "epoch": 0.68, - "learning_rate": 0.0003, - "loss": 0.269, - "step": 5550 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2807, - "step": 5551 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.3014, - "step": 5552 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2592, - "step": 5553 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2663, - "step": 5554 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2859, - "step": 5555 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.276, - "step": 5556 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2643, - "step": 5557 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2788, - "step": 5558 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2656, - "step": 5559 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2589, - "step": 5560 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2715, - "step": 5561 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2724, - "step": 5562 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2869, - "step": 5563 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2727, - "step": 5564 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2907, - "step": 5565 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2632, - "step": 5566 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2793, - "step": 5567 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2725, - "step": 5568 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2669, - "step": 5569 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2743, - "step": 5570 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2795, - "step": 5571 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2782, - "step": 5572 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2759, - "step": 5573 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2834, - "step": 5574 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.268, - "step": 5575 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2937, - "step": 5576 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2759, - "step": 5577 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2821, - "step": 5578 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2531, - "step": 5579 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2894, - "step": 5580 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2925, - "step": 5581 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2689, - "step": 5582 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2781, - "step": 5583 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2725, - "step": 5584 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2839, - "step": 5585 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2861, - "step": 5586 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2726, - "step": 5587 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2726, - "step": 5588 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2851, - "step": 5589 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2701, - "step": 5590 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2754, - "step": 5591 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2924, - "step": 5592 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2804, - "step": 5593 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2902, - "step": 5594 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.288, - "step": 5595 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2774, - "step": 5596 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2652, - "step": 5597 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2804, - "step": 5598 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2676, - "step": 5599 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2712, - "step": 5600 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2754, - "step": 5601 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2761, - "step": 5602 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2632, - "step": 5603 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2817, - "step": 5604 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2719, - "step": 5605 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.284, - "step": 5606 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2712, - "step": 5607 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2655, - "step": 5608 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2811, - "step": 5609 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2924, - "step": 5610 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2744, - "step": 5611 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2692, - "step": 5612 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2822, - "step": 5613 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2728, - "step": 5614 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2782, - "step": 5615 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2778, - "step": 5616 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2703, - "step": 5617 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2784, - "step": 5618 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2713, - "step": 5619 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.3006, - "step": 5620 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2765, - "step": 5621 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2619, - "step": 5622 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2745, - "step": 5623 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2719, - "step": 5624 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2855, - "step": 5625 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2645, - "step": 5626 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2681, - "step": 5627 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2534, - "step": 5628 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2801, - "step": 5629 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2944, - "step": 5630 - }, - { - "epoch": 0.69, - "learning_rate": 0.0003, - "loss": 0.2779, - "step": 5631 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2943, - "step": 5632 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2803, - "step": 5633 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2897, - "step": 5634 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2856, - "step": 5635 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2713, - "step": 5636 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2854, - "step": 5637 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2748, - "step": 5638 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2611, - "step": 5639 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2829, - "step": 5640 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.283, - "step": 5641 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2577, - "step": 5642 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2559, - "step": 5643 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.275, - "step": 5644 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2659, - "step": 5645 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2842, - "step": 5646 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2791, - "step": 5647 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2804, - "step": 5648 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2672, - "step": 5649 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2836, - "step": 5650 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2559, - "step": 5651 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2857, - "step": 5652 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2704, - "step": 5653 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2848, - "step": 5654 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.278, - "step": 5655 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2736, - "step": 5656 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2728, - "step": 5657 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2713, - "step": 5658 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2589, - "step": 5659 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2712, - "step": 5660 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.274, - "step": 5661 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2711, - "step": 5662 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.3011, - "step": 5663 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2865, - "step": 5664 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2563, - "step": 5665 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2903, - "step": 5666 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2658, - "step": 5667 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2769, - "step": 5668 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2765, - "step": 5669 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.308, - "step": 5670 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2736, - "step": 5671 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2761, - "step": 5672 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2722, - "step": 5673 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2751, - "step": 5674 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2722, - "step": 5675 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2705, - "step": 5676 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2736, - "step": 5677 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2749, - "step": 5678 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2763, - "step": 5679 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2673, - "step": 5680 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2721, - "step": 5681 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2785, - "step": 5682 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2748, - "step": 5683 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2898, - "step": 5684 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2815, - "step": 5685 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2618, - "step": 5686 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2784, - "step": 5687 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2731, - "step": 5688 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2983, - "step": 5689 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2966, - "step": 5690 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2951, - "step": 5691 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2735, - "step": 5692 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2592, - "step": 5693 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2692, - "step": 5694 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2609, - "step": 5695 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2823, - "step": 5696 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2772, - "step": 5697 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2746, - "step": 5698 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2832, - "step": 5699 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2745, - "step": 5700 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2792, - "step": 5701 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2584, - "step": 5702 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2742, - "step": 5703 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2678, - "step": 5704 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2601, - "step": 5705 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2615, - "step": 5706 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2899, - "step": 5707 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.3027, - "step": 5708 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.265, - "step": 5709 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2736, - "step": 5710 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2834, - "step": 5711 - }, - { - "epoch": 0.7, - "learning_rate": 0.0003, - "loss": 0.2846, - "step": 5712 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2509, - "step": 5713 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2645, - "step": 5714 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2745, - "step": 5715 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2762, - "step": 5716 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.279, - "step": 5717 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2673, - "step": 5718 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2695, - "step": 5719 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.258, - "step": 5720 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2616, - "step": 5721 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2695, - "step": 5722 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2732, - "step": 5723 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.268, - "step": 5724 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.273, - "step": 5725 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2678, - "step": 5726 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2629, - "step": 5727 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2733, - "step": 5728 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2815, - "step": 5729 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2635, - "step": 5730 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2746, - "step": 5731 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2828, - "step": 5732 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2715, - "step": 5733 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2689, - "step": 5734 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.265, - "step": 5735 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.272, - "step": 5736 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2719, - "step": 5737 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2565, - "step": 5738 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2631, - "step": 5739 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2594, - "step": 5740 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2876, - "step": 5741 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2818, - "step": 5742 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2818, - "step": 5743 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2556, - "step": 5744 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2832, - "step": 5745 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.274, - "step": 5746 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.286, - "step": 5747 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2509, - "step": 5748 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2681, - "step": 5749 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2759, - "step": 5750 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.269, - "step": 5751 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.278, - "step": 5752 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2731, - "step": 5753 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2863, - "step": 5754 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2657, - "step": 5755 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2901, - "step": 5756 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2675, - "step": 5757 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.287, - "step": 5758 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2757, - "step": 5759 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2791, - "step": 5760 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2728, - "step": 5761 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2647, - "step": 5762 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2866, - "step": 5763 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2721, - "step": 5764 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2756, - "step": 5765 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2848, - "step": 5766 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2761, - "step": 5767 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2812, - "step": 5768 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2696, - "step": 5769 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2782, - "step": 5770 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2843, - "step": 5771 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2731, - "step": 5772 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.274, - "step": 5773 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2809, - "step": 5774 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2596, - "step": 5775 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2784, - "step": 5776 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2808, - "step": 5777 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2992, - "step": 5778 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2562, - "step": 5779 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2666, - "step": 5780 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2941, - "step": 5781 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2827, - "step": 5782 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2697, - "step": 5783 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2586, - "step": 5784 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2685, - "step": 5785 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2527, - "step": 5786 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2717, - "step": 5787 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2737, - "step": 5788 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2774, - "step": 5789 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2875, - "step": 5790 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2818, - "step": 5791 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2812, - "step": 5792 - }, - { - "epoch": 0.71, - "learning_rate": 0.0003, - "loss": 0.2733, - "step": 5793 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2711, - "step": 5794 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2624, - "step": 5795 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2611, - "step": 5796 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.289, - "step": 5797 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.265, - "step": 5798 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2674, - "step": 5799 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2894, - "step": 5800 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2709, - "step": 5801 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2783, - "step": 5802 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2787, - "step": 5803 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2665, - "step": 5804 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2717, - "step": 5805 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.253, - "step": 5806 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2636, - "step": 5807 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2805, - "step": 5808 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2893, - "step": 5809 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2784, - "step": 5810 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2759, - "step": 5811 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.288, - "step": 5812 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2812, - "step": 5813 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2718, - "step": 5814 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2719, - "step": 5815 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2698, - "step": 5816 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2813, - "step": 5817 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2745, - "step": 5818 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2721, - "step": 5819 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2662, - "step": 5820 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2673, - "step": 5821 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2625, - "step": 5822 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2813, - "step": 5823 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2819, - "step": 5824 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2697, - "step": 5825 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2747, - "step": 5826 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2784, - "step": 5827 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2827, - "step": 5828 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2701, - "step": 5829 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2732, - "step": 5830 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2759, - "step": 5831 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2607, - "step": 5832 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.268, - "step": 5833 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.251, - "step": 5834 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2797, - "step": 5835 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2685, - "step": 5836 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2837, - "step": 5837 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.26, - "step": 5838 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2697, - "step": 5839 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2585, - "step": 5840 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2696, - "step": 5841 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2899, - "step": 5842 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2735, - "step": 5843 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2736, - "step": 5844 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2669, - "step": 5845 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2601, - "step": 5846 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2839, - "step": 5847 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2784, - "step": 5848 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.265, - "step": 5849 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2651, - "step": 5850 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2864, - "step": 5851 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.288, - "step": 5852 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2792, - "step": 5853 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.267, - "step": 5854 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2697, - "step": 5855 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2707, - "step": 5856 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.283, - "step": 5857 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2804, - "step": 5858 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2784, - "step": 5859 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2893, - "step": 5860 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2777, - "step": 5861 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2826, - "step": 5862 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2833, - "step": 5863 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2659, - "step": 5864 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2714, - "step": 5865 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2758, - "step": 5866 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2706, - "step": 5867 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2704, - "step": 5868 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2595, - "step": 5869 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2764, - "step": 5870 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2597, - "step": 5871 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2782, - "step": 5872 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.274, - "step": 5873 - }, - { - "epoch": 0.72, - "learning_rate": 0.0003, - "loss": 0.2638, - "step": 5874 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.267, - "step": 5875 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2748, - "step": 5876 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.272, - "step": 5877 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.282, - "step": 5878 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2793, - "step": 5879 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2606, - "step": 5880 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2766, - "step": 5881 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2726, - "step": 5882 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2575, - "step": 5883 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2699, - "step": 5884 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2838, - "step": 5885 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2809, - "step": 5886 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2754, - "step": 5887 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2609, - "step": 5888 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2597, - "step": 5889 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2863, - "step": 5890 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2839, - "step": 5891 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2654, - "step": 5892 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.25, - "step": 5893 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2769, - "step": 5894 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2871, - "step": 5895 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2682, - "step": 5896 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2845, - "step": 5897 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2778, - "step": 5898 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2755, - "step": 5899 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2681, - "step": 5900 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2784, - "step": 5901 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2772, - "step": 5902 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2804, - "step": 5903 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.267, - "step": 5904 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2784, - "step": 5905 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2825, - "step": 5906 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.289, - "step": 5907 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2742, - "step": 5908 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2655, - "step": 5909 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2904, - "step": 5910 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2609, - "step": 5911 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2817, - "step": 5912 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2704, - "step": 5913 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2712, - "step": 5914 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2601, - "step": 5915 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2722, - "step": 5916 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2618, - "step": 5917 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2768, - "step": 5918 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2802, - "step": 5919 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2936, - "step": 5920 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2644, - "step": 5921 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2655, - "step": 5922 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2708, - "step": 5923 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2711, - "step": 5924 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2728, - "step": 5925 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2896, - "step": 5926 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2784, - "step": 5927 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2561, - "step": 5928 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2788, - "step": 5929 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2782, - "step": 5930 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2582, - "step": 5931 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2765, - "step": 5932 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2702, - "step": 5933 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2538, - "step": 5934 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2677, - "step": 5935 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2761, - "step": 5936 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.249, - "step": 5937 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2582, - "step": 5938 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.267, - "step": 5939 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.275, - "step": 5940 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2569, - "step": 5941 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2754, - "step": 5942 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2707, - "step": 5943 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2784, - "step": 5944 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2661, - "step": 5945 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2797, - "step": 5946 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2732, - "step": 5947 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2821, - "step": 5948 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2895, - "step": 5949 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.276, - "step": 5950 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2737, - "step": 5951 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2825, - "step": 5952 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2736, - "step": 5953 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2723, - "step": 5954 - }, - { - "epoch": 0.73, - "learning_rate": 0.0003, - "loss": 0.2581, - "step": 5955 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2741, - "step": 5956 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2975, - "step": 5957 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2673, - "step": 5958 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2747, - "step": 5959 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2654, - "step": 5960 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2801, - "step": 5961 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.265, - "step": 5962 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2659, - "step": 5963 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2853, - "step": 5964 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.268, - "step": 5965 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2626, - "step": 5966 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2806, - "step": 5967 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2735, - "step": 5968 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2735, - "step": 5969 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2738, - "step": 5970 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2643, - "step": 5971 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2522, - "step": 5972 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2692, - "step": 5973 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2736, - "step": 5974 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2695, - "step": 5975 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2716, - "step": 5976 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2646, - "step": 5977 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2918, - "step": 5978 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2893, - "step": 5979 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2656, - "step": 5980 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2524, - "step": 5981 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2764, - "step": 5982 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2843, - "step": 5983 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.287, - "step": 5984 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2673, - "step": 5985 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2703, - "step": 5986 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.267, - "step": 5987 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2635, - "step": 5988 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2717, - "step": 5989 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2544, - "step": 5990 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2712, - "step": 5991 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.267, - "step": 5992 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2646, - "step": 5993 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2854, - "step": 5994 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2715, - "step": 5995 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2689, - "step": 5996 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2735, - "step": 5997 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2653, - "step": 5998 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2677, - "step": 5999 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.281, - "step": 6000 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2886, - "step": 6001 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2921, - "step": 6002 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2656, - "step": 6003 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2457, - "step": 6004 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2701, - "step": 6005 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2574, - "step": 6006 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.249, - "step": 6007 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2681, - "step": 6008 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.278, - "step": 6009 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2801, - "step": 6010 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.262, - "step": 6011 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2581, - "step": 6012 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2794, - "step": 6013 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2769, - "step": 6014 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2761, - "step": 6015 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2723, - "step": 6016 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2668, - "step": 6017 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2735, - "step": 6018 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2911, - "step": 6019 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2739, - "step": 6020 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2725, - "step": 6021 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2944, - "step": 6022 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2683, - "step": 6023 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2507, - "step": 6024 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2635, - "step": 6025 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2795, - "step": 6026 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.286, - "step": 6027 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2759, - "step": 6028 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2645, - "step": 6029 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2714, - "step": 6030 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2854, - "step": 6031 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2646, - "step": 6032 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2778, - "step": 6033 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2623, - "step": 6034 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2882, - "step": 6035 - }, - { - "epoch": 0.74, - "learning_rate": 0.0003, - "loss": 0.2674, - "step": 6036 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2855, - "step": 6037 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2612, - "step": 6038 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2798, - "step": 6039 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.273, - "step": 6040 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2811, - "step": 6041 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2824, - "step": 6042 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2763, - "step": 6043 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2691, - "step": 6044 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2648, - "step": 6045 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2667, - "step": 6046 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2699, - "step": 6047 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2778, - "step": 6048 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2683, - "step": 6049 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2715, - "step": 6050 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.256, - "step": 6051 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2695, - "step": 6052 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2757, - "step": 6053 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2642, - "step": 6054 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2783, - "step": 6055 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2868, - "step": 6056 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2881, - "step": 6057 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2696, - "step": 6058 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2837, - "step": 6059 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2652, - "step": 6060 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2652, - "step": 6061 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2819, - "step": 6062 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.263, - "step": 6063 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2697, - "step": 6064 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2843, - "step": 6065 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2667, - "step": 6066 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2635, - "step": 6067 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.259, - "step": 6068 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2748, - "step": 6069 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2684, - "step": 6070 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2807, - "step": 6071 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2628, - "step": 6072 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.262, - "step": 6073 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2807, - "step": 6074 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2899, - "step": 6075 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2752, - "step": 6076 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2667, - "step": 6077 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2898, - "step": 6078 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2779, - "step": 6079 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2743, - "step": 6080 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.269, - "step": 6081 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2776, - "step": 6082 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2741, - "step": 6083 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2714, - "step": 6084 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.269, - "step": 6085 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2685, - "step": 6086 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2693, - "step": 6087 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2636, - "step": 6088 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2641, - "step": 6089 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2792, - "step": 6090 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2813, - "step": 6091 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2619, - "step": 6092 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2688, - "step": 6093 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2645, - "step": 6094 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2594, - "step": 6095 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2546, - "step": 6096 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.265, - "step": 6097 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2733, - "step": 6098 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2549, - "step": 6099 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2594, - "step": 6100 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2615, - "step": 6101 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2606, - "step": 6102 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2653, - "step": 6103 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2849, - "step": 6104 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2545, - "step": 6105 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2755, - "step": 6106 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2643, - "step": 6107 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2701, - "step": 6108 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2621, - "step": 6109 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2675, - "step": 6110 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2622, - "step": 6111 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2648, - "step": 6112 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2728, - "step": 6113 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2675, - "step": 6114 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2773, - "step": 6115 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2701, - "step": 6116 - }, - { - "epoch": 0.75, - "learning_rate": 0.0003, - "loss": 0.2749, - "step": 6117 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2582, - "step": 6118 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2686, - "step": 6119 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2725, - "step": 6120 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2614, - "step": 6121 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2667, - "step": 6122 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2786, - "step": 6123 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2668, - "step": 6124 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2584, - "step": 6125 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2622, - "step": 6126 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2803, - "step": 6127 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2764, - "step": 6128 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2964, - "step": 6129 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2837, - "step": 6130 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2649, - "step": 6131 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2719, - "step": 6132 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2819, - "step": 6133 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2883, - "step": 6134 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2649, - "step": 6135 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2689, - "step": 6136 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2743, - "step": 6137 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2777, - "step": 6138 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2681, - "step": 6139 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2697, - "step": 6140 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2769, - "step": 6141 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2447, - "step": 6142 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2808, - "step": 6143 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2664, - "step": 6144 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2671, - "step": 6145 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2669, - "step": 6146 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2634, - "step": 6147 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2611, - "step": 6148 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2636, - "step": 6149 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2849, - "step": 6150 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2618, - "step": 6151 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2729, - "step": 6152 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2733, - "step": 6153 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2655, - "step": 6154 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2727, - "step": 6155 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2726, - "step": 6156 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2618, - "step": 6157 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2795, - "step": 6158 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2677, - "step": 6159 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2714, - "step": 6160 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2782, - "step": 6161 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2735, - "step": 6162 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2766, - "step": 6163 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2731, - "step": 6164 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2698, - "step": 6165 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2509, - "step": 6166 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2811, - "step": 6167 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.262, - "step": 6168 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2685, - "step": 6169 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2632, - "step": 6170 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2782, - "step": 6171 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2744, - "step": 6172 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.272, - "step": 6173 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2588, - "step": 6174 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2814, - "step": 6175 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2722, - "step": 6176 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2682, - "step": 6177 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2671, - "step": 6178 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2529, - "step": 6179 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2821, - "step": 6180 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2707, - "step": 6181 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2674, - "step": 6182 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.279, - "step": 6183 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2704, - "step": 6184 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.28, - "step": 6185 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2472, - "step": 6186 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2666, - "step": 6187 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2592, - "step": 6188 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2727, - "step": 6189 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2721, - "step": 6190 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2704, - "step": 6191 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2944, - "step": 6192 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2607, - "step": 6193 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.245, - "step": 6194 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2581, - "step": 6195 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2597, - "step": 6196 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2709, - "step": 6197 - }, - { - "epoch": 0.76, - "learning_rate": 0.0003, - "loss": 0.2655, - "step": 6198 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2885, - "step": 6199 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.255, - "step": 6200 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2562, - "step": 6201 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2672, - "step": 6202 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2526, - "step": 6203 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2611, - "step": 6204 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.261, - "step": 6205 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2833, - "step": 6206 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2684, - "step": 6207 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2797, - "step": 6208 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2621, - "step": 6209 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2714, - "step": 6210 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2658, - "step": 6211 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2804, - "step": 6212 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2595, - "step": 6213 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.267, - "step": 6214 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2535, - "step": 6215 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2653, - "step": 6216 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2536, - "step": 6217 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2777, - "step": 6218 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2699, - "step": 6219 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2751, - "step": 6220 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2564, - "step": 6221 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2449, - "step": 6222 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.27, - "step": 6223 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2728, - "step": 6224 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2652, - "step": 6225 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2747, - "step": 6226 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2554, - "step": 6227 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2781, - "step": 6228 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2604, - "step": 6229 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2755, - "step": 6230 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2651, - "step": 6231 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2681, - "step": 6232 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2724, - "step": 6233 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2804, - "step": 6234 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2512, - "step": 6235 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2632, - "step": 6236 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2694, - "step": 6237 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2738, - "step": 6238 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2696, - "step": 6239 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2567, - "step": 6240 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2594, - "step": 6241 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.265, - "step": 6242 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2707, - "step": 6243 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2569, - "step": 6244 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.268, - "step": 6245 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2666, - "step": 6246 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2592, - "step": 6247 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2587, - "step": 6248 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2377, - "step": 6249 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2722, - "step": 6250 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2617, - "step": 6251 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2736, - "step": 6252 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.277, - "step": 6253 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2819, - "step": 6254 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2769, - "step": 6255 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2507, - "step": 6256 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2746, - "step": 6257 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2654, - "step": 6258 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.258, - "step": 6259 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.269, - "step": 6260 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2716, - "step": 6261 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2633, - "step": 6262 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2718, - "step": 6263 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2396, - "step": 6264 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.259, - "step": 6265 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2589, - "step": 6266 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2696, - "step": 6267 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2686, - "step": 6268 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2683, - "step": 6269 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2673, - "step": 6270 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2664, - "step": 6271 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2734, - "step": 6272 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2839, - "step": 6273 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2631, - "step": 6274 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2652, - "step": 6275 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.276, - "step": 6276 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2543, - "step": 6277 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2811, - "step": 6278 - }, - { - "epoch": 0.77, - "learning_rate": 0.0003, - "loss": 0.2504, - "step": 6279 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2683, - "step": 6280 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2534, - "step": 6281 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2783, - "step": 6282 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2841, - "step": 6283 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2619, - "step": 6284 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.287, - "step": 6285 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2875, - "step": 6286 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.269, - "step": 6287 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2606, - "step": 6288 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2647, - "step": 6289 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2593, - "step": 6290 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2677, - "step": 6291 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2558, - "step": 6292 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2599, - "step": 6293 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2672, - "step": 6294 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.272, - "step": 6295 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2684, - "step": 6296 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2644, - "step": 6297 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2844, - "step": 6298 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2759, - "step": 6299 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2764, - "step": 6300 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2633, - "step": 6301 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2761, - "step": 6302 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.288, - "step": 6303 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2594, - "step": 6304 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2836, - "step": 6305 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.262, - "step": 6306 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2727, - "step": 6307 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2883, - "step": 6308 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2691, - "step": 6309 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2573, - "step": 6310 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2741, - "step": 6311 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2843, - "step": 6312 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2674, - "step": 6313 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2765, - "step": 6314 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2634, - "step": 6315 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2637, - "step": 6316 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2634, - "step": 6317 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2727, - "step": 6318 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2708, - "step": 6319 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2818, - "step": 6320 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2647, - "step": 6321 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2713, - "step": 6322 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2637, - "step": 6323 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2702, - "step": 6324 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2724, - "step": 6325 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2687, - "step": 6326 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2701, - "step": 6327 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2773, - "step": 6328 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2539, - "step": 6329 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2674, - "step": 6330 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2604, - "step": 6331 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2646, - "step": 6332 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2551, - "step": 6333 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2714, - "step": 6334 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2696, - "step": 6335 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2468, - "step": 6336 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2588, - "step": 6337 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2538, - "step": 6338 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2583, - "step": 6339 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2668, - "step": 6340 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2716, - "step": 6341 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2634, - "step": 6342 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2755, - "step": 6343 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2719, - "step": 6344 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2743, - "step": 6345 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2649, - "step": 6346 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2561, - "step": 6347 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2783, - "step": 6348 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2704, - "step": 6349 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2738, - "step": 6350 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.259, - "step": 6351 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2749, - "step": 6352 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2809, - "step": 6353 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2806, - "step": 6354 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2732, - "step": 6355 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2806, - "step": 6356 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2815, - "step": 6357 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.257, - "step": 6358 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2574, - "step": 6359 - }, - { - "epoch": 0.78, - "learning_rate": 0.0003, - "loss": 0.2549, - "step": 6360 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2885, - "step": 6361 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2658, - "step": 6362 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2527, - "step": 6363 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2636, - "step": 6364 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2714, - "step": 6365 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2656, - "step": 6366 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2662, - "step": 6367 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2709, - "step": 6368 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2735, - "step": 6369 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2695, - "step": 6370 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.26, - "step": 6371 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2647, - "step": 6372 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2625, - "step": 6373 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2745, - "step": 6374 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2714, - "step": 6375 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2593, - "step": 6376 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2737, - "step": 6377 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2515, - "step": 6378 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2687, - "step": 6379 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.259, - "step": 6380 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2547, - "step": 6381 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2669, - "step": 6382 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.268, - "step": 6383 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2765, - "step": 6384 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2717, - "step": 6385 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2676, - "step": 6386 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2564, - "step": 6387 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2698, - "step": 6388 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2616, - "step": 6389 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2653, - "step": 6390 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2716, - "step": 6391 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.265, - "step": 6392 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2685, - "step": 6393 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2599, - "step": 6394 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2617, - "step": 6395 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2633, - "step": 6396 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2739, - "step": 6397 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.3072, - "step": 6398 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2671, - "step": 6399 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2666, - "step": 6400 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2471, - "step": 6401 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.259, - "step": 6402 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2623, - "step": 6403 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2625, - "step": 6404 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2665, - "step": 6405 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2927, - "step": 6406 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2684, - "step": 6407 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2828, - "step": 6408 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2653, - "step": 6409 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2717, - "step": 6410 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2472, - "step": 6411 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2658, - "step": 6412 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2787, - "step": 6413 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2649, - "step": 6414 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.269, - "step": 6415 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2533, - "step": 6416 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2519, - "step": 6417 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2775, - "step": 6418 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2775, - "step": 6419 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2844, - "step": 6420 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2444, - "step": 6421 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2465, - "step": 6422 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2669, - "step": 6423 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2714, - "step": 6424 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2564, - "step": 6425 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.274, - "step": 6426 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2725, - "step": 6427 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.26, - "step": 6428 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2759, - "step": 6429 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2473, - "step": 6430 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2553, - "step": 6431 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2503, - "step": 6432 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2516, - "step": 6433 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2895, - "step": 6434 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2528, - "step": 6435 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2567, - "step": 6436 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.263, - "step": 6437 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2617, - "step": 6438 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2582, - "step": 6439 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2554, - "step": 6440 - }, - { - "epoch": 0.79, - "learning_rate": 0.0003, - "loss": 0.2581, - "step": 6441 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2602, - "step": 6442 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.286, - "step": 6443 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2675, - "step": 6444 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2733, - "step": 6445 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2705, - "step": 6446 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2846, - "step": 6447 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2581, - "step": 6448 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2622, - "step": 6449 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2826, - "step": 6450 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2748, - "step": 6451 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2649, - "step": 6452 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2807, - "step": 6453 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2602, - "step": 6454 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2639, - "step": 6455 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.296, - "step": 6456 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2569, - "step": 6457 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2803, - "step": 6458 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2558, - "step": 6459 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2528, - "step": 6460 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2761, - "step": 6461 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2688, - "step": 6462 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2643, - "step": 6463 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2734, - "step": 6464 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2659, - "step": 6465 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2814, - "step": 6466 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2588, - "step": 6467 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2664, - "step": 6468 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2684, - "step": 6469 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2769, - "step": 6470 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2696, - "step": 6471 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2607, - "step": 6472 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2671, - "step": 6473 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2665, - "step": 6474 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2742, - "step": 6475 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2585, - "step": 6476 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2736, - "step": 6477 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2641, - "step": 6478 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2664, - "step": 6479 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.265, - "step": 6480 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2615, - "step": 6481 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2607, - "step": 6482 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2688, - "step": 6483 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2653, - "step": 6484 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.265, - "step": 6485 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.283, - "step": 6486 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2505, - "step": 6487 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2526, - "step": 6488 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.269, - "step": 6489 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2597, - "step": 6490 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2612, - "step": 6491 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2574, - "step": 6492 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2512, - "step": 6493 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.26, - "step": 6494 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2574, - "step": 6495 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2612, - "step": 6496 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2615, - "step": 6497 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2722, - "step": 6498 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2713, - "step": 6499 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.278, - "step": 6500 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2779, - "step": 6501 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2656, - "step": 6502 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2565, - "step": 6503 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2732, - "step": 6504 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2709, - "step": 6505 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2662, - "step": 6506 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2528, - "step": 6507 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2697, - "step": 6508 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2482, - "step": 6509 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2585, - "step": 6510 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2649, - "step": 6511 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.274, - "step": 6512 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2612, - "step": 6513 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.277, - "step": 6514 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2665, - "step": 6515 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2645, - "step": 6516 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2573, - "step": 6517 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2799, - "step": 6518 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2742, - "step": 6519 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2649, - "step": 6520 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.2477, - "step": 6521 - }, - { - "epoch": 0.8, - "learning_rate": 0.0003, - "loss": 0.268, - "step": 6522 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2839, - "step": 6523 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.271, - "step": 6524 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2735, - "step": 6525 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2566, - "step": 6526 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2719, - "step": 6527 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2805, - "step": 6528 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2709, - "step": 6529 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2512, - "step": 6530 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2886, - "step": 6531 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2544, - "step": 6532 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2745, - "step": 6533 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2775, - "step": 6534 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2566, - "step": 6535 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2631, - "step": 6536 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2732, - "step": 6537 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2753, - "step": 6538 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2607, - "step": 6539 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2651, - "step": 6540 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2808, - "step": 6541 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2972, - "step": 6542 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2732, - "step": 6543 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2718, - "step": 6544 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2508, - "step": 6545 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2723, - "step": 6546 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2437, - "step": 6547 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2515, - "step": 6548 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.281, - "step": 6549 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2579, - "step": 6550 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.28, - "step": 6551 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2518, - "step": 6552 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2733, - "step": 6553 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2651, - "step": 6554 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.272, - "step": 6555 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2823, - "step": 6556 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2472, - "step": 6557 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2527, - "step": 6558 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2761, - "step": 6559 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2905, - "step": 6560 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2852, - "step": 6561 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2602, - "step": 6562 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2584, - "step": 6563 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2621, - "step": 6564 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2677, - "step": 6565 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2671, - "step": 6566 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.27, - "step": 6567 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2767, - "step": 6568 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2711, - "step": 6569 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2592, - "step": 6570 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2527, - "step": 6571 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2647, - "step": 6572 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2539, - "step": 6573 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2654, - "step": 6574 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2658, - "step": 6575 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.265, - "step": 6576 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2561, - "step": 6577 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.245, - "step": 6578 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2723, - "step": 6579 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2557, - "step": 6580 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2622, - "step": 6581 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2549, - "step": 6582 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2628, - "step": 6583 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2878, - "step": 6584 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.262, - "step": 6585 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2577, - "step": 6586 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2644, - "step": 6587 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2656, - "step": 6588 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2868, - "step": 6589 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2572, - "step": 6590 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2469, - "step": 6591 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2499, - "step": 6592 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2604, - "step": 6593 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2703, - "step": 6594 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2695, - "step": 6595 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2503, - "step": 6596 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2713, - "step": 6597 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2833, - "step": 6598 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2761, - "step": 6599 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2696, - "step": 6600 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.253, - "step": 6601 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.259, - "step": 6602 - }, - { - "epoch": 0.81, - "learning_rate": 0.0003, - "loss": 0.2694, - "step": 6603 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2537, - "step": 6604 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2585, - "step": 6605 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2446, - "step": 6606 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2853, - "step": 6607 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2584, - "step": 6608 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2655, - "step": 6609 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2558, - "step": 6610 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2347, - "step": 6611 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2713, - "step": 6612 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2741, - "step": 6613 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.278, - "step": 6614 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2537, - "step": 6615 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2752, - "step": 6616 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2543, - "step": 6617 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.268, - "step": 6618 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2578, - "step": 6619 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2722, - "step": 6620 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2697, - "step": 6621 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2585, - "step": 6622 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2612, - "step": 6623 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2705, - "step": 6624 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2583, - "step": 6625 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2523, - "step": 6626 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.255, - "step": 6627 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2792, - "step": 6628 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2561, - "step": 6629 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2721, - "step": 6630 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2826, - "step": 6631 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2793, - "step": 6632 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2583, - "step": 6633 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2716, - "step": 6634 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2719, - "step": 6635 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2594, - "step": 6636 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2557, - "step": 6637 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2795, - "step": 6638 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2536, - "step": 6639 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2575, - "step": 6640 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2645, - "step": 6641 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.268, - "step": 6642 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2622, - "step": 6643 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2661, - "step": 6644 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2701, - "step": 6645 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2635, - "step": 6646 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2598, - "step": 6647 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2519, - "step": 6648 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2677, - "step": 6649 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2589, - "step": 6650 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2473, - "step": 6651 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2731, - "step": 6652 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2736, - "step": 6653 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2595, - "step": 6654 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2701, - "step": 6655 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2635, - "step": 6656 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2512, - "step": 6657 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2735, - "step": 6658 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.286, - "step": 6659 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.268, - "step": 6660 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2615, - "step": 6661 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2735, - "step": 6662 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2537, - "step": 6663 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2464, - "step": 6664 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.26, - "step": 6665 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.267, - "step": 6666 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2621, - "step": 6667 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2696, - "step": 6668 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2719, - "step": 6669 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2663, - "step": 6670 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2722, - "step": 6671 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2676, - "step": 6672 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2803, - "step": 6673 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2568, - "step": 6674 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2519, - "step": 6675 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2649, - "step": 6676 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2667, - "step": 6677 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2749, - "step": 6678 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2567, - "step": 6679 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2657, - "step": 6680 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2543, - "step": 6681 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2752, - "step": 6682 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2739, - "step": 6683 - }, - { - "epoch": 0.82, - "learning_rate": 0.0003, - "loss": 0.2654, - "step": 6684 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2694, - "step": 6685 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2849, - "step": 6686 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2628, - "step": 6687 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2853, - "step": 6688 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2588, - "step": 6689 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2767, - "step": 6690 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2629, - "step": 6691 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2586, - "step": 6692 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2692, - "step": 6693 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2769, - "step": 6694 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2671, - "step": 6695 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2558, - "step": 6696 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2778, - "step": 6697 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2524, - "step": 6698 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2607, - "step": 6699 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2615, - "step": 6700 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2782, - "step": 6701 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2436, - "step": 6702 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2627, - "step": 6703 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2544, - "step": 6704 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2713, - "step": 6705 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2585, - "step": 6706 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2514, - "step": 6707 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2462, - "step": 6708 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2584, - "step": 6709 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2662, - "step": 6710 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.255, - "step": 6711 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2677, - "step": 6712 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.285, - "step": 6713 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2654, - "step": 6714 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2564, - "step": 6715 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2685, - "step": 6716 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.257, - "step": 6717 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2822, - "step": 6718 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2496, - "step": 6719 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2693, - "step": 6720 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2755, - "step": 6721 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2848, - "step": 6722 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.267, - "step": 6723 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2778, - "step": 6724 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2792, - "step": 6725 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2788, - "step": 6726 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2761, - "step": 6727 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.264, - "step": 6728 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2436, - "step": 6729 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2868, - "step": 6730 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2729, - "step": 6731 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2673, - "step": 6732 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2596, - "step": 6733 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2645, - "step": 6734 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2711, - "step": 6735 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2582, - "step": 6736 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2544, - "step": 6737 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2703, - "step": 6738 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2448, - "step": 6739 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2567, - "step": 6740 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2606, - "step": 6741 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.257, - "step": 6742 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2417, - "step": 6743 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.262, - "step": 6744 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2438, - "step": 6745 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2647, - "step": 6746 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2782, - "step": 6747 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2772, - "step": 6748 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2526, - "step": 6749 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2504, - "step": 6750 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.272, - "step": 6751 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2698, - "step": 6752 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2572, - "step": 6753 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2683, - "step": 6754 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2674, - "step": 6755 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2688, - "step": 6756 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2709, - "step": 6757 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2652, - "step": 6758 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2604, - "step": 6759 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2568, - "step": 6760 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2632, - "step": 6761 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2593, - "step": 6762 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2609, - "step": 6763 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2591, - "step": 6764 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2468, - "step": 6765 - }, - { - "epoch": 0.83, - "learning_rate": 0.0003, - "loss": 0.2872, - "step": 6766 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2675, - "step": 6767 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2602, - "step": 6768 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2739, - "step": 6769 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2706, - "step": 6770 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2746, - "step": 6771 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.254, - "step": 6772 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2718, - "step": 6773 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2736, - "step": 6774 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2722, - "step": 6775 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2449, - "step": 6776 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2582, - "step": 6777 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2657, - "step": 6778 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2699, - "step": 6779 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2512, - "step": 6780 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2553, - "step": 6781 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2667, - "step": 6782 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2591, - "step": 6783 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2686, - "step": 6784 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2815, - "step": 6785 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2566, - "step": 6786 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2519, - "step": 6787 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2608, - "step": 6788 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.284, - "step": 6789 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2554, - "step": 6790 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2671, - "step": 6791 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2555, - "step": 6792 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2585, - "step": 6793 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2619, - "step": 6794 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2661, - "step": 6795 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2553, - "step": 6796 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2744, - "step": 6797 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2666, - "step": 6798 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2666, - "step": 6799 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2554, - "step": 6800 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2605, - "step": 6801 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2618, - "step": 6802 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2542, - "step": 6803 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2624, - "step": 6804 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2635, - "step": 6805 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2699, - "step": 6806 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2638, - "step": 6807 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2664, - "step": 6808 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2545, - "step": 6809 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2571, - "step": 6810 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2663, - "step": 6811 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2798, - "step": 6812 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.274, - "step": 6813 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2544, - "step": 6814 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2607, - "step": 6815 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2507, - "step": 6816 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2845, - "step": 6817 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2651, - "step": 6818 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2574, - "step": 6819 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.274, - "step": 6820 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2597, - "step": 6821 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2488, - "step": 6822 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2583, - "step": 6823 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.279, - "step": 6824 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2646, - "step": 6825 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2684, - "step": 6826 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2569, - "step": 6827 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2733, - "step": 6828 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2796, - "step": 6829 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2651, - "step": 6830 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2506, - "step": 6831 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2485, - "step": 6832 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2513, - "step": 6833 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2672, - "step": 6834 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2643, - "step": 6835 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2756, - "step": 6836 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.27, - "step": 6837 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2559, - "step": 6838 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2714, - "step": 6839 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2502, - "step": 6840 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2621, - "step": 6841 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2559, - "step": 6842 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2552, - "step": 6843 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2647, - "step": 6844 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2618, - "step": 6845 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2753, - "step": 6846 - }, - { - "epoch": 0.84, - "learning_rate": 0.0003, - "loss": 0.2586, - "step": 6847 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2697, - "step": 6848 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2906, - "step": 6849 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2777, - "step": 6850 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2593, - "step": 6851 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2618, - "step": 6852 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2795, - "step": 6853 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.28, - "step": 6854 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2812, - "step": 6855 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2648, - "step": 6856 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2487, - "step": 6857 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2753, - "step": 6858 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2682, - "step": 6859 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.28, - "step": 6860 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2758, - "step": 6861 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2562, - "step": 6862 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2451, - "step": 6863 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2864, - "step": 6864 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.26, - "step": 6865 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2581, - "step": 6866 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2674, - "step": 6867 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2681, - "step": 6868 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2655, - "step": 6869 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2785, - "step": 6870 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2558, - "step": 6871 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2536, - "step": 6872 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2725, - "step": 6873 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2582, - "step": 6874 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2698, - "step": 6875 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.264, - "step": 6876 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2562, - "step": 6877 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2573, - "step": 6878 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2746, - "step": 6879 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2837, - "step": 6880 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2533, - "step": 6881 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2723, - "step": 6882 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2588, - "step": 6883 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2786, - "step": 6884 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2561, - "step": 6885 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2869, - "step": 6886 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2516, - "step": 6887 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2495, - "step": 6888 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2582, - "step": 6889 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2836, - "step": 6890 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2704, - "step": 6891 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.256, - "step": 6892 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.255, - "step": 6893 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2424, - "step": 6894 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2955, - "step": 6895 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2655, - "step": 6896 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2678, - "step": 6897 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2406, - "step": 6898 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2717, - "step": 6899 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2626, - "step": 6900 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2421, - "step": 6901 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2699, - "step": 6902 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2803, - "step": 6903 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.257, - "step": 6904 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2543, - "step": 6905 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2696, - "step": 6906 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2481, - "step": 6907 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2794, - "step": 6908 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2752, - "step": 6909 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.272, - "step": 6910 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2729, - "step": 6911 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2659, - "step": 6912 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2555, - "step": 6913 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2443, - "step": 6914 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2728, - "step": 6915 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2662, - "step": 6916 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2452, - "step": 6917 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2453, - "step": 6918 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2533, - "step": 6919 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2478, - "step": 6920 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2579, - "step": 6921 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2542, - "step": 6922 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2708, - "step": 6923 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2326, - "step": 6924 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.251, - "step": 6925 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2512, - "step": 6926 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2632, - "step": 6927 - }, - { - "epoch": 0.85, - "learning_rate": 0.0003, - "loss": 0.2624, - "step": 6928 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2619, - "step": 6929 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2567, - "step": 6930 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2588, - "step": 6931 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2595, - "step": 6932 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2466, - "step": 6933 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.244, - "step": 6934 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2663, - "step": 6935 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2588, - "step": 6936 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2601, - "step": 6937 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.248, - "step": 6938 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2717, - "step": 6939 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2614, - "step": 6940 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2551, - "step": 6941 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.26, - "step": 6942 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2711, - "step": 6943 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2555, - "step": 6944 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2728, - "step": 6945 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.276, - "step": 6946 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2518, - "step": 6947 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.264, - "step": 6948 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2746, - "step": 6949 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2546, - "step": 6950 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2396, - "step": 6951 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2713, - "step": 6952 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2692, - "step": 6953 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2631, - "step": 6954 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2528, - "step": 6955 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2408, - "step": 6956 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2822, - "step": 6957 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2698, - "step": 6958 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2871, - "step": 6959 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2738, - "step": 6960 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2577, - "step": 6961 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2487, - "step": 6962 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2587, - "step": 6963 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2438, - "step": 6964 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2705, - "step": 6965 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2528, - "step": 6966 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2687, - "step": 6967 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2774, - "step": 6968 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2481, - "step": 6969 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2622, - "step": 6970 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2434, - "step": 6971 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2798, - "step": 6972 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2678, - "step": 6973 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2379, - "step": 6974 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2481, - "step": 6975 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2633, - "step": 6976 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2609, - "step": 6977 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2639, - "step": 6978 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2623, - "step": 6979 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.262, - "step": 6980 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2493, - "step": 6981 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2595, - "step": 6982 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2579, - "step": 6983 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2665, - "step": 6984 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2472, - "step": 6985 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2647, - "step": 6986 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2533, - "step": 6987 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2701, - "step": 6988 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.274, - "step": 6989 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2602, - "step": 6990 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2631, - "step": 6991 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2755, - "step": 6992 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2645, - "step": 6993 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.268, - "step": 6994 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2416, - "step": 6995 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2683, - "step": 6996 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2624, - "step": 6997 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2851, - "step": 6998 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2753, - "step": 6999 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2561, - "step": 7000 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2435, - "step": 7001 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2619, - "step": 7002 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2544, - "step": 7003 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2705, - "step": 7004 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2798, - "step": 7005 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2503, - "step": 7006 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2661, - "step": 7007 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2785, - "step": 7008 - }, - { - "epoch": 0.86, - "learning_rate": 0.0003, - "loss": 0.2477, - "step": 7009 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2542, - "step": 7010 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2852, - "step": 7011 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2604, - "step": 7012 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2542, - "step": 7013 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2422, - "step": 7014 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2655, - "step": 7015 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2476, - "step": 7016 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2667, - "step": 7017 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.271, - "step": 7018 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2546, - "step": 7019 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2825, - "step": 7020 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2664, - "step": 7021 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2843, - "step": 7022 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2795, - "step": 7023 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2538, - "step": 7024 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2487, - "step": 7025 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2714, - "step": 7026 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2552, - "step": 7027 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.252, - "step": 7028 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2565, - "step": 7029 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.266, - "step": 7030 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2436, - "step": 7031 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2711, - "step": 7032 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2591, - "step": 7033 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2542, - "step": 7034 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.247, - "step": 7035 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.269, - "step": 7036 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2484, - "step": 7037 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2791, - "step": 7038 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2589, - "step": 7039 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2597, - "step": 7040 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2684, - "step": 7041 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2524, - "step": 7042 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2555, - "step": 7043 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2665, - "step": 7044 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2643, - "step": 7045 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2605, - "step": 7046 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2586, - "step": 7047 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2538, - "step": 7048 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2638, - "step": 7049 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.258, - "step": 7050 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.264, - "step": 7051 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2582, - "step": 7052 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2778, - "step": 7053 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2754, - "step": 7054 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2475, - "step": 7055 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.256, - "step": 7056 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2543, - "step": 7057 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2624, - "step": 7058 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2603, - "step": 7059 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2533, - "step": 7060 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2502, - "step": 7061 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2707, - "step": 7062 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2708, - "step": 7063 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2674, - "step": 7064 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2695, - "step": 7065 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2547, - "step": 7066 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2765, - "step": 7067 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2761, - "step": 7068 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2724, - "step": 7069 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2713, - "step": 7070 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2553, - "step": 7071 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2511, - "step": 7072 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2527, - "step": 7073 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2688, - "step": 7074 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2778, - "step": 7075 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2672, - "step": 7076 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2406, - "step": 7077 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2511, - "step": 7078 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.267, - "step": 7079 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2587, - "step": 7080 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2452, - "step": 7081 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2614, - "step": 7082 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2704, - "step": 7083 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2531, - "step": 7084 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2666, - "step": 7085 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2552, - "step": 7086 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2637, - "step": 7087 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2497, - "step": 7088 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2506, - "step": 7089 - }, - { - "epoch": 0.87, - "learning_rate": 0.0003, - "loss": 0.2611, - "step": 7090 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2688, - "step": 7091 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2771, - "step": 7092 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2563, - "step": 7093 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2569, - "step": 7094 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.248, - "step": 7095 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2566, - "step": 7096 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2669, - "step": 7097 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2676, - "step": 7098 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2405, - "step": 7099 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2586, - "step": 7100 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2766, - "step": 7101 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2778, - "step": 7102 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2567, - "step": 7103 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2571, - "step": 7104 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2752, - "step": 7105 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2559, - "step": 7106 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2596, - "step": 7107 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2518, - "step": 7108 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2534, - "step": 7109 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2605, - "step": 7110 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2754, - "step": 7111 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2594, - "step": 7112 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2417, - "step": 7113 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2526, - "step": 7114 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.257, - "step": 7115 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2529, - "step": 7116 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2578, - "step": 7117 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.24, - "step": 7118 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2863, - "step": 7119 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2489, - "step": 7120 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2676, - "step": 7121 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2401, - "step": 7122 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2681, - "step": 7123 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2576, - "step": 7124 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2608, - "step": 7125 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2703, - "step": 7126 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2676, - "step": 7127 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2686, - "step": 7128 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2555, - "step": 7129 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2687, - "step": 7130 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2723, - "step": 7131 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2483, - "step": 7132 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2655, - "step": 7133 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2724, - "step": 7134 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2717, - "step": 7135 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2744, - "step": 7136 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2519, - "step": 7137 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2544, - "step": 7138 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.256, - "step": 7139 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2679, - "step": 7140 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2593, - "step": 7141 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2679, - "step": 7142 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2299, - "step": 7143 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.249, - "step": 7144 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2663, - "step": 7145 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2448, - "step": 7146 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2738, - "step": 7147 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2486, - "step": 7148 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2545, - "step": 7149 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2584, - "step": 7150 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2763, - "step": 7151 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2577, - "step": 7152 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2596, - "step": 7153 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2451, - "step": 7154 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2468, - "step": 7155 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.251, - "step": 7156 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2767, - "step": 7157 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2555, - "step": 7158 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.269, - "step": 7159 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2493, - "step": 7160 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2524, - "step": 7161 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2518, - "step": 7162 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2491, - "step": 7163 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.271, - "step": 7164 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2623, - "step": 7165 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2535, - "step": 7166 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2622, - "step": 7167 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2575, - "step": 7168 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2647, - "step": 7169 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2486, - "step": 7170 - }, - { - "epoch": 0.88, - "learning_rate": 0.0003, - "loss": 0.2542, - "step": 7171 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2626, - "step": 7172 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2808, - "step": 7173 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2481, - "step": 7174 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2427, - "step": 7175 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2613, - "step": 7176 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2483, - "step": 7177 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2547, - "step": 7178 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2555, - "step": 7179 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2666, - "step": 7180 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2563, - "step": 7181 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.25, - "step": 7182 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2535, - "step": 7183 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2622, - "step": 7184 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2567, - "step": 7185 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2755, - "step": 7186 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2256, - "step": 7187 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2596, - "step": 7188 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2707, - "step": 7189 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2675, - "step": 7190 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2672, - "step": 7191 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2705, - "step": 7192 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2589, - "step": 7193 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2582, - "step": 7194 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2532, - "step": 7195 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2423, - "step": 7196 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2662, - "step": 7197 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2493, - "step": 7198 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2522, - "step": 7199 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2683, - "step": 7200 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2594, - "step": 7201 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2637, - "step": 7202 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2552, - "step": 7203 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.274, - "step": 7204 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2503, - "step": 7205 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2552, - "step": 7206 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2512, - "step": 7207 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2556, - "step": 7208 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2617, - "step": 7209 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2682, - "step": 7210 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2524, - "step": 7211 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2589, - "step": 7212 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2789, - "step": 7213 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.261, - "step": 7214 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2541, - "step": 7215 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.253, - "step": 7216 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2693, - "step": 7217 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2522, - "step": 7218 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2502, - "step": 7219 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2527, - "step": 7220 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2588, - "step": 7221 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2637, - "step": 7222 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.246, - "step": 7223 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2614, - "step": 7224 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2666, - "step": 7225 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.267, - "step": 7226 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2512, - "step": 7227 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2549, - "step": 7228 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2769, - "step": 7229 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2621, - "step": 7230 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2598, - "step": 7231 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2579, - "step": 7232 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2502, - "step": 7233 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2566, - "step": 7234 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2515, - "step": 7235 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2585, - "step": 7236 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2597, - "step": 7237 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.248, - "step": 7238 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2648, - "step": 7239 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2622, - "step": 7240 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2734, - "step": 7241 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2721, - "step": 7242 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2723, - "step": 7243 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2664, - "step": 7244 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2623, - "step": 7245 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2684, - "step": 7246 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2476, - "step": 7247 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2931, - "step": 7248 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2563, - "step": 7249 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2518, - "step": 7250 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2611, - "step": 7251 - }, - { - "epoch": 0.89, - "learning_rate": 0.0003, - "loss": 0.2689, - "step": 7252 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2721, - "step": 7253 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2766, - "step": 7254 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.27, - "step": 7255 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2533, - "step": 7256 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2712, - "step": 7257 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.258, - "step": 7258 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2608, - "step": 7259 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2604, - "step": 7260 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2687, - "step": 7261 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2767, - "step": 7262 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2643, - "step": 7263 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2527, - "step": 7264 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2639, - "step": 7265 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2399, - "step": 7266 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2558, - "step": 7267 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2593, - "step": 7268 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2691, - "step": 7269 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2539, - "step": 7270 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2725, - "step": 7271 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2388, - "step": 7272 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2727, - "step": 7273 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.253, - "step": 7274 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2564, - "step": 7275 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2495, - "step": 7276 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2506, - "step": 7277 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2562, - "step": 7278 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2632, - "step": 7279 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2843, - "step": 7280 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2679, - "step": 7281 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2628, - "step": 7282 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2598, - "step": 7283 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2581, - "step": 7284 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2599, - "step": 7285 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2423, - "step": 7286 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2511, - "step": 7287 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2648, - "step": 7288 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2667, - "step": 7289 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2705, - "step": 7290 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2585, - "step": 7291 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2714, - "step": 7292 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2618, - "step": 7293 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2495, - "step": 7294 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2554, - "step": 7295 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.261, - "step": 7296 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2558, - "step": 7297 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2507, - "step": 7298 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2677, - "step": 7299 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2453, - "step": 7300 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2501, - "step": 7301 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2687, - "step": 7302 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2438, - "step": 7303 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2665, - "step": 7304 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2563, - "step": 7305 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2509, - "step": 7306 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2594, - "step": 7307 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2558, - "step": 7308 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2524, - "step": 7309 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2567, - "step": 7310 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2537, - "step": 7311 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2697, - "step": 7312 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2607, - "step": 7313 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2734, - "step": 7314 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.263, - "step": 7315 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2589, - "step": 7316 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2471, - "step": 7317 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2584, - "step": 7318 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2572, - "step": 7319 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2522, - "step": 7320 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2605, - "step": 7321 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2529, - "step": 7322 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2559, - "step": 7323 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2587, - "step": 7324 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2567, - "step": 7325 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.259, - "step": 7326 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2624, - "step": 7327 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2802, - "step": 7328 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2519, - "step": 7329 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2599, - "step": 7330 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2445, - "step": 7331 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2646, - "step": 7332 - }, - { - "epoch": 0.9, - "learning_rate": 0.0003, - "loss": 0.2542, - "step": 7333 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2717, - "step": 7334 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2595, - "step": 7335 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2642, - "step": 7336 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2473, - "step": 7337 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.258, - "step": 7338 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2641, - "step": 7339 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2514, - "step": 7340 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2587, - "step": 7341 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2487, - "step": 7342 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2527, - "step": 7343 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2593, - "step": 7344 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2526, - "step": 7345 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2601, - "step": 7346 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.238, - "step": 7347 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2655, - "step": 7348 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2556, - "step": 7349 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.264, - "step": 7350 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2634, - "step": 7351 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2578, - "step": 7352 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2673, - "step": 7353 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2669, - "step": 7354 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2464, - "step": 7355 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2535, - "step": 7356 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2625, - "step": 7357 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2574, - "step": 7358 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2604, - "step": 7359 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2626, - "step": 7360 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.249, - "step": 7361 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2586, - "step": 7362 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2677, - "step": 7363 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2565, - "step": 7364 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2529, - "step": 7365 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2409, - "step": 7366 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2517, - "step": 7367 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2622, - "step": 7368 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2584, - "step": 7369 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2488, - "step": 7370 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2745, - "step": 7371 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2619, - "step": 7372 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2432, - "step": 7373 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2574, - "step": 7374 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2706, - "step": 7375 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2609, - "step": 7376 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2465, - "step": 7377 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.258, - "step": 7378 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2809, - "step": 7379 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2599, - "step": 7380 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2567, - "step": 7381 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2722, - "step": 7382 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2636, - "step": 7383 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2663, - "step": 7384 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2447, - "step": 7385 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.248, - "step": 7386 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2636, - "step": 7387 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2575, - "step": 7388 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2633, - "step": 7389 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2597, - "step": 7390 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.264, - "step": 7391 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2385, - "step": 7392 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2769, - "step": 7393 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2593, - "step": 7394 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2486, - "step": 7395 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2743, - "step": 7396 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2491, - "step": 7397 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2573, - "step": 7398 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2416, - "step": 7399 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2651, - "step": 7400 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2544, - "step": 7401 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2544, - "step": 7402 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.259, - "step": 7403 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2645, - "step": 7404 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2738, - "step": 7405 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2719, - "step": 7406 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2643, - "step": 7407 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2491, - "step": 7408 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2673, - "step": 7409 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2542, - "step": 7410 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2732, - "step": 7411 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2664, - "step": 7412 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.2667, - "step": 7413 - }, - { - "epoch": 0.91, - "learning_rate": 0.0003, - "loss": 0.241, - "step": 7414 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2723, - "step": 7415 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2752, - "step": 7416 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.262, - "step": 7417 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2609, - "step": 7418 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2732, - "step": 7419 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.26, - "step": 7420 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2615, - "step": 7421 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2611, - "step": 7422 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2489, - "step": 7423 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2701, - "step": 7424 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2395, - "step": 7425 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2726, - "step": 7426 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2305, - "step": 7427 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2731, - "step": 7428 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2516, - "step": 7429 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2727, - "step": 7430 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2487, - "step": 7431 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2503, - "step": 7432 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2631, - "step": 7433 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2604, - "step": 7434 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.273, - "step": 7435 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.252, - "step": 7436 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2496, - "step": 7437 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2618, - "step": 7438 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2484, - "step": 7439 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2617, - "step": 7440 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2635, - "step": 7441 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2663, - "step": 7442 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.258, - "step": 7443 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2766, - "step": 7444 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.273, - "step": 7445 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2499, - "step": 7446 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2559, - "step": 7447 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2515, - "step": 7448 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2429, - "step": 7449 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2498, - "step": 7450 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2795, - "step": 7451 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2652, - "step": 7452 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2486, - "step": 7453 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2522, - "step": 7454 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2601, - "step": 7455 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2657, - "step": 7456 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.248, - "step": 7457 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2767, - "step": 7458 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2631, - "step": 7459 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2586, - "step": 7460 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2638, - "step": 7461 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2595, - "step": 7462 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2483, - "step": 7463 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2532, - "step": 7464 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2723, - "step": 7465 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2615, - "step": 7466 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2539, - "step": 7467 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2592, - "step": 7468 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2588, - "step": 7469 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2565, - "step": 7470 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2511, - "step": 7471 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2758, - "step": 7472 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2598, - "step": 7473 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2434, - "step": 7474 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2623, - "step": 7475 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2565, - "step": 7476 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2646, - "step": 7477 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2551, - "step": 7478 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2815, - "step": 7479 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2824, - "step": 7480 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2624, - "step": 7481 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2671, - "step": 7482 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2519, - "step": 7483 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2553, - "step": 7484 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2534, - "step": 7485 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2491, - "step": 7486 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2741, - "step": 7487 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2425, - "step": 7488 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2633, - "step": 7489 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.257, - "step": 7490 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2534, - "step": 7491 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2647, - "step": 7492 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2663, - "step": 7493 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2515, - "step": 7494 - }, - { - "epoch": 0.92, - "learning_rate": 0.0003, - "loss": 0.2476, - "step": 7495 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2559, - "step": 7496 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2547, - "step": 7497 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2628, - "step": 7498 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2566, - "step": 7499 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2433, - "step": 7500 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2507, - "step": 7501 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2349, - "step": 7502 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2576, - "step": 7503 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2699, - "step": 7504 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2657, - "step": 7505 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2604, - "step": 7506 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2488, - "step": 7507 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2605, - "step": 7508 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2694, - "step": 7509 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2686, - "step": 7510 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.238, - "step": 7511 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2443, - "step": 7512 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2559, - "step": 7513 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.262, - "step": 7514 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2704, - "step": 7515 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2683, - "step": 7516 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.241, - "step": 7517 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2433, - "step": 7518 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2497, - "step": 7519 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.252, - "step": 7520 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2634, - "step": 7521 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2549, - "step": 7522 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2539, - "step": 7523 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2569, - "step": 7524 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2523, - "step": 7525 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2647, - "step": 7526 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2388, - "step": 7527 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2663, - "step": 7528 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2676, - "step": 7529 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2686, - "step": 7530 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2442, - "step": 7531 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2448, - "step": 7532 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2558, - "step": 7533 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2551, - "step": 7534 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2702, - "step": 7535 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2567, - "step": 7536 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2585, - "step": 7537 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2668, - "step": 7538 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.27, - "step": 7539 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.278, - "step": 7540 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2562, - "step": 7541 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.244, - "step": 7542 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2485, - "step": 7543 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2514, - "step": 7544 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2577, - "step": 7545 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2648, - "step": 7546 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2662, - "step": 7547 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2664, - "step": 7548 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2646, - "step": 7549 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2476, - "step": 7550 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2639, - "step": 7551 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2566, - "step": 7552 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2464, - "step": 7553 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2728, - "step": 7554 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2425, - "step": 7555 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2474, - "step": 7556 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2506, - "step": 7557 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2656, - "step": 7558 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2555, - "step": 7559 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2391, - "step": 7560 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2569, - "step": 7561 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2625, - "step": 7562 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2584, - "step": 7563 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2681, - "step": 7564 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2461, - "step": 7565 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2685, - "step": 7566 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2587, - "step": 7567 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2432, - "step": 7568 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.254, - "step": 7569 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2576, - "step": 7570 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2651, - "step": 7571 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2592, - "step": 7572 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2443, - "step": 7573 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2656, - "step": 7574 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2815, - "step": 7575 - }, - { - "epoch": 0.93, - "learning_rate": 0.0003, - "loss": 0.2487, - "step": 7576 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2435, - "step": 7577 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2383, - "step": 7578 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2469, - "step": 7579 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2646, - "step": 7580 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2607, - "step": 7581 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2685, - "step": 7582 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2347, - "step": 7583 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2548, - "step": 7584 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2591, - "step": 7585 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2594, - "step": 7586 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2611, - "step": 7587 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2492, - "step": 7588 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.256, - "step": 7589 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2566, - "step": 7590 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2634, - "step": 7591 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.254, - "step": 7592 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2496, - "step": 7593 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2612, - "step": 7594 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.255, - "step": 7595 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.257, - "step": 7596 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2473, - "step": 7597 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.249, - "step": 7598 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2508, - "step": 7599 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2511, - "step": 7600 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2592, - "step": 7601 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2621, - "step": 7602 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2578, - "step": 7603 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2493, - "step": 7604 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2588, - "step": 7605 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2697, - "step": 7606 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2656, - "step": 7607 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2541, - "step": 7608 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2734, - "step": 7609 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2631, - "step": 7610 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2657, - "step": 7611 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.253, - "step": 7612 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2692, - "step": 7613 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.244, - "step": 7614 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2546, - "step": 7615 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2597, - "step": 7616 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2659, - "step": 7617 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2496, - "step": 7618 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2501, - "step": 7619 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2654, - "step": 7620 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2544, - "step": 7621 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2718, - "step": 7622 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2592, - "step": 7623 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2647, - "step": 7624 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2598, - "step": 7625 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2719, - "step": 7626 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2632, - "step": 7627 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2537, - "step": 7628 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2485, - "step": 7629 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.268, - "step": 7630 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2643, - "step": 7631 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2606, - "step": 7632 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.246, - "step": 7633 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2653, - "step": 7634 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2501, - "step": 7635 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2493, - "step": 7636 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2719, - "step": 7637 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2466, - "step": 7638 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2695, - "step": 7639 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2501, - "step": 7640 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2565, - "step": 7641 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2532, - "step": 7642 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2593, - "step": 7643 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2687, - "step": 7644 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.256, - "step": 7645 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2702, - "step": 7646 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2716, - "step": 7647 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2567, - "step": 7648 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.27, - "step": 7649 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2543, - "step": 7650 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2518, - "step": 7651 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2563, - "step": 7652 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2698, - "step": 7653 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2517, - "step": 7654 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2709, - "step": 7655 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2454, - "step": 7656 - }, - { - "epoch": 0.94, - "learning_rate": 0.0003, - "loss": 0.2517, - "step": 7657 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.262, - "step": 7658 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2524, - "step": 7659 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.256, - "step": 7660 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2709, - "step": 7661 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2502, - "step": 7662 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2419, - "step": 7663 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2616, - "step": 7664 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2583, - "step": 7665 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2499, - "step": 7666 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2718, - "step": 7667 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2324, - "step": 7668 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2428, - "step": 7669 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2673, - "step": 7670 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.258, - "step": 7671 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.253, - "step": 7672 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2506, - "step": 7673 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2525, - "step": 7674 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2705, - "step": 7675 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2419, - "step": 7676 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2313, - "step": 7677 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2717, - "step": 7678 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2515, - "step": 7679 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2556, - "step": 7680 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2709, - "step": 7681 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2504, - "step": 7682 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2567, - "step": 7683 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2573, - "step": 7684 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2496, - "step": 7685 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2488, - "step": 7686 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2663, - "step": 7687 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2753, - "step": 7688 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2567, - "step": 7689 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2572, - "step": 7690 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2665, - "step": 7691 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2608, - "step": 7692 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2556, - "step": 7693 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2468, - "step": 7694 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2484, - "step": 7695 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2562, - "step": 7696 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2525, - "step": 7697 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2423, - "step": 7698 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.247, - "step": 7699 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2642, - "step": 7700 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2587, - "step": 7701 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2378, - "step": 7702 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2389, - "step": 7703 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2541, - "step": 7704 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2709, - "step": 7705 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2445, - "step": 7706 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2609, - "step": 7707 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2557, - "step": 7708 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2515, - "step": 7709 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2657, - "step": 7710 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2539, - "step": 7711 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2538, - "step": 7712 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2608, - "step": 7713 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2712, - "step": 7714 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2623, - "step": 7715 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2477, - "step": 7716 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2651, - "step": 7717 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2648, - "step": 7718 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2579, - "step": 7719 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2633, - "step": 7720 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2436, - "step": 7721 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2665, - "step": 7722 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2656, - "step": 7723 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2497, - "step": 7724 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2496, - "step": 7725 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2645, - "step": 7726 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2505, - "step": 7727 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2611, - "step": 7728 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2528, - "step": 7729 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2533, - "step": 7730 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2503, - "step": 7731 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2373, - "step": 7732 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.247, - "step": 7733 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2465, - "step": 7734 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2583, - "step": 7735 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2657, - "step": 7736 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2586, - "step": 7737 - }, - { - "epoch": 0.95, - "learning_rate": 0.0003, - "loss": 0.2634, - "step": 7738 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.25, - "step": 7739 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2577, - "step": 7740 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2433, - "step": 7741 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2646, - "step": 7742 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2614, - "step": 7743 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2651, - "step": 7744 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2624, - "step": 7745 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2588, - "step": 7746 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2743, - "step": 7747 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2524, - "step": 7748 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2591, - "step": 7749 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2572, - "step": 7750 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2766, - "step": 7751 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2647, - "step": 7752 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2621, - "step": 7753 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2515, - "step": 7754 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2597, - "step": 7755 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2562, - "step": 7756 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2524, - "step": 7757 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2619, - "step": 7758 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.25, - "step": 7759 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.267, - "step": 7760 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2756, - "step": 7761 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2511, - "step": 7762 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2561, - "step": 7763 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2591, - "step": 7764 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2544, - "step": 7765 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2561, - "step": 7766 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.272, - "step": 7767 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2368, - "step": 7768 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2613, - "step": 7769 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.263, - "step": 7770 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2473, - "step": 7771 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2543, - "step": 7772 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2598, - "step": 7773 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2568, - "step": 7774 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2699, - "step": 7775 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2453, - "step": 7776 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2453, - "step": 7777 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2559, - "step": 7778 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2605, - "step": 7779 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2745, - "step": 7780 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2659, - "step": 7781 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.244, - "step": 7782 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2652, - "step": 7783 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2626, - "step": 7784 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2742, - "step": 7785 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.26, - "step": 7786 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2554, - "step": 7787 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2433, - "step": 7788 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2534, - "step": 7789 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2655, - "step": 7790 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2467, - "step": 7791 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2487, - "step": 7792 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2452, - "step": 7793 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2622, - "step": 7794 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2424, - "step": 7795 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2469, - "step": 7796 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2509, - "step": 7797 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2476, - "step": 7798 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2696, - "step": 7799 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2534, - "step": 7800 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2565, - "step": 7801 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2629, - "step": 7802 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2536, - "step": 7803 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2614, - "step": 7804 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.267, - "step": 7805 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2516, - "step": 7806 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.261, - "step": 7807 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2506, - "step": 7808 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2607, - "step": 7809 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2692, - "step": 7810 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2644, - "step": 7811 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.235, - "step": 7812 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2746, - "step": 7813 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.265, - "step": 7814 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2484, - "step": 7815 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2531, - "step": 7816 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2509, - "step": 7817 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.2484, - "step": 7818 - }, - { - "epoch": 0.96, - "learning_rate": 0.0003, - "loss": 0.252, - "step": 7819 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2457, - "step": 7820 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2768, - "step": 7821 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.262, - "step": 7822 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2458, - "step": 7823 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2533, - "step": 7824 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2545, - "step": 7825 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2411, - "step": 7826 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2506, - "step": 7827 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.248, - "step": 7828 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2709, - "step": 7829 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2589, - "step": 7830 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2585, - "step": 7831 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2442, - "step": 7832 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2532, - "step": 7833 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2579, - "step": 7834 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.258, - "step": 7835 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2395, - "step": 7836 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.274, - "step": 7837 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2629, - "step": 7838 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2721, - "step": 7839 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2299, - "step": 7840 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2408, - "step": 7841 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2553, - "step": 7842 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2807, - "step": 7843 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2608, - "step": 7844 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2549, - "step": 7845 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2546, - "step": 7846 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2657, - "step": 7847 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2742, - "step": 7848 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2314, - "step": 7849 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2587, - "step": 7850 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2731, - "step": 7851 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2599, - "step": 7852 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2409, - "step": 7853 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.255, - "step": 7854 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2674, - "step": 7855 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2612, - "step": 7856 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2443, - "step": 7857 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2573, - "step": 7858 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2778, - "step": 7859 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2513, - "step": 7860 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2491, - "step": 7861 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2473, - "step": 7862 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2551, - "step": 7863 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2521, - "step": 7864 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2525, - "step": 7865 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2552, - "step": 7866 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2567, - "step": 7867 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2453, - "step": 7868 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.256, - "step": 7869 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2531, - "step": 7870 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2565, - "step": 7871 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2606, - "step": 7872 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2488, - "step": 7873 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2574, - "step": 7874 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2385, - "step": 7875 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2634, - "step": 7876 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2586, - "step": 7877 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2459, - "step": 7878 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2462, - "step": 7879 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2429, - "step": 7880 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2415, - "step": 7881 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2471, - "step": 7882 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2443, - "step": 7883 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.254, - "step": 7884 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2569, - "step": 7885 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2563, - "step": 7886 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2597, - "step": 7887 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.257, - "step": 7888 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2498, - "step": 7889 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.275, - "step": 7890 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2571, - "step": 7891 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2645, - "step": 7892 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2623, - "step": 7893 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.259, - "step": 7894 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.25, - "step": 7895 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2442, - "step": 7896 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2603, - "step": 7897 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2608, - "step": 7898 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2486, - "step": 7899 - }, - { - "epoch": 0.97, - "learning_rate": 0.0003, - "loss": 0.2522, - "step": 7900 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2464, - "step": 7901 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2651, - "step": 7902 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2468, - "step": 7903 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2565, - "step": 7904 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2527, - "step": 7905 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2608, - "step": 7906 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2448, - "step": 7907 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2617, - "step": 7908 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2648, - "step": 7909 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2629, - "step": 7910 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2438, - "step": 7911 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2595, - "step": 7912 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.258, - "step": 7913 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2491, - "step": 7914 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.256, - "step": 7915 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2443, - "step": 7916 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2394, - "step": 7917 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.252, - "step": 7918 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2637, - "step": 7919 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2481, - "step": 7920 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2571, - "step": 7921 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2553, - "step": 7922 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2398, - "step": 7923 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2491, - "step": 7924 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2402, - "step": 7925 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2458, - "step": 7926 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2481, - "step": 7927 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2586, - "step": 7928 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.249, - "step": 7929 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2575, - "step": 7930 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.242, - "step": 7931 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2505, - "step": 7932 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2542, - "step": 7933 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2408, - "step": 7934 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2557, - "step": 7935 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2678, - "step": 7936 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2598, - "step": 7937 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2386, - "step": 7938 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.255, - "step": 7939 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2572, - "step": 7940 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.247, - "step": 7941 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2481, - "step": 7942 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2579, - "step": 7943 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2633, - "step": 7944 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2352, - "step": 7945 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2503, - "step": 7946 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2694, - "step": 7947 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2493, - "step": 7948 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2589, - "step": 7949 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2517, - "step": 7950 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2822, - "step": 7951 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2482, - "step": 7952 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2593, - "step": 7953 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2703, - "step": 7954 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2569, - "step": 7955 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2513, - "step": 7956 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2503, - "step": 7957 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2515, - "step": 7958 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2434, - "step": 7959 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2541, - "step": 7960 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2489, - "step": 7961 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2447, - "step": 7962 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2577, - "step": 7963 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2367, - "step": 7964 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2567, - "step": 7965 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2526, - "step": 7966 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2615, - "step": 7967 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2459, - "step": 7968 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2557, - "step": 7969 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2443, - "step": 7970 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2633, - "step": 7971 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2627, - "step": 7972 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2544, - "step": 7973 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2619, - "step": 7974 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2446, - "step": 7975 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2457, - "step": 7976 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2722, - "step": 7977 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2598, - "step": 7978 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2529, - "step": 7979 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2443, - "step": 7980 - }, - { - "epoch": 0.98, - "learning_rate": 0.0003, - "loss": 0.2542, - "step": 7981 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2461, - "step": 7982 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.243, - "step": 7983 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.244, - "step": 7984 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2476, - "step": 7985 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2491, - "step": 7986 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.259, - "step": 7987 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2479, - "step": 7988 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2483, - "step": 7989 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2576, - "step": 7990 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2611, - "step": 7991 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2638, - "step": 7992 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2446, - "step": 7993 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2498, - "step": 7994 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2513, - "step": 7995 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2619, - "step": 7996 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2531, - "step": 7997 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2538, - "step": 7998 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2612, - "step": 7999 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.255, - "step": 8000 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2453, - "step": 8001 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2552, - "step": 8002 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2424, - "step": 8003 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2548, - "step": 8004 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2468, - "step": 8005 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2401, - "step": 8006 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2497, - "step": 8007 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2597, - "step": 8008 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2481, - "step": 8009 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2371, - "step": 8010 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2474, - "step": 8011 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2629, - "step": 8012 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2439, - "step": 8013 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2482, - "step": 8014 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2543, - "step": 8015 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2514, - "step": 8016 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2502, - "step": 8017 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2359, - "step": 8018 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2416, - "step": 8019 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2641, - "step": 8020 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2631, - "step": 8021 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2405, - "step": 8022 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2483, - "step": 8023 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2593, - "step": 8024 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2404, - "step": 8025 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2589, - "step": 8026 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2493, - "step": 8027 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2633, - "step": 8028 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2542, - "step": 8029 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2573, - "step": 8030 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2424, - "step": 8031 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.252, - "step": 8032 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2469, - "step": 8033 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2622, - "step": 8034 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2684, - "step": 8035 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2376, - "step": 8036 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2291, - "step": 8037 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2343, - "step": 8038 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2721, - "step": 8039 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2423, - "step": 8040 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2519, - "step": 8041 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2688, - "step": 8042 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2623, - "step": 8043 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2462, - "step": 8044 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2711, - "step": 8045 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2451, - "step": 8046 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2639, - "step": 8047 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2464, - "step": 8048 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2693, - "step": 8049 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.252, - "step": 8050 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2213, - "step": 8051 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2456, - "step": 8052 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.269, - "step": 8053 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2662, - "step": 8054 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2524, - "step": 8055 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2384, - "step": 8056 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.246, - "step": 8057 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2665, - "step": 8058 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2483, - "step": 8059 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2656, - "step": 8060 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2767, - "step": 8061 - }, - { - "epoch": 0.99, - "learning_rate": 0.0003, - "loss": 0.2449, - "step": 8062 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2534, - "step": 8063 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.255, - "step": 8064 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.234, - "step": 8065 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2634, - "step": 8066 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2536, - "step": 8067 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.259, - "step": 8068 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2459, - "step": 8069 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2679, - "step": 8070 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2556, - "step": 8071 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2624, - "step": 8072 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2607, - "step": 8073 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2489, - "step": 8074 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2562, - "step": 8075 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2635, - "step": 8076 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2487, - "step": 8077 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.249, - "step": 8078 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2515, - "step": 8079 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2538, - "step": 8080 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2451, - "step": 8081 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2501, - "step": 8082 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2591, - "step": 8083 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2595, - "step": 8084 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2477, - "step": 8085 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2385, - "step": 8086 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2405, - "step": 8087 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2435, - "step": 8088 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2453, - "step": 8089 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2535, - "step": 8090 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2587, - "step": 8091 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2649, - "step": 8092 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2561, - "step": 8093 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2548, - "step": 8094 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2598, - "step": 8095 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2588, - "step": 8096 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2616, - "step": 8097 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2564, - "step": 8098 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2808, - "step": 8099 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2478, - "step": 8100 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.247, - "step": 8101 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2472, - "step": 8102 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2549, - "step": 8103 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2506, - "step": 8104 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2704, - "step": 8105 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2527, - "step": 8106 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2649, - "step": 8107 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2572, - "step": 8108 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2325, - "step": 8109 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2762, - "step": 8110 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2559, - "step": 8111 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2394, - "step": 8112 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2541, - "step": 8113 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2499, - "step": 8114 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2655, - "step": 8115 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2347, - "step": 8116 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2611, - "step": 8117 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2487, - "step": 8118 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2503, - "step": 8119 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2524, - "step": 8120 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.255, - "step": 8121 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2443, - "step": 8122 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2662, - "step": 8123 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2397, - "step": 8124 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2652, - "step": 8125 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2471, - "step": 8126 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2602, - "step": 8127 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2719, - "step": 8128 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2384, - "step": 8129 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2459, - "step": 8130 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.25, - "step": 8131 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.265, - "step": 8132 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2685, - "step": 8133 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2654, - "step": 8134 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2422, - "step": 8135 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2726, - "step": 8136 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2525, - "step": 8137 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2443, - "step": 8138 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2488, - "step": 8139 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2607, - "step": 8140 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.241, - "step": 8141 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.269, - "step": 8142 - }, - { - "epoch": 1.0, - "learning_rate": 0.0003, - "loss": 0.2577, - "step": 8143 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2693, - "step": 8144 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.253, - "step": 8145 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2502, - "step": 8146 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2592, - "step": 8147 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2469, - "step": 8148 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2497, - "step": 8149 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2468, - "step": 8150 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2456, - "step": 8151 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2541, - "step": 8152 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2593, - "step": 8153 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2509, - "step": 8154 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2522, - "step": 8155 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2441, - "step": 8156 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2481, - "step": 8157 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2506, - "step": 8158 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2516, - "step": 8159 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.241, - "step": 8160 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2503, - "step": 8161 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2395, - "step": 8162 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2458, - "step": 8163 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2506, - "step": 8164 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2546, - "step": 8165 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2463, - "step": 8166 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2577, - "step": 8167 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2699, - "step": 8168 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2706, - "step": 8169 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2648, - "step": 8170 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2606, - "step": 8171 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.247, - "step": 8172 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2435, - "step": 8173 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2743, - "step": 8174 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2579, - "step": 8175 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2479, - "step": 8176 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2482, - "step": 8177 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2524, - "step": 8178 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2671, - "step": 8179 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2585, - "step": 8180 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2439, - "step": 8181 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2366, - "step": 8182 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2413, - "step": 8183 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2413, - "step": 8184 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2473, - "step": 8185 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2471, - "step": 8186 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2613, - "step": 8187 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2535, - "step": 8188 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2452, - "step": 8189 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.245, - "step": 8190 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2586, - "step": 8191 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2586, - "step": 8192 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2444, - "step": 8193 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2446, - "step": 8194 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2494, - "step": 8195 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2602, - "step": 8196 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2487, - "step": 8197 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2412, - "step": 8198 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2457, - "step": 8199 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2545, - "step": 8200 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2444, - "step": 8201 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2592, - "step": 8202 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2406, - "step": 8203 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2593, - "step": 8204 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2517, - "step": 8205 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2534, - "step": 8206 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2526, - "step": 8207 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2686, - "step": 8208 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2447, - "step": 8209 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2607, - "step": 8210 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2523, - "step": 8211 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2483, - "step": 8212 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2496, - "step": 8213 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2492, - "step": 8214 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2607, - "step": 8215 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2528, - "step": 8216 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2445, - "step": 8217 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2517, - "step": 8218 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2506, - "step": 8219 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2588, - "step": 8220 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2559, - "step": 8221 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2483, - "step": 8222 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2574, - "step": 8223 - }, - { - "epoch": 1.01, - "learning_rate": 0.0003, - "loss": 0.2617, - "step": 8224 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2564, - "step": 8225 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2512, - "step": 8226 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.244, - "step": 8227 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.255, - "step": 8228 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2303, - "step": 8229 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2661, - "step": 8230 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2513, - "step": 8231 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2625, - "step": 8232 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2508, - "step": 8233 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.254, - "step": 8234 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2676, - "step": 8235 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2464, - "step": 8236 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2436, - "step": 8237 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2514, - "step": 8238 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2639, - "step": 8239 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2386, - "step": 8240 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.238, - "step": 8241 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2594, - "step": 8242 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2647, - "step": 8243 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2333, - "step": 8244 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2642, - "step": 8245 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.264, - "step": 8246 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2636, - "step": 8247 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2663, - "step": 8248 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2506, - "step": 8249 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2508, - "step": 8250 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2512, - "step": 8251 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2594, - "step": 8252 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2501, - "step": 8253 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2599, - "step": 8254 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2578, - "step": 8255 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2635, - "step": 8256 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2352, - "step": 8257 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2442, - "step": 8258 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2546, - "step": 8259 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2561, - "step": 8260 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.257, - "step": 8261 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.241, - "step": 8262 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.238, - "step": 8263 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2385, - "step": 8264 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2637, - "step": 8265 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2252, - "step": 8266 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2612, - "step": 8267 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.252, - "step": 8268 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2429, - "step": 8269 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2434, - "step": 8270 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2526, - "step": 8271 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2473, - "step": 8272 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2591, - "step": 8273 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2699, - "step": 8274 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2821, - "step": 8275 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2648, - "step": 8276 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2612, - "step": 8277 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.267, - "step": 8278 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2552, - "step": 8279 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2499, - "step": 8280 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2522, - "step": 8281 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2541, - "step": 8282 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2543, - "step": 8283 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2397, - "step": 8284 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2524, - "step": 8285 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2553, - "step": 8286 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2403, - "step": 8287 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2397, - "step": 8288 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2516, - "step": 8289 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2407, - "step": 8290 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.259, - "step": 8291 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2584, - "step": 8292 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2577, - "step": 8293 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2574, - "step": 8294 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2559, - "step": 8295 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2352, - "step": 8296 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2424, - "step": 8297 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2447, - "step": 8298 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2792, - "step": 8299 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2527, - "step": 8300 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.251, - "step": 8301 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2476, - "step": 8302 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2423, - "step": 8303 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2459, - "step": 8304 - }, - { - "epoch": 1.02, - "learning_rate": 0.0003, - "loss": 0.2569, - "step": 8305 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2605, - "step": 8306 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2466, - "step": 8307 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2505, - "step": 8308 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2595, - "step": 8309 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2551, - "step": 8310 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2478, - "step": 8311 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.269, - "step": 8312 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2597, - "step": 8313 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2525, - "step": 8314 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2505, - "step": 8315 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2487, - "step": 8316 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2565, - "step": 8317 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2554, - "step": 8318 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.242, - "step": 8319 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2635, - "step": 8320 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2415, - "step": 8321 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2483, - "step": 8322 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2656, - "step": 8323 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2442, - "step": 8324 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2447, - "step": 8325 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2429, - "step": 8326 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2639, - "step": 8327 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2492, - "step": 8328 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2412, - "step": 8329 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.25, - "step": 8330 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2521, - "step": 8331 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2489, - "step": 8332 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2492, - "step": 8333 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.248, - "step": 8334 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2396, - "step": 8335 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2589, - "step": 8336 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2493, - "step": 8337 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2627, - "step": 8338 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2369, - "step": 8339 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2518, - "step": 8340 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2526, - "step": 8341 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2496, - "step": 8342 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2491, - "step": 8343 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2563, - "step": 8344 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.251, - "step": 8345 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2584, - "step": 8346 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2419, - "step": 8347 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2468, - "step": 8348 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2453, - "step": 8349 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2577, - "step": 8350 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2644, - "step": 8351 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.248, - "step": 8352 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2629, - "step": 8353 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2472, - "step": 8354 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.241, - "step": 8355 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2371, - "step": 8356 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2598, - "step": 8357 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2395, - "step": 8358 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2417, - "step": 8359 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2487, - "step": 8360 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2484, - "step": 8361 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2506, - "step": 8362 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2533, - "step": 8363 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2514, - "step": 8364 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2499, - "step": 8365 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2423, - "step": 8366 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2416, - "step": 8367 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2371, - "step": 8368 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2485, - "step": 8369 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2583, - "step": 8370 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2478, - "step": 8371 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.269, - "step": 8372 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2625, - "step": 8373 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2497, - "step": 8374 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2434, - "step": 8375 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2474, - "step": 8376 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2475, - "step": 8377 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2439, - "step": 8378 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.252, - "step": 8379 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2666, - "step": 8380 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2475, - "step": 8381 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.24, - "step": 8382 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2492, - "step": 8383 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2561, - "step": 8384 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2507, - "step": 8385 - }, - { - "epoch": 1.03, - "learning_rate": 0.0003, - "loss": 0.2529, - "step": 8386 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.253, - "step": 8387 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2525, - "step": 8388 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2539, - "step": 8389 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2529, - "step": 8390 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.268, - "step": 8391 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2705, - "step": 8392 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2624, - "step": 8393 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.25, - "step": 8394 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2409, - "step": 8395 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.237, - "step": 8396 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2523, - "step": 8397 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2486, - "step": 8398 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2555, - "step": 8399 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2595, - "step": 8400 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2521, - "step": 8401 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2445, - "step": 8402 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2526, - "step": 8403 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2494, - "step": 8404 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2465, - "step": 8405 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2559, - "step": 8406 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2612, - "step": 8407 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2434, - "step": 8408 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2479, - "step": 8409 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2572, - "step": 8410 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2544, - "step": 8411 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.248, - "step": 8412 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2632, - "step": 8413 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2363, - "step": 8414 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2558, - "step": 8415 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2325, - "step": 8416 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2528, - "step": 8417 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2445, - "step": 8418 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2455, - "step": 8419 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2306, - "step": 8420 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2345, - "step": 8421 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2529, - "step": 8422 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2578, - "step": 8423 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2539, - "step": 8424 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2499, - "step": 8425 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2546, - "step": 8426 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2463, - "step": 8427 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2422, - "step": 8428 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2548, - "step": 8429 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2265, - "step": 8430 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.25, - "step": 8431 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.241, - "step": 8432 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2358, - "step": 8433 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.24, - "step": 8434 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2507, - "step": 8435 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2489, - "step": 8436 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2628, - "step": 8437 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2411, - "step": 8438 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2389, - "step": 8439 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2504, - "step": 8440 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2467, - "step": 8441 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2373, - "step": 8442 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2515, - "step": 8443 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2744, - "step": 8444 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2408, - "step": 8445 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2396, - "step": 8446 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2542, - "step": 8447 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2599, - "step": 8448 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2432, - "step": 8449 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2464, - "step": 8450 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2618, - "step": 8451 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2459, - "step": 8452 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2397, - "step": 8453 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2517, - "step": 8454 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2501, - "step": 8455 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2317, - "step": 8456 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2504, - "step": 8457 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2374, - "step": 8458 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2335, - "step": 8459 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2476, - "step": 8460 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2598, - "step": 8461 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2632, - "step": 8462 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2531, - "step": 8463 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2581, - "step": 8464 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2585, - "step": 8465 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2511, - "step": 8466 - }, - { - "epoch": 1.04, - "learning_rate": 0.0003, - "loss": 0.2557, - "step": 8467 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2337, - "step": 8468 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2607, - "step": 8469 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2431, - "step": 8470 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2588, - "step": 8471 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2539, - "step": 8472 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2465, - "step": 8473 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2577, - "step": 8474 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.253, - "step": 8475 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.249, - "step": 8476 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2508, - "step": 8477 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2405, - "step": 8478 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2575, - "step": 8479 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2642, - "step": 8480 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.248, - "step": 8481 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2538, - "step": 8482 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.255, - "step": 8483 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2493, - "step": 8484 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2631, - "step": 8485 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2432, - "step": 8486 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2416, - "step": 8487 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.25, - "step": 8488 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2418, - "step": 8489 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2766, - "step": 8490 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2599, - "step": 8491 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2424, - "step": 8492 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2402, - "step": 8493 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2449, - "step": 8494 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2371, - "step": 8495 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2492, - "step": 8496 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2511, - "step": 8497 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2447, - "step": 8498 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2414, - "step": 8499 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2496, - "step": 8500 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2565, - "step": 8501 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2632, - "step": 8502 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2485, - "step": 8503 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.256, - "step": 8504 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2595, - "step": 8505 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2671, - "step": 8506 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2605, - "step": 8507 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2467, - "step": 8508 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2623, - "step": 8509 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2219, - "step": 8510 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2535, - "step": 8511 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2411, - "step": 8512 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2607, - "step": 8513 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2592, - "step": 8514 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2504, - "step": 8515 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.235, - "step": 8516 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2266, - "step": 8517 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2624, - "step": 8518 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2385, - "step": 8519 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2668, - "step": 8520 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.26, - "step": 8521 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2609, - "step": 8522 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2372, - "step": 8523 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2402, - "step": 8524 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2477, - "step": 8525 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2529, - "step": 8526 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2493, - "step": 8527 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2378, - "step": 8528 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2446, - "step": 8529 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2452, - "step": 8530 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2662, - "step": 8531 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2484, - "step": 8532 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2407, - "step": 8533 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2377, - "step": 8534 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2492, - "step": 8535 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2747, - "step": 8536 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2506, - "step": 8537 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2371, - "step": 8538 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2352, - "step": 8539 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2647, - "step": 8540 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.26, - "step": 8541 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2287, - "step": 8542 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2579, - "step": 8543 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2349, - "step": 8544 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2389, - "step": 8545 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2447, - "step": 8546 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2467, - "step": 8547 - }, - { - "epoch": 1.05, - "learning_rate": 0.0003, - "loss": 0.2423, - "step": 8548 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2533, - "step": 8549 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2393, - "step": 8550 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2547, - "step": 8551 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2591, - "step": 8552 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2513, - "step": 8553 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2532, - "step": 8554 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2457, - "step": 8555 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.242, - "step": 8556 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2249, - "step": 8557 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2507, - "step": 8558 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2341, - "step": 8559 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2598, - "step": 8560 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2521, - "step": 8561 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2538, - "step": 8562 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.249, - "step": 8563 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2607, - "step": 8564 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2473, - "step": 8565 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2376, - "step": 8566 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2495, - "step": 8567 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2406, - "step": 8568 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2494, - "step": 8569 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2482, - "step": 8570 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2483, - "step": 8571 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2341, - "step": 8572 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2388, - "step": 8573 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.241, - "step": 8574 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2592, - "step": 8575 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2616, - "step": 8576 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2543, - "step": 8577 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2415, - "step": 8578 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2583, - "step": 8579 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2611, - "step": 8580 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2606, - "step": 8581 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.24, - "step": 8582 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2455, - "step": 8583 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.224, - "step": 8584 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2359, - "step": 8585 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2408, - "step": 8586 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2628, - "step": 8587 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2494, - "step": 8588 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2647, - "step": 8589 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2555, - "step": 8590 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2444, - "step": 8591 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2409, - "step": 8592 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2322, - "step": 8593 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2551, - "step": 8594 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2481, - "step": 8595 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2261, - "step": 8596 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2472, - "step": 8597 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2641, - "step": 8598 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2471, - "step": 8599 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2487, - "step": 8600 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2513, - "step": 8601 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2422, - "step": 8602 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2349, - "step": 8603 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2399, - "step": 8604 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2598, - "step": 8605 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2398, - "step": 8606 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2554, - "step": 8607 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2564, - "step": 8608 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2261, - "step": 8609 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2556, - "step": 8610 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2333, - "step": 8611 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2425, - "step": 8612 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2606, - "step": 8613 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2521, - "step": 8614 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2507, - "step": 8615 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2544, - "step": 8616 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.249, - "step": 8617 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2484, - "step": 8618 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2391, - "step": 8619 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2533, - "step": 8620 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.257, - "step": 8621 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2516, - "step": 8622 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2388, - "step": 8623 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2559, - "step": 8624 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2375, - "step": 8625 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2415, - "step": 8626 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2708, - "step": 8627 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.253, - "step": 8628 - }, - { - "epoch": 1.06, - "learning_rate": 0.0003, - "loss": 0.2557, - "step": 8629 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2366, - "step": 8630 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.251, - "step": 8631 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2492, - "step": 8632 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.25, - "step": 8633 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2512, - "step": 8634 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2359, - "step": 8635 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2396, - "step": 8636 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2355, - "step": 8637 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2501, - "step": 8638 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2383, - "step": 8639 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2363, - "step": 8640 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2384, - "step": 8641 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2539, - "step": 8642 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2742, - "step": 8643 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2331, - "step": 8644 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.257, - "step": 8645 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2636, - "step": 8646 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2497, - "step": 8647 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2353, - "step": 8648 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2392, - "step": 8649 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2346, - "step": 8650 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2421, - "step": 8651 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2434, - "step": 8652 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2449, - "step": 8653 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2544, - "step": 8654 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2325, - "step": 8655 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2591, - "step": 8656 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2461, - "step": 8657 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2315, - "step": 8658 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2431, - "step": 8659 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2406, - "step": 8660 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.25, - "step": 8661 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2386, - "step": 8662 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2579, - "step": 8663 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2599, - "step": 8664 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2485, - "step": 8665 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2361, - "step": 8666 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2369, - "step": 8667 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2576, - "step": 8668 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2447, - "step": 8669 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2359, - "step": 8670 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2478, - "step": 8671 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2552, - "step": 8672 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2413, - "step": 8673 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2596, - "step": 8674 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2619, - "step": 8675 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2582, - "step": 8676 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2366, - "step": 8677 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2377, - "step": 8678 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2495, - "step": 8679 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2568, - "step": 8680 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2514, - "step": 8681 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2544, - "step": 8682 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2563, - "step": 8683 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2373, - "step": 8684 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2441, - "step": 8685 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2343, - "step": 8686 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2502, - "step": 8687 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.238, - "step": 8688 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2501, - "step": 8689 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2536, - "step": 8690 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2551, - "step": 8691 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2512, - "step": 8692 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2419, - "step": 8693 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2392, - "step": 8694 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.246, - "step": 8695 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2426, - "step": 8696 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.256, - "step": 8697 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2435, - "step": 8698 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2269, - "step": 8699 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2366, - "step": 8700 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2588, - "step": 8701 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2505, - "step": 8702 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2602, - "step": 8703 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.26, - "step": 8704 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2478, - "step": 8705 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2506, - "step": 8706 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2467, - "step": 8707 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2447, - "step": 8708 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.2476, - "step": 8709 - }, - { - "epoch": 1.07, - "learning_rate": 0.0003, - "loss": 0.266, - "step": 8710 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2425, - "step": 8711 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2532, - "step": 8712 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2534, - "step": 8713 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2456, - "step": 8714 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2538, - "step": 8715 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2523, - "step": 8716 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.248, - "step": 8717 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2308, - "step": 8718 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2438, - "step": 8719 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.252, - "step": 8720 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2399, - "step": 8721 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2574, - "step": 8722 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2532, - "step": 8723 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2525, - "step": 8724 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.247, - "step": 8725 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2616, - "step": 8726 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2491, - "step": 8727 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.25, - "step": 8728 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2491, - "step": 8729 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2534, - "step": 8730 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2444, - "step": 8731 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2433, - "step": 8732 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2325, - "step": 8733 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2466, - "step": 8734 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2336, - "step": 8735 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2387, - "step": 8736 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.243, - "step": 8737 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2553, - "step": 8738 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.242, - "step": 8739 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2611, - "step": 8740 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2475, - "step": 8741 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2612, - "step": 8742 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2504, - "step": 8743 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.251, - "step": 8744 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.253, - "step": 8745 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2561, - "step": 8746 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.245, - "step": 8747 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2422, - "step": 8748 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2667, - "step": 8749 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2322, - "step": 8750 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.263, - "step": 8751 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2489, - "step": 8752 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2523, - "step": 8753 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2361, - "step": 8754 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2578, - "step": 8755 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2403, - "step": 8756 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2345, - "step": 8757 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2409, - "step": 8758 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2544, - "step": 8759 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2502, - "step": 8760 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2535, - "step": 8761 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2463, - "step": 8762 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2483, - "step": 8763 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2359, - "step": 8764 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2432, - "step": 8765 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2369, - "step": 8766 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2457, - "step": 8767 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2445, - "step": 8768 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.245, - "step": 8769 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2359, - "step": 8770 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2383, - "step": 8771 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2445, - "step": 8772 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2377, - "step": 8773 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2486, - "step": 8774 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2569, - "step": 8775 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2496, - "step": 8776 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2485, - "step": 8777 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2366, - "step": 8778 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2418, - "step": 8779 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.231, - "step": 8780 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2398, - "step": 8781 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2436, - "step": 8782 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2428, - "step": 8783 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2557, - "step": 8784 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2575, - "step": 8785 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2476, - "step": 8786 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2483, - "step": 8787 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2393, - "step": 8788 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2504, - "step": 8789 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2452, - "step": 8790 - }, - { - "epoch": 1.08, - "learning_rate": 0.0003, - "loss": 0.2387, - "step": 8791 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.234, - "step": 8792 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2419, - "step": 8793 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2262, - "step": 8794 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2591, - "step": 8795 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2479, - "step": 8796 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2437, - "step": 8797 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2448, - "step": 8798 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2571, - "step": 8799 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2456, - "step": 8800 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2395, - "step": 8801 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2646, - "step": 8802 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2559, - "step": 8803 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2426, - "step": 8804 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2456, - "step": 8805 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2332, - "step": 8806 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2405, - "step": 8807 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2341, - "step": 8808 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2378, - "step": 8809 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2424, - "step": 8810 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2484, - "step": 8811 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2561, - "step": 8812 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2477, - "step": 8813 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2618, - "step": 8814 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2352, - "step": 8815 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.239, - "step": 8816 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2258, - "step": 8817 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2329, - "step": 8818 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2455, - "step": 8819 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2453, - "step": 8820 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2506, - "step": 8821 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2479, - "step": 8822 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2393, - "step": 8823 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2718, - "step": 8824 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2445, - "step": 8825 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2354, - "step": 8826 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2285, - "step": 8827 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2326, - "step": 8828 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2507, - "step": 8829 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2416, - "step": 8830 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2441, - "step": 8831 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2287, - "step": 8832 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2506, - "step": 8833 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2551, - "step": 8834 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2325, - "step": 8835 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2393, - "step": 8836 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2448, - "step": 8837 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2412, - "step": 8838 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2099, - "step": 8839 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2498, - "step": 8840 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2449, - "step": 8841 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2385, - "step": 8842 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2526, - "step": 8843 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2629, - "step": 8844 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2546, - "step": 8845 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.249, - "step": 8846 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2198, - "step": 8847 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2473, - "step": 8848 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2314, - "step": 8849 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2581, - "step": 8850 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.265, - "step": 8851 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2369, - "step": 8852 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2476, - "step": 8853 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2352, - "step": 8854 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2519, - "step": 8855 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2468, - "step": 8856 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2546, - "step": 8857 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2425, - "step": 8858 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2563, - "step": 8859 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2696, - "step": 8860 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2558, - "step": 8861 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2451, - "step": 8862 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2376, - "step": 8863 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2433, - "step": 8864 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.246, - "step": 8865 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2438, - "step": 8866 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2492, - "step": 8867 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.242, - "step": 8868 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.252, - "step": 8869 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2446, - "step": 8870 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2558, - "step": 8871 - }, - { - "epoch": 1.09, - "learning_rate": 0.0003, - "loss": 0.2536, - "step": 8872 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2513, - "step": 8873 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2588, - "step": 8874 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2441, - "step": 8875 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.263, - "step": 8876 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.248, - "step": 8877 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.248, - "step": 8878 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2583, - "step": 8879 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2497, - "step": 8880 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2398, - "step": 8881 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2427, - "step": 8882 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2427, - "step": 8883 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2715, - "step": 8884 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2456, - "step": 8885 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2626, - "step": 8886 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2328, - "step": 8887 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2292, - "step": 8888 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2286, - "step": 8889 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2539, - "step": 8890 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2412, - "step": 8891 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2292, - "step": 8892 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2448, - "step": 8893 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2367, - "step": 8894 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2607, - "step": 8895 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2451, - "step": 8896 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.244, - "step": 8897 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2579, - "step": 8898 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2425, - "step": 8899 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2528, - "step": 8900 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2553, - "step": 8901 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.232, - "step": 8902 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2603, - "step": 8903 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.255, - "step": 8904 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2758, - "step": 8905 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2453, - "step": 8906 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2583, - "step": 8907 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2636, - "step": 8908 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2451, - "step": 8909 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2452, - "step": 8910 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2475, - "step": 8911 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2399, - "step": 8912 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.258, - "step": 8913 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2446, - "step": 8914 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2457, - "step": 8915 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2487, - "step": 8916 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2481, - "step": 8917 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.253, - "step": 8918 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2533, - "step": 8919 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.254, - "step": 8920 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2344, - "step": 8921 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2446, - "step": 8922 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.241, - "step": 8923 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2501, - "step": 8924 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2484, - "step": 8925 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2387, - "step": 8926 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2572, - "step": 8927 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2516, - "step": 8928 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2429, - "step": 8929 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2578, - "step": 8930 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2606, - "step": 8931 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2384, - "step": 8932 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2373, - "step": 8933 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2433, - "step": 8934 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2405, - "step": 8935 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2537, - "step": 8936 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.255, - "step": 8937 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2494, - "step": 8938 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2493, - "step": 8939 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2637, - "step": 8940 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2457, - "step": 8941 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2517, - "step": 8942 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2375, - "step": 8943 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2537, - "step": 8944 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.241, - "step": 8945 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2368, - "step": 8946 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2548, - "step": 8947 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2516, - "step": 8948 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2463, - "step": 8949 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.234, - "step": 8950 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2446, - "step": 8951 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2492, - "step": 8952 - }, - { - "epoch": 1.1, - "learning_rate": 0.0003, - "loss": 0.2334, - "step": 8953 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2378, - "step": 8954 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2588, - "step": 8955 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2314, - "step": 8956 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2627, - "step": 8957 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2499, - "step": 8958 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2581, - "step": 8959 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2498, - "step": 8960 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2478, - "step": 8961 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2425, - "step": 8962 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2577, - "step": 8963 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2441, - "step": 8964 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2368, - "step": 8965 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2428, - "step": 8966 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2625, - "step": 8967 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2444, - "step": 8968 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2317, - "step": 8969 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2346, - "step": 8970 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2428, - "step": 8971 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2423, - "step": 8972 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.249, - "step": 8973 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2528, - "step": 8974 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2436, - "step": 8975 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2502, - "step": 8976 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2499, - "step": 8977 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2467, - "step": 8978 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2532, - "step": 8979 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2475, - "step": 8980 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2542, - "step": 8981 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2585, - "step": 8982 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2398, - "step": 8983 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2439, - "step": 8984 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2389, - "step": 8985 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2444, - "step": 8986 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.249, - "step": 8987 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2447, - "step": 8988 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2492, - "step": 8989 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.248, - "step": 8990 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2385, - "step": 8991 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2381, - "step": 8992 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2486, - "step": 8993 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2617, - "step": 8994 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2329, - "step": 8995 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2484, - "step": 8996 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2479, - "step": 8997 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.238, - "step": 8998 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2278, - "step": 8999 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2276, - "step": 9000 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.259, - "step": 9001 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2576, - "step": 9002 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2569, - "step": 9003 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2343, - "step": 9004 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2408, - "step": 9005 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2461, - "step": 9006 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2405, - "step": 9007 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2389, - "step": 9008 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2426, - "step": 9009 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2528, - "step": 9010 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2345, - "step": 9011 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.237, - "step": 9012 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2298, - "step": 9013 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2474, - "step": 9014 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2396, - "step": 9015 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2463, - "step": 9016 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2471, - "step": 9017 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2525, - "step": 9018 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2589, - "step": 9019 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.254, - "step": 9020 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2551, - "step": 9021 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2453, - "step": 9022 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2407, - "step": 9023 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2311, - "step": 9024 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2373, - "step": 9025 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2554, - "step": 9026 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2417, - "step": 9027 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2441, - "step": 9028 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2403, - "step": 9029 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2545, - "step": 9030 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2291, - "step": 9031 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2427, - "step": 9032 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2517, - "step": 9033 - }, - { - "epoch": 1.11, - "learning_rate": 0.0003, - "loss": 0.2384, - "step": 9034 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2385, - "step": 9035 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2544, - "step": 9036 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2319, - "step": 9037 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2528, - "step": 9038 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2482, - "step": 9039 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2391, - "step": 9040 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2512, - "step": 9041 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2421, - "step": 9042 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2388, - "step": 9043 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.233, - "step": 9044 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2536, - "step": 9045 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2444, - "step": 9046 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2495, - "step": 9047 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2464, - "step": 9048 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2271, - "step": 9049 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2396, - "step": 9050 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2489, - "step": 9051 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.238, - "step": 9052 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2352, - "step": 9053 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2439, - "step": 9054 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2353, - "step": 9055 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2421, - "step": 9056 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.244, - "step": 9057 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2491, - "step": 9058 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2342, - "step": 9059 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2664, - "step": 9060 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2514, - "step": 9061 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2437, - "step": 9062 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2548, - "step": 9063 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2337, - "step": 9064 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2441, - "step": 9065 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2618, - "step": 9066 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2445, - "step": 9067 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2344, - "step": 9068 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2547, - "step": 9069 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2334, - "step": 9070 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2405, - "step": 9071 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2409, - "step": 9072 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2444, - "step": 9073 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.24, - "step": 9074 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2385, - "step": 9075 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2504, - "step": 9076 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2361, - "step": 9077 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2642, - "step": 9078 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2436, - "step": 9079 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2588, - "step": 9080 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2464, - "step": 9081 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2465, - "step": 9082 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2359, - "step": 9083 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2457, - "step": 9084 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2445, - "step": 9085 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2217, - "step": 9086 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2572, - "step": 9087 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2718, - "step": 9088 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2405, - "step": 9089 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2401, - "step": 9090 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2356, - "step": 9091 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2611, - "step": 9092 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2407, - "step": 9093 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2599, - "step": 9094 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2484, - "step": 9095 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2661, - "step": 9096 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.232, - "step": 9097 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2599, - "step": 9098 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2646, - "step": 9099 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2395, - "step": 9100 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2298, - "step": 9101 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2581, - "step": 9102 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2456, - "step": 9103 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2439, - "step": 9104 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.241, - "step": 9105 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2385, - "step": 9106 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2367, - "step": 9107 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2258, - "step": 9108 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2531, - "step": 9109 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2368, - "step": 9110 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2312, - "step": 9111 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2256, - "step": 9112 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2426, - "step": 9113 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2368, - "step": 9114 - }, - { - "epoch": 1.12, - "learning_rate": 0.0003, - "loss": 0.2407, - "step": 9115 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2362, - "step": 9116 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2472, - "step": 9117 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2514, - "step": 9118 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2629, - "step": 9119 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2413, - "step": 9120 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2366, - "step": 9121 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2662, - "step": 9122 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2284, - "step": 9123 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2419, - "step": 9124 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2414, - "step": 9125 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2338, - "step": 9126 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2429, - "step": 9127 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2508, - "step": 9128 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2397, - "step": 9129 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2502, - "step": 9130 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2614, - "step": 9131 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2376, - "step": 9132 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2419, - "step": 9133 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2392, - "step": 9134 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.244, - "step": 9135 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2365, - "step": 9136 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2488, - "step": 9137 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2461, - "step": 9138 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2591, - "step": 9139 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2411, - "step": 9140 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2407, - "step": 9141 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2441, - "step": 9142 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2449, - "step": 9143 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2624, - "step": 9144 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2411, - "step": 9145 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2508, - "step": 9146 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.249, - "step": 9147 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2502, - "step": 9148 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2385, - "step": 9149 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2381, - "step": 9150 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2344, - "step": 9151 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2411, - "step": 9152 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2611, - "step": 9153 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2287, - "step": 9154 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2545, - "step": 9155 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2474, - "step": 9156 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2484, - "step": 9157 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2641, - "step": 9158 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2343, - "step": 9159 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2454, - "step": 9160 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2376, - "step": 9161 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.245, - "step": 9162 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2425, - "step": 9163 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2482, - "step": 9164 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2507, - "step": 9165 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.241, - "step": 9166 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2503, - "step": 9167 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2409, - "step": 9168 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2403, - "step": 9169 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2375, - "step": 9170 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2383, - "step": 9171 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2382, - "step": 9172 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2505, - "step": 9173 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2546, - "step": 9174 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2463, - "step": 9175 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2253, - "step": 9176 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2717, - "step": 9177 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2623, - "step": 9178 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.245, - "step": 9179 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2535, - "step": 9180 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2417, - "step": 9181 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2408, - "step": 9182 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2505, - "step": 9183 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2402, - "step": 9184 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2313, - "step": 9185 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2364, - "step": 9186 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2429, - "step": 9187 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2449, - "step": 9188 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2464, - "step": 9189 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2192, - "step": 9190 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2358, - "step": 9191 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2287, - "step": 9192 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2427, - "step": 9193 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2564, - "step": 9194 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2475, - "step": 9195 - }, - { - "epoch": 1.13, - "learning_rate": 0.0003, - "loss": 0.2334, - "step": 9196 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.239, - "step": 9197 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2398, - "step": 9198 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2394, - "step": 9199 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2514, - "step": 9200 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2541, - "step": 9201 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2444, - "step": 9202 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2408, - "step": 9203 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2355, - "step": 9204 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2442, - "step": 9205 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2422, - "step": 9206 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2384, - "step": 9207 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2488, - "step": 9208 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2426, - "step": 9209 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2391, - "step": 9210 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2326, - "step": 9211 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2498, - "step": 9212 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2324, - "step": 9213 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2378, - "step": 9214 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2377, - "step": 9215 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2273, - "step": 9216 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2436, - "step": 9217 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2366, - "step": 9218 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2544, - "step": 9219 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.246, - "step": 9220 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2437, - "step": 9221 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2487, - "step": 9222 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2342, - "step": 9223 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2308, - "step": 9224 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2424, - "step": 9225 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2546, - "step": 9226 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2424, - "step": 9227 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2303, - "step": 9228 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2334, - "step": 9229 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.259, - "step": 9230 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2466, - "step": 9231 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2577, - "step": 9232 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2584, - "step": 9233 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2315, - "step": 9234 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2344, - "step": 9235 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.234, - "step": 9236 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2677, - "step": 9237 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.255, - "step": 9238 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2487, - "step": 9239 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.249, - "step": 9240 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2312, - "step": 9241 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.245, - "step": 9242 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2687, - "step": 9243 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2549, - "step": 9244 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2414, - "step": 9245 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2498, - "step": 9246 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2373, - "step": 9247 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2423, - "step": 9248 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2341, - "step": 9249 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2327, - "step": 9250 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2466, - "step": 9251 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2396, - "step": 9252 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2548, - "step": 9253 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2499, - "step": 9254 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2631, - "step": 9255 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2437, - "step": 9256 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2363, - "step": 9257 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2543, - "step": 9258 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2451, - "step": 9259 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2484, - "step": 9260 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.256, - "step": 9261 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.24, - "step": 9262 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2474, - "step": 9263 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2321, - "step": 9264 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2424, - "step": 9265 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2407, - "step": 9266 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2397, - "step": 9267 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2471, - "step": 9268 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2495, - "step": 9269 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2453, - "step": 9270 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2439, - "step": 9271 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.237, - "step": 9272 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.258, - "step": 9273 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2395, - "step": 9274 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2546, - "step": 9275 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2628, - "step": 9276 - }, - { - "epoch": 1.14, - "learning_rate": 0.0003, - "loss": 0.2508, - "step": 9277 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2475, - "step": 9278 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2331, - "step": 9279 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2332, - "step": 9280 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2403, - "step": 9281 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2447, - "step": 9282 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2248, - "step": 9283 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2409, - "step": 9284 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2549, - "step": 9285 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2399, - "step": 9286 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.245, - "step": 9287 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2516, - "step": 9288 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2496, - "step": 9289 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2472, - "step": 9290 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.236, - "step": 9291 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2477, - "step": 9292 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2517, - "step": 9293 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2405, - "step": 9294 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2475, - "step": 9295 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2435, - "step": 9296 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.229, - "step": 9297 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2314, - "step": 9298 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2321, - "step": 9299 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2442, - "step": 9300 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2507, - "step": 9301 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2378, - "step": 9302 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2373, - "step": 9303 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2326, - "step": 9304 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2438, - "step": 9305 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2266, - "step": 9306 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2447, - "step": 9307 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2561, - "step": 9308 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2509, - "step": 9309 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2517, - "step": 9310 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.252, - "step": 9311 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2509, - "step": 9312 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2427, - "step": 9313 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.241, - "step": 9314 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2398, - "step": 9315 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2301, - "step": 9316 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2369, - "step": 9317 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2415, - "step": 9318 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2362, - "step": 9319 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2604, - "step": 9320 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2363, - "step": 9321 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2381, - "step": 9322 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2319, - "step": 9323 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2393, - "step": 9324 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2582, - "step": 9325 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.248, - "step": 9326 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2396, - "step": 9327 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2214, - "step": 9328 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2396, - "step": 9329 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2487, - "step": 9330 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2445, - "step": 9331 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2281, - "step": 9332 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2403, - "step": 9333 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2385, - "step": 9334 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2384, - "step": 9335 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2421, - "step": 9336 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2492, - "step": 9337 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2468, - "step": 9338 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2473, - "step": 9339 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2468, - "step": 9340 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2425, - "step": 9341 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.264, - "step": 9342 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2286, - "step": 9343 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2629, - "step": 9344 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2378, - "step": 9345 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2575, - "step": 9346 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2724, - "step": 9347 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2616, - "step": 9348 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2514, - "step": 9349 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2378, - "step": 9350 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2383, - "step": 9351 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2426, - "step": 9352 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2207, - "step": 9353 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2463, - "step": 9354 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2367, - "step": 9355 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2278, - "step": 9356 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.2583, - "step": 9357 - }, - { - "epoch": 1.15, - "learning_rate": 0.0003, - "loss": 0.249, - "step": 9358 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2286, - "step": 9359 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2446, - "step": 9360 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2233, - "step": 9361 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2396, - "step": 9362 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.237, - "step": 9363 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2313, - "step": 9364 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2392, - "step": 9365 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2411, - "step": 9366 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2338, - "step": 9367 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2687, - "step": 9368 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2402, - "step": 9369 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2556, - "step": 9370 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2608, - "step": 9371 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2388, - "step": 9372 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2377, - "step": 9373 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2503, - "step": 9374 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2517, - "step": 9375 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2487, - "step": 9376 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2463, - "step": 9377 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2588, - "step": 9378 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2315, - "step": 9379 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.244, - "step": 9380 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2305, - "step": 9381 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2357, - "step": 9382 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2385, - "step": 9383 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2507, - "step": 9384 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2614, - "step": 9385 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2671, - "step": 9386 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2194, - "step": 9387 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2525, - "step": 9388 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2325, - "step": 9389 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2427, - "step": 9390 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.244, - "step": 9391 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2469, - "step": 9392 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2269, - "step": 9393 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2387, - "step": 9394 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2402, - "step": 9395 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2256, - "step": 9396 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2583, - "step": 9397 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2518, - "step": 9398 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2441, - "step": 9399 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2317, - "step": 9400 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.247, - "step": 9401 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2497, - "step": 9402 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2347, - "step": 9403 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2353, - "step": 9404 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2462, - "step": 9405 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2477, - "step": 9406 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2593, - "step": 9407 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2544, - "step": 9408 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2382, - "step": 9409 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2426, - "step": 9410 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2593, - "step": 9411 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2418, - "step": 9412 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2328, - "step": 9413 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2364, - "step": 9414 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2287, - "step": 9415 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2328, - "step": 9416 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2476, - "step": 9417 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2327, - "step": 9418 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2227, - "step": 9419 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2498, - "step": 9420 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2536, - "step": 9421 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2374, - "step": 9422 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2352, - "step": 9423 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2477, - "step": 9424 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.248, - "step": 9425 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2268, - "step": 9426 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2537, - "step": 9427 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2323, - "step": 9428 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2359, - "step": 9429 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2394, - "step": 9430 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2427, - "step": 9431 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2723, - "step": 9432 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2489, - "step": 9433 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.241, - "step": 9434 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2514, - "step": 9435 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2259, - "step": 9436 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2493, - "step": 9437 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2462, - "step": 9438 - }, - { - "epoch": 1.16, - "learning_rate": 0.0003, - "loss": 0.2348, - "step": 9439 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2349, - "step": 9440 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2343, - "step": 9441 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2427, - "step": 9442 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2379, - "step": 9443 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2316, - "step": 9444 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2456, - "step": 9445 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2448, - "step": 9446 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2497, - "step": 9447 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2295, - "step": 9448 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2426, - "step": 9449 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2317, - "step": 9450 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2369, - "step": 9451 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2452, - "step": 9452 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2442, - "step": 9453 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2364, - "step": 9454 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.253, - "step": 9455 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2396, - "step": 9456 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2394, - "step": 9457 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2417, - "step": 9458 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2355, - "step": 9459 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.26, - "step": 9460 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2422, - "step": 9461 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2334, - "step": 9462 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2442, - "step": 9463 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2472, - "step": 9464 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2368, - "step": 9465 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2482, - "step": 9466 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2499, - "step": 9467 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2319, - "step": 9468 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2287, - "step": 9469 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2566, - "step": 9470 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2549, - "step": 9471 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2304, - "step": 9472 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2292, - "step": 9473 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2505, - "step": 9474 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2422, - "step": 9475 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2526, - "step": 9476 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2307, - "step": 9477 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2539, - "step": 9478 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2456, - "step": 9479 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2637, - "step": 9480 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2358, - "step": 9481 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2425, - "step": 9482 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2355, - "step": 9483 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2388, - "step": 9484 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2427, - "step": 9485 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2471, - "step": 9486 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2474, - "step": 9487 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2383, - "step": 9488 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2328, - "step": 9489 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2396, - "step": 9490 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2425, - "step": 9491 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2508, - "step": 9492 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2228, - "step": 9493 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2485, - "step": 9494 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2262, - "step": 9495 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2463, - "step": 9496 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2363, - "step": 9497 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2254, - "step": 9498 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2466, - "step": 9499 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.252, - "step": 9500 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2182, - "step": 9501 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2399, - "step": 9502 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.24, - "step": 9503 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2386, - "step": 9504 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2471, - "step": 9505 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.238, - "step": 9506 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.242, - "step": 9507 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2344, - "step": 9508 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2493, - "step": 9509 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2486, - "step": 9510 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2351, - "step": 9511 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2306, - "step": 9512 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2427, - "step": 9513 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2447, - "step": 9514 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2227, - "step": 9515 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.245, - "step": 9516 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2629, - "step": 9517 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2333, - "step": 9518 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2411, - "step": 9519 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.2354, - "step": 9520 - }, - { - "epoch": 1.17, - "learning_rate": 0.0003, - "loss": 0.231, - "step": 9521 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.23, - "step": 9522 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2332, - "step": 9523 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.234, - "step": 9524 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2326, - "step": 9525 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2407, - "step": 9526 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2473, - "step": 9527 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2423, - "step": 9528 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2499, - "step": 9529 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2511, - "step": 9530 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2544, - "step": 9531 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2418, - "step": 9532 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2394, - "step": 9533 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2331, - "step": 9534 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2505, - "step": 9535 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2443, - "step": 9536 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2542, - "step": 9537 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2502, - "step": 9538 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.235, - "step": 9539 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2281, - "step": 9540 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2499, - "step": 9541 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2377, - "step": 9542 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.261, - "step": 9543 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2283, - "step": 9544 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2457, - "step": 9545 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2469, - "step": 9546 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2531, - "step": 9547 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.241, - "step": 9548 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2257, - "step": 9549 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2447, - "step": 9550 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2429, - "step": 9551 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2367, - "step": 9552 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2311, - "step": 9553 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2201, - "step": 9554 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2517, - "step": 9555 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2273, - "step": 9556 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2299, - "step": 9557 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2351, - "step": 9558 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2387, - "step": 9559 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2353, - "step": 9560 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2516, - "step": 9561 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2464, - "step": 9562 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2347, - "step": 9563 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2431, - "step": 9564 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2572, - "step": 9565 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.244, - "step": 9566 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2321, - "step": 9567 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.238, - "step": 9568 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2432, - "step": 9569 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.252, - "step": 9570 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2535, - "step": 9571 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2275, - "step": 9572 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2482, - "step": 9573 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2305, - "step": 9574 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.236, - "step": 9575 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2235, - "step": 9576 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2327, - "step": 9577 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2419, - "step": 9578 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2441, - "step": 9579 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2498, - "step": 9580 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2433, - "step": 9581 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2444, - "step": 9582 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2454, - "step": 9583 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2501, - "step": 9584 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2239, - "step": 9585 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2562, - "step": 9586 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2274, - "step": 9587 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2571, - "step": 9588 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2413, - "step": 9589 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2267, - "step": 9590 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2239, - "step": 9591 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2407, - "step": 9592 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.237, - "step": 9593 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2351, - "step": 9594 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2359, - "step": 9595 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2444, - "step": 9596 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.251, - "step": 9597 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2529, - "step": 9598 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.239, - "step": 9599 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2357, - "step": 9600 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2531, - "step": 9601 - }, - { - "epoch": 1.18, - "learning_rate": 0.0003, - "loss": 0.2528, - "step": 9602 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2492, - "step": 9603 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2414, - "step": 9604 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2207, - "step": 9605 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.256, - "step": 9606 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2416, - "step": 9607 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2284, - "step": 9608 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2149, - "step": 9609 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2521, - "step": 9610 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2479, - "step": 9611 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2292, - "step": 9612 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2467, - "step": 9613 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2558, - "step": 9614 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2438, - "step": 9615 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2329, - "step": 9616 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2365, - "step": 9617 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2362, - "step": 9618 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2467, - "step": 9619 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.246, - "step": 9620 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.247, - "step": 9621 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2459, - "step": 9622 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2491, - "step": 9623 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2229, - "step": 9624 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2304, - "step": 9625 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2495, - "step": 9626 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2549, - "step": 9627 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.262, - "step": 9628 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2469, - "step": 9629 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2542, - "step": 9630 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2337, - "step": 9631 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2592, - "step": 9632 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.238, - "step": 9633 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2587, - "step": 9634 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2465, - "step": 9635 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2327, - "step": 9636 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2382, - "step": 9637 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2249, - "step": 9638 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2232, - "step": 9639 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2454, - "step": 9640 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2402, - "step": 9641 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2539, - "step": 9642 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2369, - "step": 9643 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2568, - "step": 9644 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2359, - "step": 9645 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2349, - "step": 9646 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2311, - "step": 9647 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2373, - "step": 9648 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2423, - "step": 9649 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2408, - "step": 9650 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2406, - "step": 9651 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2515, - "step": 9652 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2402, - "step": 9653 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2366, - "step": 9654 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2344, - "step": 9655 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2459, - "step": 9656 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2362, - "step": 9657 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2413, - "step": 9658 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2425, - "step": 9659 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2368, - "step": 9660 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2375, - "step": 9661 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2472, - "step": 9662 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.24, - "step": 9663 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2385, - "step": 9664 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2363, - "step": 9665 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2493, - "step": 9666 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2421, - "step": 9667 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2629, - "step": 9668 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2465, - "step": 9669 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2462, - "step": 9670 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.247, - "step": 9671 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2635, - "step": 9672 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2545, - "step": 9673 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2348, - "step": 9674 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2409, - "step": 9675 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2369, - "step": 9676 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2362, - "step": 9677 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2238, - "step": 9678 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2343, - "step": 9679 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2369, - "step": 9680 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2367, - "step": 9681 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2504, - "step": 9682 - }, - { - "epoch": 1.19, - "learning_rate": 0.0003, - "loss": 0.2403, - "step": 9683 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2358, - "step": 9684 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2135, - "step": 9685 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2263, - "step": 9686 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.227, - "step": 9687 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2275, - "step": 9688 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2403, - "step": 9689 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2581, - "step": 9690 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2462, - "step": 9691 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2351, - "step": 9692 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2414, - "step": 9693 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2439, - "step": 9694 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2369, - "step": 9695 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.241, - "step": 9696 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2422, - "step": 9697 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2332, - "step": 9698 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2406, - "step": 9699 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.238, - "step": 9700 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2527, - "step": 9701 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2441, - "step": 9702 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2488, - "step": 9703 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.233, - "step": 9704 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2415, - "step": 9705 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2428, - "step": 9706 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2295, - "step": 9707 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2477, - "step": 9708 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2485, - "step": 9709 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2332, - "step": 9710 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2476, - "step": 9711 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2383, - "step": 9712 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2377, - "step": 9713 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2378, - "step": 9714 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.242, - "step": 9715 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2232, - "step": 9716 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2325, - "step": 9717 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.236, - "step": 9718 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2338, - "step": 9719 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2351, - "step": 9720 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.247, - "step": 9721 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2398, - "step": 9722 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2432, - "step": 9723 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2411, - "step": 9724 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2376, - "step": 9725 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2372, - "step": 9726 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2311, - "step": 9727 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2392, - "step": 9728 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2473, - "step": 9729 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2451, - "step": 9730 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.247, - "step": 9731 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.247, - "step": 9732 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2497, - "step": 9733 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2281, - "step": 9734 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2432, - "step": 9735 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2361, - "step": 9736 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.248, - "step": 9737 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.259, - "step": 9738 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2309, - "step": 9739 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2538, - "step": 9740 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2344, - "step": 9741 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2371, - "step": 9742 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2362, - "step": 9743 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2454, - "step": 9744 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2377, - "step": 9745 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2511, - "step": 9746 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2402, - "step": 9747 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2379, - "step": 9748 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2403, - "step": 9749 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2453, - "step": 9750 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2374, - "step": 9751 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2471, - "step": 9752 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2517, - "step": 9753 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2336, - "step": 9754 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2414, - "step": 9755 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2342, - "step": 9756 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2399, - "step": 9757 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2481, - "step": 9758 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2226, - "step": 9759 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2501, - "step": 9760 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2383, - "step": 9761 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2455, - "step": 9762 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2588, - "step": 9763 - }, - { - "epoch": 1.2, - "learning_rate": 0.0003, - "loss": 0.2369, - "step": 9764 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2375, - "step": 9765 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2311, - "step": 9766 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2492, - "step": 9767 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2459, - "step": 9768 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.234, - "step": 9769 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2307, - "step": 9770 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2292, - "step": 9771 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2579, - "step": 9772 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.225, - "step": 9773 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2738, - "step": 9774 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2331, - "step": 9775 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2289, - "step": 9776 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.228, - "step": 9777 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2331, - "step": 9778 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2446, - "step": 9779 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2302, - "step": 9780 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2419, - "step": 9781 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2338, - "step": 9782 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2335, - "step": 9783 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2403, - "step": 9784 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2558, - "step": 9785 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2429, - "step": 9786 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2434, - "step": 9787 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2332, - "step": 9788 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2411, - "step": 9789 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2587, - "step": 9790 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2364, - "step": 9791 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.258, - "step": 9792 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2389, - "step": 9793 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2544, - "step": 9794 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2426, - "step": 9795 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.243, - "step": 9796 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2478, - "step": 9797 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2494, - "step": 9798 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2577, - "step": 9799 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.249, - "step": 9800 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2359, - "step": 9801 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2391, - "step": 9802 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2293, - "step": 9803 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2298, - "step": 9804 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2302, - "step": 9805 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2461, - "step": 9806 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2451, - "step": 9807 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2454, - "step": 9808 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2308, - "step": 9809 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2346, - "step": 9810 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.244, - "step": 9811 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2348, - "step": 9812 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2313, - "step": 9813 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2413, - "step": 9814 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2368, - "step": 9815 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2392, - "step": 9816 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2461, - "step": 9817 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2431, - "step": 9818 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2598, - "step": 9819 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2326, - "step": 9820 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2308, - "step": 9821 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2399, - "step": 9822 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2369, - "step": 9823 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2476, - "step": 9824 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2424, - "step": 9825 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2457, - "step": 9826 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2531, - "step": 9827 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2479, - "step": 9828 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.243, - "step": 9829 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2458, - "step": 9830 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2221, - "step": 9831 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2445, - "step": 9832 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2349, - "step": 9833 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2326, - "step": 9834 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2377, - "step": 9835 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2619, - "step": 9836 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2445, - "step": 9837 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.246, - "step": 9838 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2503, - "step": 9839 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2321, - "step": 9840 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2459, - "step": 9841 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2407, - "step": 9842 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2542, - "step": 9843 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2362, - "step": 9844 - }, - { - "epoch": 1.21, - "learning_rate": 0.0003, - "loss": 0.2323, - "step": 9845 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.221, - "step": 9846 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2223, - "step": 9847 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2434, - "step": 9848 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2597, - "step": 9849 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2285, - "step": 9850 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2328, - "step": 9851 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2534, - "step": 9852 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2511, - "step": 9853 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2588, - "step": 9854 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2313, - "step": 9855 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2645, - "step": 9856 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2407, - "step": 9857 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2369, - "step": 9858 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.244, - "step": 9859 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2357, - "step": 9860 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2535, - "step": 9861 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2276, - "step": 9862 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2374, - "step": 9863 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2192, - "step": 9864 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2327, - "step": 9865 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2423, - "step": 9866 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2383, - "step": 9867 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.247, - "step": 9868 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.234, - "step": 9869 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2456, - "step": 9870 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2419, - "step": 9871 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2231, - "step": 9872 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2371, - "step": 9873 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2355, - "step": 9874 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2258, - "step": 9875 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2476, - "step": 9876 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.241, - "step": 9877 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2455, - "step": 9878 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2441, - "step": 9879 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2361, - "step": 9880 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2625, - "step": 9881 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2419, - "step": 9882 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2488, - "step": 9883 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2579, - "step": 9884 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2549, - "step": 9885 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2419, - "step": 9886 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2296, - "step": 9887 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2449, - "step": 9888 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2362, - "step": 9889 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.239, - "step": 9890 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2324, - "step": 9891 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2289, - "step": 9892 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2159, - "step": 9893 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2453, - "step": 9894 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2461, - "step": 9895 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2403, - "step": 9896 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2451, - "step": 9897 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2427, - "step": 9898 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2421, - "step": 9899 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2386, - "step": 9900 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2326, - "step": 9901 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2324, - "step": 9902 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2493, - "step": 9903 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2337, - "step": 9904 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2505, - "step": 9905 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.236, - "step": 9906 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2271, - "step": 9907 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2392, - "step": 9908 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2299, - "step": 9909 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2376, - "step": 9910 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2315, - "step": 9911 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2296, - "step": 9912 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2472, - "step": 9913 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2245, - "step": 9914 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2383, - "step": 9915 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2403, - "step": 9916 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.247, - "step": 9917 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2378, - "step": 9918 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2475, - "step": 9919 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.245, - "step": 9920 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2275, - "step": 9921 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2538, - "step": 9922 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2297, - "step": 9923 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2426, - "step": 9924 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2573, - "step": 9925 - }, - { - "epoch": 1.22, - "learning_rate": 0.0003, - "loss": 0.2248, - "step": 9926 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2416, - "step": 9927 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2287, - "step": 9928 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2454, - "step": 9929 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2371, - "step": 9930 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2479, - "step": 9931 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2363, - "step": 9932 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2533, - "step": 9933 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2324, - "step": 9934 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2526, - "step": 9935 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2366, - "step": 9936 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2315, - "step": 9937 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2459, - "step": 9938 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2303, - "step": 9939 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2414, - "step": 9940 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2274, - "step": 9941 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2463, - "step": 9942 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2549, - "step": 9943 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2342, - "step": 9944 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2323, - "step": 9945 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2421, - "step": 9946 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2524, - "step": 9947 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2299, - "step": 9948 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2357, - "step": 9949 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2258, - "step": 9950 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.235, - "step": 9951 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.244, - "step": 9952 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2483, - "step": 9953 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2448, - "step": 9954 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2249, - "step": 9955 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2407, - "step": 9956 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2366, - "step": 9957 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2679, - "step": 9958 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2438, - "step": 9959 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.235, - "step": 9960 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2361, - "step": 9961 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2455, - "step": 9962 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2231, - "step": 9963 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2399, - "step": 9964 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2316, - "step": 9965 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2338, - "step": 9966 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2371, - "step": 9967 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2447, - "step": 9968 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2499, - "step": 9969 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2428, - "step": 9970 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2429, - "step": 9971 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.234, - "step": 9972 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.259, - "step": 9973 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2448, - "step": 9974 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2414, - "step": 9975 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2334, - "step": 9976 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2403, - "step": 9977 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2394, - "step": 9978 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2163, - "step": 9979 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2384, - "step": 9980 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2507, - "step": 9981 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2452, - "step": 9982 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2319, - "step": 9983 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.236, - "step": 9984 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2405, - "step": 9985 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2462, - "step": 9986 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2676, - "step": 9987 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2538, - "step": 9988 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2537, - "step": 9989 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2307, - "step": 9990 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2494, - "step": 9991 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2583, - "step": 9992 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2376, - "step": 9993 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2449, - "step": 9994 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2421, - "step": 9995 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2447, - "step": 9996 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2354, - "step": 9997 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2478, - "step": 9998 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2596, - "step": 9999 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2482, - "step": 10000 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2148, - "step": 10001 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2534, - "step": 10002 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2387, - "step": 10003 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2455, - "step": 10004 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2543, - "step": 10005 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2322, - "step": 10006 - }, - { - "epoch": 1.23, - "learning_rate": 0.0003, - "loss": 0.2364, - "step": 10007 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2473, - "step": 10008 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2492, - "step": 10009 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2331, - "step": 10010 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2372, - "step": 10011 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2405, - "step": 10012 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.241, - "step": 10013 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2413, - "step": 10014 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2502, - "step": 10015 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2454, - "step": 10016 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2279, - "step": 10017 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2369, - "step": 10018 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2517, - "step": 10019 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2369, - "step": 10020 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2471, - "step": 10021 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2433, - "step": 10022 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2495, - "step": 10023 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2342, - "step": 10024 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2348, - "step": 10025 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2092, - "step": 10026 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2455, - "step": 10027 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2379, - "step": 10028 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2377, - "step": 10029 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2272, - "step": 10030 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2382, - "step": 10031 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.258, - "step": 10032 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2433, - "step": 10033 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.235, - "step": 10034 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2323, - "step": 10035 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2558, - "step": 10036 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2348, - "step": 10037 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2318, - "step": 10038 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2504, - "step": 10039 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2374, - "step": 10040 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.234, - "step": 10041 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2483, - "step": 10042 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2542, - "step": 10043 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2484, - "step": 10044 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2228, - "step": 10045 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2309, - "step": 10046 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2381, - "step": 10047 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2381, - "step": 10048 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2353, - "step": 10049 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2201, - "step": 10050 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2501, - "step": 10051 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2461, - "step": 10052 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2397, - "step": 10053 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2377, - "step": 10054 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2369, - "step": 10055 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2498, - "step": 10056 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2284, - "step": 10057 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2303, - "step": 10058 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2455, - "step": 10059 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2355, - "step": 10060 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2279, - "step": 10061 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.238, - "step": 10062 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2327, - "step": 10063 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2313, - "step": 10064 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2386, - "step": 10065 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2437, - "step": 10066 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2371, - "step": 10067 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2319, - "step": 10068 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2356, - "step": 10069 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2404, - "step": 10070 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2226, - "step": 10071 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2268, - "step": 10072 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2575, - "step": 10073 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2258, - "step": 10074 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2229, - "step": 10075 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2223, - "step": 10076 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2493, - "step": 10077 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.23, - "step": 10078 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2392, - "step": 10079 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2246, - "step": 10080 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2421, - "step": 10081 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2508, - "step": 10082 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2498, - "step": 10083 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2269, - "step": 10084 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2402, - "step": 10085 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2264, - "step": 10086 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2432, - "step": 10087 - }, - { - "epoch": 1.24, - "learning_rate": 0.0003, - "loss": 0.2385, - "step": 10088 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2409, - "step": 10089 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2441, - "step": 10090 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2324, - "step": 10091 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2537, - "step": 10092 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2349, - "step": 10093 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2254, - "step": 10094 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2379, - "step": 10095 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2209, - "step": 10096 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2469, - "step": 10097 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2335, - "step": 10098 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2378, - "step": 10099 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2451, - "step": 10100 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2199, - "step": 10101 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2357, - "step": 10102 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.246, - "step": 10103 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.24, - "step": 10104 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2452, - "step": 10105 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2437, - "step": 10106 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2366, - "step": 10107 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2361, - "step": 10108 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.251, - "step": 10109 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.238, - "step": 10110 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2416, - "step": 10111 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2517, - "step": 10112 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.241, - "step": 10113 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2399, - "step": 10114 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2361, - "step": 10115 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2259, - "step": 10116 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2454, - "step": 10117 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2351, - "step": 10118 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.247, - "step": 10119 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2293, - "step": 10120 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2394, - "step": 10121 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2325, - "step": 10122 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.226, - "step": 10123 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2382, - "step": 10124 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2332, - "step": 10125 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2391, - "step": 10126 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2289, - "step": 10127 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2406, - "step": 10128 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2399, - "step": 10129 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2532, - "step": 10130 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.236, - "step": 10131 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2294, - "step": 10132 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2449, - "step": 10133 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2432, - "step": 10134 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2493, - "step": 10135 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.239, - "step": 10136 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2242, - "step": 10137 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2348, - "step": 10138 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2364, - "step": 10139 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.235, - "step": 10140 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2556, - "step": 10141 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2293, - "step": 10142 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2218, - "step": 10143 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2589, - "step": 10144 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2464, - "step": 10145 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2488, - "step": 10146 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2399, - "step": 10147 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2369, - "step": 10148 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2346, - "step": 10149 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2348, - "step": 10150 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2324, - "step": 10151 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2372, - "step": 10152 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2317, - "step": 10153 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2377, - "step": 10154 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.238, - "step": 10155 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.25, - "step": 10156 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2265, - "step": 10157 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2386, - "step": 10158 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2448, - "step": 10159 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2197, - "step": 10160 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2267, - "step": 10161 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2478, - "step": 10162 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2528, - "step": 10163 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.222, - "step": 10164 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2469, - "step": 10165 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2401, - "step": 10166 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2518, - "step": 10167 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2315, - "step": 10168 - }, - { - "epoch": 1.25, - "learning_rate": 0.0003, - "loss": 0.2463, - "step": 10169 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2436, - "step": 10170 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2257, - "step": 10171 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2292, - "step": 10172 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2414, - "step": 10173 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2355, - "step": 10174 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2428, - "step": 10175 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2344, - "step": 10176 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2415, - "step": 10177 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2435, - "step": 10178 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2538, - "step": 10179 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2529, - "step": 10180 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.233, - "step": 10181 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2349, - "step": 10182 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2382, - "step": 10183 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2397, - "step": 10184 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2367, - "step": 10185 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2411, - "step": 10186 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2351, - "step": 10187 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2299, - "step": 10188 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2389, - "step": 10189 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2364, - "step": 10190 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2379, - "step": 10191 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2527, - "step": 10192 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2385, - "step": 10193 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.229, - "step": 10194 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2266, - "step": 10195 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2396, - "step": 10196 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2265, - "step": 10197 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2308, - "step": 10198 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.236, - "step": 10199 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.238, - "step": 10200 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2436, - "step": 10201 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2617, - "step": 10202 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2407, - "step": 10203 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2441, - "step": 10204 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2234, - "step": 10205 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2241, - "step": 10206 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2468, - "step": 10207 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2399, - "step": 10208 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2345, - "step": 10209 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2353, - "step": 10210 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2346, - "step": 10211 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2458, - "step": 10212 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.222, - "step": 10213 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2299, - "step": 10214 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2377, - "step": 10215 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2448, - "step": 10216 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2329, - "step": 10217 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2423, - "step": 10218 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2386, - "step": 10219 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2535, - "step": 10220 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2433, - "step": 10221 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2317, - "step": 10222 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2398, - "step": 10223 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.233, - "step": 10224 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2377, - "step": 10225 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2175, - "step": 10226 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.242, - "step": 10227 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2273, - "step": 10228 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2288, - "step": 10229 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2357, - "step": 10230 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2275, - "step": 10231 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2257, - "step": 10232 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2411, - "step": 10233 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2321, - "step": 10234 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2379, - "step": 10235 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2263, - "step": 10236 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2313, - "step": 10237 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2421, - "step": 10238 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.238, - "step": 10239 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2575, - "step": 10240 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2422, - "step": 10241 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.224, - "step": 10242 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2448, - "step": 10243 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2564, - "step": 10244 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2415, - "step": 10245 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2538, - "step": 10246 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2312, - "step": 10247 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2227, - "step": 10248 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2139, - "step": 10249 - }, - { - "epoch": 1.26, - "learning_rate": 0.0003, - "loss": 0.2482, - "step": 10250 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2258, - "step": 10251 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2344, - "step": 10252 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2352, - "step": 10253 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2407, - "step": 10254 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2381, - "step": 10255 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2312, - "step": 10256 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2367, - "step": 10257 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2269, - "step": 10258 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2353, - "step": 10259 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2278, - "step": 10260 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2407, - "step": 10261 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.218, - "step": 10262 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2399, - "step": 10263 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.222, - "step": 10264 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2349, - "step": 10265 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2437, - "step": 10266 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2223, - "step": 10267 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2161, - "step": 10268 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2457, - "step": 10269 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2331, - "step": 10270 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2401, - "step": 10271 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2529, - "step": 10272 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2315, - "step": 10273 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2514, - "step": 10274 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2416, - "step": 10275 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2364, - "step": 10276 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.236, - "step": 10277 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2271, - "step": 10278 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2414, - "step": 10279 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2262, - "step": 10280 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.234, - "step": 10281 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2274, - "step": 10282 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2323, - "step": 10283 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.253, - "step": 10284 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2187, - "step": 10285 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2444, - "step": 10286 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2378, - "step": 10287 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2355, - "step": 10288 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2432, - "step": 10289 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2276, - "step": 10290 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2434, - "step": 10291 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2433, - "step": 10292 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2411, - "step": 10293 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.244, - "step": 10294 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2306, - "step": 10295 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2426, - "step": 10296 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2312, - "step": 10297 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.246, - "step": 10298 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2295, - "step": 10299 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2411, - "step": 10300 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2316, - "step": 10301 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2239, - "step": 10302 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2436, - "step": 10303 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2389, - "step": 10304 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2403, - "step": 10305 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2341, - "step": 10306 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2443, - "step": 10307 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2419, - "step": 10308 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2417, - "step": 10309 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2447, - "step": 10310 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2457, - "step": 10311 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2394, - "step": 10312 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2319, - "step": 10313 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2297, - "step": 10314 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2362, - "step": 10315 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2352, - "step": 10316 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2466, - "step": 10317 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2453, - "step": 10318 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2403, - "step": 10319 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2321, - "step": 10320 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2396, - "step": 10321 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2293, - "step": 10322 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2331, - "step": 10323 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2328, - "step": 10324 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2482, - "step": 10325 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2261, - "step": 10326 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2321, - "step": 10327 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2249, - "step": 10328 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2345, - "step": 10329 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2324, - "step": 10330 - }, - { - "epoch": 1.27, - "learning_rate": 0.0003, - "loss": 0.2519, - "step": 10331 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2421, - "step": 10332 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2309, - "step": 10333 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2458, - "step": 10334 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2346, - "step": 10335 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2437, - "step": 10336 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2405, - "step": 10337 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2231, - "step": 10338 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.213, - "step": 10339 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2372, - "step": 10340 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2322, - "step": 10341 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2632, - "step": 10342 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2362, - "step": 10343 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2363, - "step": 10344 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2485, - "step": 10345 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2402, - "step": 10346 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2286, - "step": 10347 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.252, - "step": 10348 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2511, - "step": 10349 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2365, - "step": 10350 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2374, - "step": 10351 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2436, - "step": 10352 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2268, - "step": 10353 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2329, - "step": 10354 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2393, - "step": 10355 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2428, - "step": 10356 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2306, - "step": 10357 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2312, - "step": 10358 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2447, - "step": 10359 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2331, - "step": 10360 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2194, - "step": 10361 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2343, - "step": 10362 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2353, - "step": 10363 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2359, - "step": 10364 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2291, - "step": 10365 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.24, - "step": 10366 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2107, - "step": 10367 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2301, - "step": 10368 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.239, - "step": 10369 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2371, - "step": 10370 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2409, - "step": 10371 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2386, - "step": 10372 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.235, - "step": 10373 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2387, - "step": 10374 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2377, - "step": 10375 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2611, - "step": 10376 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.243, - "step": 10377 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.239, - "step": 10378 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.235, - "step": 10379 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2331, - "step": 10380 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2271, - "step": 10381 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2437, - "step": 10382 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.26, - "step": 10383 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2508, - "step": 10384 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2541, - "step": 10385 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2459, - "step": 10386 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2473, - "step": 10387 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2337, - "step": 10388 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.23, - "step": 10389 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2366, - "step": 10390 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2426, - "step": 10391 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2166, - "step": 10392 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2373, - "step": 10393 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2342, - "step": 10394 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2485, - "step": 10395 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2454, - "step": 10396 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.219, - "step": 10397 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2422, - "step": 10398 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2325, - "step": 10399 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.251, - "step": 10400 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2517, - "step": 10401 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2343, - "step": 10402 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2382, - "step": 10403 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2383, - "step": 10404 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2173, - "step": 10405 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2156, - "step": 10406 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2335, - "step": 10407 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2433, - "step": 10408 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.238, - "step": 10409 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2361, - "step": 10410 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2339, - "step": 10411 - }, - { - "epoch": 1.28, - "learning_rate": 0.0003, - "loss": 0.2462, - "step": 10412 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2313, - "step": 10413 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2428, - "step": 10414 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2371, - "step": 10415 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2445, - "step": 10416 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2386, - "step": 10417 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2322, - "step": 10418 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2308, - "step": 10419 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2264, - "step": 10420 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.222, - "step": 10421 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2451, - "step": 10422 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2272, - "step": 10423 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.241, - "step": 10424 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2439, - "step": 10425 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.238, - "step": 10426 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2497, - "step": 10427 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2432, - "step": 10428 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2394, - "step": 10429 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2372, - "step": 10430 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2391, - "step": 10431 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.235, - "step": 10432 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2509, - "step": 10433 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.241, - "step": 10434 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2263, - "step": 10435 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2339, - "step": 10436 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2383, - "step": 10437 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2389, - "step": 10438 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2347, - "step": 10439 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2455, - "step": 10440 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2453, - "step": 10441 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2525, - "step": 10442 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2219, - "step": 10443 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2321, - "step": 10444 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2343, - "step": 10445 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2388, - "step": 10446 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2356, - "step": 10447 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2343, - "step": 10448 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2434, - "step": 10449 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2295, - "step": 10450 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2457, - "step": 10451 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2222, - "step": 10452 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2408, - "step": 10453 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2297, - "step": 10454 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2295, - "step": 10455 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2457, - "step": 10456 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2439, - "step": 10457 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2344, - "step": 10458 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2483, - "step": 10459 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2461, - "step": 10460 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2246, - "step": 10461 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2392, - "step": 10462 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2207, - "step": 10463 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.241, - "step": 10464 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2211, - "step": 10465 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2418, - "step": 10466 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2244, - "step": 10467 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2303, - "step": 10468 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2391, - "step": 10469 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2398, - "step": 10470 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2608, - "step": 10471 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2261, - "step": 10472 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2369, - "step": 10473 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2252, - "step": 10474 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2455, - "step": 10475 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2262, - "step": 10476 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2291, - "step": 10477 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2629, - "step": 10478 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.238, - "step": 10479 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2371, - "step": 10480 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2446, - "step": 10481 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2431, - "step": 10482 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2337, - "step": 10483 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2425, - "step": 10484 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2444, - "step": 10485 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2293, - "step": 10486 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.241, - "step": 10487 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2393, - "step": 10488 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2384, - "step": 10489 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2219, - "step": 10490 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2423, - "step": 10491 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2258, - "step": 10492 - }, - { - "epoch": 1.29, - "learning_rate": 0.0003, - "loss": 0.2365, - "step": 10493 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2223, - "step": 10494 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2401, - "step": 10495 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2411, - "step": 10496 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2269, - "step": 10497 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2362, - "step": 10498 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2413, - "step": 10499 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2455, - "step": 10500 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2332, - "step": 10501 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2628, - "step": 10502 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2378, - "step": 10503 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2366, - "step": 10504 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2247, - "step": 10505 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2325, - "step": 10506 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2298, - "step": 10507 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2176, - "step": 10508 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.24, - "step": 10509 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2292, - "step": 10510 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2519, - "step": 10511 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2332, - "step": 10512 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2349, - "step": 10513 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2331, - "step": 10514 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2472, - "step": 10515 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2262, - "step": 10516 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2419, - "step": 10517 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.232, - "step": 10518 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2297, - "step": 10519 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2248, - "step": 10520 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2352, - "step": 10521 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2418, - "step": 10522 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2325, - "step": 10523 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2251, - "step": 10524 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.224, - "step": 10525 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2347, - "step": 10526 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2393, - "step": 10527 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2302, - "step": 10528 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2497, - "step": 10529 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2318, - "step": 10530 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2407, - "step": 10531 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.246, - "step": 10532 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2287, - "step": 10533 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2198, - "step": 10534 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2341, - "step": 10535 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2441, - "step": 10536 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2281, - "step": 10537 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2183, - "step": 10538 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2425, - "step": 10539 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.24, - "step": 10540 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2266, - "step": 10541 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2305, - "step": 10542 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2481, - "step": 10543 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2436, - "step": 10544 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.233, - "step": 10545 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2324, - "step": 10546 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2375, - "step": 10547 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2388, - "step": 10548 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2333, - "step": 10549 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2502, - "step": 10550 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2462, - "step": 10551 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2417, - "step": 10552 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.234, - "step": 10553 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2206, - "step": 10554 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2572, - "step": 10555 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2291, - "step": 10556 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2479, - "step": 10557 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2314, - "step": 10558 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2275, - "step": 10559 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2325, - "step": 10560 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2181, - "step": 10561 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2315, - "step": 10562 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2384, - "step": 10563 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2392, - "step": 10564 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2487, - "step": 10565 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2562, - "step": 10566 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2425, - "step": 10567 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2252, - "step": 10568 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2214, - "step": 10569 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.231, - "step": 10570 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2381, - "step": 10571 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2374, - "step": 10572 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2518, - "step": 10573 - }, - { - "epoch": 1.3, - "learning_rate": 0.0003, - "loss": 0.2403, - "step": 10574 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.238, - "step": 10575 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2383, - "step": 10576 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2367, - "step": 10577 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2423, - "step": 10578 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.224, - "step": 10579 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2405, - "step": 10580 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2418, - "step": 10581 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2342, - "step": 10582 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.238, - "step": 10583 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2131, - "step": 10584 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2407, - "step": 10585 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.234, - "step": 10586 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2588, - "step": 10587 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2464, - "step": 10588 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2234, - "step": 10589 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2249, - "step": 10590 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2393, - "step": 10591 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.243, - "step": 10592 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2444, - "step": 10593 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2368, - "step": 10594 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2436, - "step": 10595 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2258, - "step": 10596 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2389, - "step": 10597 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2293, - "step": 10598 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2498, - "step": 10599 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2329, - "step": 10600 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2331, - "step": 10601 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2554, - "step": 10602 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2312, - "step": 10603 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2443, - "step": 10604 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2252, - "step": 10605 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2334, - "step": 10606 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2409, - "step": 10607 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2386, - "step": 10608 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.229, - "step": 10609 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2367, - "step": 10610 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2577, - "step": 10611 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2366, - "step": 10612 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2248, - "step": 10613 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2411, - "step": 10614 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2374, - "step": 10615 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2396, - "step": 10616 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2382, - "step": 10617 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2388, - "step": 10618 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2316, - "step": 10619 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2263, - "step": 10620 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2505, - "step": 10621 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.241, - "step": 10622 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2385, - "step": 10623 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2447, - "step": 10624 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2349, - "step": 10625 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2494, - "step": 10626 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2229, - "step": 10627 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2364, - "step": 10628 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2297, - "step": 10629 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2316, - "step": 10630 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2294, - "step": 10631 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2408, - "step": 10632 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2357, - "step": 10633 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2311, - "step": 10634 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2382, - "step": 10635 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2271, - "step": 10636 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2538, - "step": 10637 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2528, - "step": 10638 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2373, - "step": 10639 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2306, - "step": 10640 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2501, - "step": 10641 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.22, - "step": 10642 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2549, - "step": 10643 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2374, - "step": 10644 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2228, - "step": 10645 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2415, - "step": 10646 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2328, - "step": 10647 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2337, - "step": 10648 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2429, - "step": 10649 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2427, - "step": 10650 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2426, - "step": 10651 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.257, - "step": 10652 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2312, - "step": 10653 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.229, - "step": 10654 - }, - { - "epoch": 1.31, - "learning_rate": 0.0003, - "loss": 0.2376, - "step": 10655 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2357, - "step": 10656 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2316, - "step": 10657 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2329, - "step": 10658 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2313, - "step": 10659 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.223, - "step": 10660 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2407, - "step": 10661 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2438, - "step": 10662 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.244, - "step": 10663 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2312, - "step": 10664 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2309, - "step": 10665 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.231, - "step": 10666 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2304, - "step": 10667 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2423, - "step": 10668 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2386, - "step": 10669 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2507, - "step": 10670 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2185, - "step": 10671 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2273, - "step": 10672 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.227, - "step": 10673 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2316, - "step": 10674 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.245, - "step": 10675 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.226, - "step": 10676 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2234, - "step": 10677 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2234, - "step": 10678 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2353, - "step": 10679 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2313, - "step": 10680 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2327, - "step": 10681 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2387, - "step": 10682 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2307, - "step": 10683 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2359, - "step": 10684 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2413, - "step": 10685 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2267, - "step": 10686 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2274, - "step": 10687 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2434, - "step": 10688 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2371, - "step": 10689 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.228, - "step": 10690 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2312, - "step": 10691 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2419, - "step": 10692 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2442, - "step": 10693 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.247, - "step": 10694 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.239, - "step": 10695 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2405, - "step": 10696 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2266, - "step": 10697 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2321, - "step": 10698 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.231, - "step": 10699 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2437, - "step": 10700 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2372, - "step": 10701 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2414, - "step": 10702 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2266, - "step": 10703 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2289, - "step": 10704 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2392, - "step": 10705 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.234, - "step": 10706 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2373, - "step": 10707 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2235, - "step": 10708 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2331, - "step": 10709 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2315, - "step": 10710 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2557, - "step": 10711 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2288, - "step": 10712 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2392, - "step": 10713 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2399, - "step": 10714 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2382, - "step": 10715 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2282, - "step": 10716 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2362, - "step": 10717 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2511, - "step": 10718 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2273, - "step": 10719 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2494, - "step": 10720 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2278, - "step": 10721 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.234, - "step": 10722 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2382, - "step": 10723 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2258, - "step": 10724 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2433, - "step": 10725 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2337, - "step": 10726 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2325, - "step": 10727 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2329, - "step": 10728 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2234, - "step": 10729 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2393, - "step": 10730 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2236, - "step": 10731 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2241, - "step": 10732 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.234, - "step": 10733 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2346, - "step": 10734 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2268, - "step": 10735 - }, - { - "epoch": 1.32, - "learning_rate": 0.0003, - "loss": 0.2302, - "step": 10736 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2244, - "step": 10737 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2293, - "step": 10738 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2262, - "step": 10739 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2359, - "step": 10740 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2391, - "step": 10741 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2335, - "step": 10742 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2396, - "step": 10743 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2416, - "step": 10744 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2271, - "step": 10745 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2345, - "step": 10746 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2349, - "step": 10747 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2326, - "step": 10748 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2301, - "step": 10749 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2404, - "step": 10750 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2367, - "step": 10751 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2143, - "step": 10752 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.241, - "step": 10753 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2285, - "step": 10754 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2356, - "step": 10755 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2445, - "step": 10756 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2451, - "step": 10757 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2365, - "step": 10758 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.239, - "step": 10759 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2507, - "step": 10760 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2432, - "step": 10761 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2286, - "step": 10762 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.235, - "step": 10763 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2271, - "step": 10764 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2288, - "step": 10765 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2112, - "step": 10766 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2379, - "step": 10767 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2321, - "step": 10768 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2443, - "step": 10769 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2295, - "step": 10770 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2124, - "step": 10771 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2518, - "step": 10772 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2318, - "step": 10773 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2225, - "step": 10774 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2346, - "step": 10775 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2491, - "step": 10776 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2248, - "step": 10777 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2351, - "step": 10778 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.247, - "step": 10779 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2422, - "step": 10780 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2292, - "step": 10781 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2159, - "step": 10782 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2269, - "step": 10783 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2504, - "step": 10784 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2379, - "step": 10785 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2347, - "step": 10786 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2349, - "step": 10787 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2365, - "step": 10788 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2341, - "step": 10789 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2423, - "step": 10790 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2401, - "step": 10791 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2316, - "step": 10792 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2396, - "step": 10793 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2239, - "step": 10794 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2252, - "step": 10795 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2343, - "step": 10796 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2337, - "step": 10797 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2371, - "step": 10798 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2593, - "step": 10799 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2227, - "step": 10800 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2361, - "step": 10801 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2334, - "step": 10802 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2289, - "step": 10803 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2383, - "step": 10804 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2359, - "step": 10805 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2314, - "step": 10806 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2312, - "step": 10807 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2486, - "step": 10808 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.236, - "step": 10809 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2534, - "step": 10810 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2369, - "step": 10811 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2329, - "step": 10812 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2299, - "step": 10813 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2358, - "step": 10814 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2397, - "step": 10815 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2309, - "step": 10816 - }, - { - "epoch": 1.33, - "learning_rate": 0.0003, - "loss": 0.2209, - "step": 10817 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2286, - "step": 10818 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2229, - "step": 10819 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2432, - "step": 10820 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2369, - "step": 10821 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2343, - "step": 10822 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2509, - "step": 10823 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2244, - "step": 10824 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2459, - "step": 10825 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2356, - "step": 10826 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2477, - "step": 10827 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2499, - "step": 10828 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2276, - "step": 10829 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2226, - "step": 10830 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2563, - "step": 10831 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2464, - "step": 10832 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2346, - "step": 10833 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2333, - "step": 10834 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2157, - "step": 10835 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2315, - "step": 10836 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2324, - "step": 10837 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2422, - "step": 10838 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2236, - "step": 10839 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2401, - "step": 10840 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2341, - "step": 10841 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.228, - "step": 10842 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2393, - "step": 10843 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2506, - "step": 10844 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2299, - "step": 10845 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.242, - "step": 10846 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2288, - "step": 10847 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2456, - "step": 10848 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2194, - "step": 10849 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2414, - "step": 10850 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.231, - "step": 10851 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2311, - "step": 10852 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2281, - "step": 10853 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2486, - "step": 10854 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2231, - "step": 10855 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2228, - "step": 10856 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2385, - "step": 10857 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2356, - "step": 10858 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2341, - "step": 10859 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2494, - "step": 10860 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2362, - "step": 10861 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2321, - "step": 10862 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2219, - "step": 10863 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.237, - "step": 10864 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2367, - "step": 10865 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2373, - "step": 10866 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2305, - "step": 10867 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2337, - "step": 10868 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2488, - "step": 10869 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.24, - "step": 10870 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2456, - "step": 10871 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2351, - "step": 10872 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2352, - "step": 10873 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2321, - "step": 10874 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2536, - "step": 10875 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2256, - "step": 10876 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2252, - "step": 10877 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2386, - "step": 10878 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2284, - "step": 10879 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2393, - "step": 10880 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2403, - "step": 10881 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2365, - "step": 10882 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2376, - "step": 10883 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2364, - "step": 10884 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2384, - "step": 10885 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2296, - "step": 10886 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2444, - "step": 10887 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2231, - "step": 10888 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2488, - "step": 10889 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.233, - "step": 10890 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2311, - "step": 10891 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2287, - "step": 10892 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2417, - "step": 10893 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2445, - "step": 10894 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2623, - "step": 10895 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2291, - "step": 10896 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2261, - "step": 10897 - }, - { - "epoch": 1.34, - "learning_rate": 0.0003, - "loss": 0.2294, - "step": 10898 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2267, - "step": 10899 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2318, - "step": 10900 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2393, - "step": 10901 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2449, - "step": 10902 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2274, - "step": 10903 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2248, - "step": 10904 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2334, - "step": 10905 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.24, - "step": 10906 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2304, - "step": 10907 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2462, - "step": 10908 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2164, - "step": 10909 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2311, - "step": 10910 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2407, - "step": 10911 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2304, - "step": 10912 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2318, - "step": 10913 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2365, - "step": 10914 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2362, - "step": 10915 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2325, - "step": 10916 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.235, - "step": 10917 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2317, - "step": 10918 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2257, - "step": 10919 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2213, - "step": 10920 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2231, - "step": 10921 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2301, - "step": 10922 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2311, - "step": 10923 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2296, - "step": 10924 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.235, - "step": 10925 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2431, - "step": 10926 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2438, - "step": 10927 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2422, - "step": 10928 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2527, - "step": 10929 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2461, - "step": 10930 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2296, - "step": 10931 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.233, - "step": 10932 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2224, - "step": 10933 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2246, - "step": 10934 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2483, - "step": 10935 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2463, - "step": 10936 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2353, - "step": 10937 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2467, - "step": 10938 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2398, - "step": 10939 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2398, - "step": 10940 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2477, - "step": 10941 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2341, - "step": 10942 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2557, - "step": 10943 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.232, - "step": 10944 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2395, - "step": 10945 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2348, - "step": 10946 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2252, - "step": 10947 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2405, - "step": 10948 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2147, - "step": 10949 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2446, - "step": 10950 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2402, - "step": 10951 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2477, - "step": 10952 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2429, - "step": 10953 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.246, - "step": 10954 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2331, - "step": 10955 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2322, - "step": 10956 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2205, - "step": 10957 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2547, - "step": 10958 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2399, - "step": 10959 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2352, - "step": 10960 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2403, - "step": 10961 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2442, - "step": 10962 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2411, - "step": 10963 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2325, - "step": 10964 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2461, - "step": 10965 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2193, - "step": 10966 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2314, - "step": 10967 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2273, - "step": 10968 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.215, - "step": 10969 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2177, - "step": 10970 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2367, - "step": 10971 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2368, - "step": 10972 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2181, - "step": 10973 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2319, - "step": 10974 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2279, - "step": 10975 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2294, - "step": 10976 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2334, - "step": 10977 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2595, - "step": 10978 - }, - { - "epoch": 1.35, - "learning_rate": 0.0003, - "loss": 0.2371, - "step": 10979 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2411, - "step": 10980 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.23, - "step": 10981 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2532, - "step": 10982 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2374, - "step": 10983 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2628, - "step": 10984 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2201, - "step": 10985 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2294, - "step": 10986 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2351, - "step": 10987 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2265, - "step": 10988 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2467, - "step": 10989 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2411, - "step": 10990 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.239, - "step": 10991 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2375, - "step": 10992 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2413, - "step": 10993 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2202, - "step": 10994 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2311, - "step": 10995 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2297, - "step": 10996 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2512, - "step": 10997 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2323, - "step": 10998 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2402, - "step": 10999 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2321, - "step": 11000 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2481, - "step": 11001 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2472, - "step": 11002 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2388, - "step": 11003 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2295, - "step": 11004 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.222, - "step": 11005 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2154, - "step": 11006 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2455, - "step": 11007 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2286, - "step": 11008 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2454, - "step": 11009 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2398, - "step": 11010 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2235, - "step": 11011 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2272, - "step": 11012 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2232, - "step": 11013 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2378, - "step": 11014 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.229, - "step": 11015 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2225, - "step": 11016 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2342, - "step": 11017 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2345, - "step": 11018 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2312, - "step": 11019 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2445, - "step": 11020 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2486, - "step": 11021 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2529, - "step": 11022 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2265, - "step": 11023 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2224, - "step": 11024 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2307, - "step": 11025 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.234, - "step": 11026 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2439, - "step": 11027 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2228, - "step": 11028 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2271, - "step": 11029 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2345, - "step": 11030 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2255, - "step": 11031 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2478, - "step": 11032 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2354, - "step": 11033 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2303, - "step": 11034 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2296, - "step": 11035 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2334, - "step": 11036 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2204, - "step": 11037 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2257, - "step": 11038 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2436, - "step": 11039 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.217, - "step": 11040 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2395, - "step": 11041 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2325, - "step": 11042 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.231, - "step": 11043 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2287, - "step": 11044 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2425, - "step": 11045 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2313, - "step": 11046 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2347, - "step": 11047 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2325, - "step": 11048 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2455, - "step": 11049 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2267, - "step": 11050 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2384, - "step": 11051 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2295, - "step": 11052 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2255, - "step": 11053 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2343, - "step": 11054 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2334, - "step": 11055 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2377, - "step": 11056 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2372, - "step": 11057 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2176, - "step": 11058 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.2269, - "step": 11059 - }, - { - "epoch": 1.36, - "learning_rate": 0.0003, - "loss": 0.205, - "step": 11060 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2617, - "step": 11061 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.225, - "step": 11062 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2413, - "step": 11063 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2386, - "step": 11064 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2535, - "step": 11065 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.238, - "step": 11066 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2447, - "step": 11067 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2349, - "step": 11068 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2312, - "step": 11069 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2213, - "step": 11070 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2362, - "step": 11071 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2478, - "step": 11072 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2353, - "step": 11073 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2173, - "step": 11074 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2384, - "step": 11075 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2268, - "step": 11076 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2186, - "step": 11077 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.225, - "step": 11078 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.24, - "step": 11079 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2392, - "step": 11080 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2413, - "step": 11081 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2229, - "step": 11082 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2321, - "step": 11083 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.25, - "step": 11084 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2331, - "step": 11085 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2515, - "step": 11086 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2274, - "step": 11087 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2293, - "step": 11088 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2237, - "step": 11089 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2373, - "step": 11090 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2199, - "step": 11091 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2306, - "step": 11092 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2417, - "step": 11093 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2473, - "step": 11094 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2356, - "step": 11095 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2423, - "step": 11096 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2203, - "step": 11097 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2302, - "step": 11098 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.238, - "step": 11099 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2345, - "step": 11100 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2273, - "step": 11101 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2291, - "step": 11102 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2253, - "step": 11103 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2178, - "step": 11104 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2374, - "step": 11105 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2321, - "step": 11106 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2335, - "step": 11107 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2356, - "step": 11108 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.243, - "step": 11109 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2257, - "step": 11110 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2349, - "step": 11111 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2588, - "step": 11112 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2291, - "step": 11113 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2237, - "step": 11114 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.255, - "step": 11115 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2364, - "step": 11116 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2294, - "step": 11117 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2346, - "step": 11118 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2432, - "step": 11119 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.225, - "step": 11120 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2308, - "step": 11121 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2369, - "step": 11122 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2293, - "step": 11123 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2189, - "step": 11124 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2179, - "step": 11125 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2121, - "step": 11126 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2248, - "step": 11127 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2187, - "step": 11128 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.227, - "step": 11129 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2204, - "step": 11130 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2313, - "step": 11131 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2294, - "step": 11132 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2311, - "step": 11133 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2487, - "step": 11134 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2362, - "step": 11135 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.235, - "step": 11136 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2343, - "step": 11137 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2336, - "step": 11138 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2397, - "step": 11139 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2219, - "step": 11140 - }, - { - "epoch": 1.37, - "learning_rate": 0.0003, - "loss": 0.2432, - "step": 11141 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2492, - "step": 11142 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2394, - "step": 11143 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2387, - "step": 11144 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2303, - "step": 11145 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2509, - "step": 11146 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2441, - "step": 11147 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2525, - "step": 11148 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2322, - "step": 11149 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2417, - "step": 11150 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2176, - "step": 11151 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.228, - "step": 11152 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2455, - "step": 11153 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2547, - "step": 11154 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2298, - "step": 11155 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2363, - "step": 11156 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2219, - "step": 11157 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2412, - "step": 11158 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.232, - "step": 11159 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2417, - "step": 11160 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.254, - "step": 11161 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2417, - "step": 11162 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2452, - "step": 11163 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2226, - "step": 11164 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2248, - "step": 11165 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2315, - "step": 11166 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2252, - "step": 11167 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2399, - "step": 11168 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2179, - "step": 11169 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2243, - "step": 11170 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2311, - "step": 11171 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2365, - "step": 11172 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2277, - "step": 11173 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2486, - "step": 11174 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2344, - "step": 11175 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2371, - "step": 11176 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2593, - "step": 11177 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2285, - "step": 11178 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2271, - "step": 11179 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2455, - "step": 11180 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2351, - "step": 11181 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2473, - "step": 11182 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2524, - "step": 11183 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2329, - "step": 11184 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2302, - "step": 11185 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2482, - "step": 11186 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2373, - "step": 11187 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2344, - "step": 11188 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2467, - "step": 11189 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2418, - "step": 11190 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2187, - "step": 11191 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2304, - "step": 11192 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2262, - "step": 11193 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2345, - "step": 11194 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2314, - "step": 11195 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2329, - "step": 11196 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2239, - "step": 11197 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2378, - "step": 11198 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2565, - "step": 11199 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2457, - "step": 11200 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2221, - "step": 11201 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2124, - "step": 11202 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2358, - "step": 11203 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2492, - "step": 11204 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2375, - "step": 11205 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2443, - "step": 11206 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2352, - "step": 11207 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2263, - "step": 11208 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2269, - "step": 11209 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2214, - "step": 11210 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2227, - "step": 11211 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2238, - "step": 11212 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2374, - "step": 11213 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2282, - "step": 11214 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2378, - "step": 11215 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2263, - "step": 11216 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2309, - "step": 11217 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.23, - "step": 11218 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2449, - "step": 11219 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2189, - "step": 11220 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2247, - "step": 11221 - }, - { - "epoch": 1.38, - "learning_rate": 0.0003, - "loss": 0.2127, - "step": 11222 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2238, - "step": 11223 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2227, - "step": 11224 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.24, - "step": 11225 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2399, - "step": 11226 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2281, - "step": 11227 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2242, - "step": 11228 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2263, - "step": 11229 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2329, - "step": 11230 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2281, - "step": 11231 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2123, - "step": 11232 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2292, - "step": 11233 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2165, - "step": 11234 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2245, - "step": 11235 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2282, - "step": 11236 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2264, - "step": 11237 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2207, - "step": 11238 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.216, - "step": 11239 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2455, - "step": 11240 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2261, - "step": 11241 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2418, - "step": 11242 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2229, - "step": 11243 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2414, - "step": 11244 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2456, - "step": 11245 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.241, - "step": 11246 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2508, - "step": 11247 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2235, - "step": 11248 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2259, - "step": 11249 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2327, - "step": 11250 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2262, - "step": 11251 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2364, - "step": 11252 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2382, - "step": 11253 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2474, - "step": 11254 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2437, - "step": 11255 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2413, - "step": 11256 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2314, - "step": 11257 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2423, - "step": 11258 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2282, - "step": 11259 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2232, - "step": 11260 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2353, - "step": 11261 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2408, - "step": 11262 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2237, - "step": 11263 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2315, - "step": 11264 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2421, - "step": 11265 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2184, - "step": 11266 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2498, - "step": 11267 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2278, - "step": 11268 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2442, - "step": 11269 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2347, - "step": 11270 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2255, - "step": 11271 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2291, - "step": 11272 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2424, - "step": 11273 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2372, - "step": 11274 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2211, - "step": 11275 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2232, - "step": 11276 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2339, - "step": 11277 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.222, - "step": 11278 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2188, - "step": 11279 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2317, - "step": 11280 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2224, - "step": 11281 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2314, - "step": 11282 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.227, - "step": 11283 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2184, - "step": 11284 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2377, - "step": 11285 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2205, - "step": 11286 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2452, - "step": 11287 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2301, - "step": 11288 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2357, - "step": 11289 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2378, - "step": 11290 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2449, - "step": 11291 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2398, - "step": 11292 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2258, - "step": 11293 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2397, - "step": 11294 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.239, - "step": 11295 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2361, - "step": 11296 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2333, - "step": 11297 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2242, - "step": 11298 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2184, - "step": 11299 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2331, - "step": 11300 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2412, - "step": 11301 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.2215, - "step": 11302 - }, - { - "epoch": 1.39, - "learning_rate": 0.0003, - "loss": 0.24, - "step": 11303 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2323, - "step": 11304 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2421, - "step": 11305 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2461, - "step": 11306 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2327, - "step": 11307 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.231, - "step": 11308 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2539, - "step": 11309 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2343, - "step": 11310 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.241, - "step": 11311 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2407, - "step": 11312 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2187, - "step": 11313 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2501, - "step": 11314 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2276, - "step": 11315 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2438, - "step": 11316 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2377, - "step": 11317 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2309, - "step": 11318 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2362, - "step": 11319 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2463, - "step": 11320 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.225, - "step": 11321 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2376, - "step": 11322 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2373, - "step": 11323 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2395, - "step": 11324 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2303, - "step": 11325 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2395, - "step": 11326 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2263, - "step": 11327 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2324, - "step": 11328 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.251, - "step": 11329 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.244, - "step": 11330 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2353, - "step": 11331 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2289, - "step": 11332 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2428, - "step": 11333 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2228, - "step": 11334 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2491, - "step": 11335 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2291, - "step": 11336 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.224, - "step": 11337 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2261, - "step": 11338 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2228, - "step": 11339 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2439, - "step": 11340 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2296, - "step": 11341 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2499, - "step": 11342 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2347, - "step": 11343 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2336, - "step": 11344 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2175, - "step": 11345 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2475, - "step": 11346 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2337, - "step": 11347 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.229, - "step": 11348 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2251, - "step": 11349 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2356, - "step": 11350 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2427, - "step": 11351 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2323, - "step": 11352 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2364, - "step": 11353 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2293, - "step": 11354 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2425, - "step": 11355 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.219, - "step": 11356 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.228, - "step": 11357 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2234, - "step": 11358 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2255, - "step": 11359 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2342, - "step": 11360 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.248, - "step": 11361 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2287, - "step": 11362 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2388, - "step": 11363 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2357, - "step": 11364 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2258, - "step": 11365 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2469, - "step": 11366 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2353, - "step": 11367 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2157, - "step": 11368 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2298, - "step": 11369 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2468, - "step": 11370 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.231, - "step": 11371 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2434, - "step": 11372 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2341, - "step": 11373 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2305, - "step": 11374 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2458, - "step": 11375 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2426, - "step": 11376 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2237, - "step": 11377 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2299, - "step": 11378 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2316, - "step": 11379 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2227, - "step": 11380 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2358, - "step": 11381 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2578, - "step": 11382 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2283, - "step": 11383 - }, - { - "epoch": 1.4, - "learning_rate": 0.0003, - "loss": 0.2252, - "step": 11384 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2217, - "step": 11385 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2189, - "step": 11386 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2292, - "step": 11387 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2326, - "step": 11388 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2338, - "step": 11389 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.243, - "step": 11390 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2419, - "step": 11391 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2263, - "step": 11392 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2361, - "step": 11393 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2376, - "step": 11394 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2395, - "step": 11395 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2276, - "step": 11396 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2228, - "step": 11397 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2297, - "step": 11398 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2417, - "step": 11399 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.223, - "step": 11400 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2421, - "step": 11401 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2352, - "step": 11402 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2383, - "step": 11403 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2387, - "step": 11404 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2362, - "step": 11405 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2367, - "step": 11406 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2333, - "step": 11407 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2327, - "step": 11408 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2394, - "step": 11409 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2211, - "step": 11410 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2333, - "step": 11411 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2272, - "step": 11412 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2288, - "step": 11413 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2254, - "step": 11414 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2463, - "step": 11415 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2309, - "step": 11416 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2314, - "step": 11417 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2363, - "step": 11418 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2522, - "step": 11419 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2306, - "step": 11420 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2233, - "step": 11421 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2143, - "step": 11422 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.214, - "step": 11423 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2351, - "step": 11424 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2249, - "step": 11425 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2255, - "step": 11426 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2434, - "step": 11427 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2331, - "step": 11428 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2441, - "step": 11429 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2413, - "step": 11430 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2195, - "step": 11431 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2267, - "step": 11432 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2324, - "step": 11433 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2347, - "step": 11434 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2381, - "step": 11435 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2331, - "step": 11436 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2298, - "step": 11437 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2322, - "step": 11438 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2154, - "step": 11439 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2313, - "step": 11440 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2309, - "step": 11441 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2346, - "step": 11442 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2453, - "step": 11443 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2388, - "step": 11444 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2474, - "step": 11445 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2343, - "step": 11446 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2262, - "step": 11447 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2154, - "step": 11448 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2199, - "step": 11449 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2259, - "step": 11450 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2439, - "step": 11451 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2427, - "step": 11452 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2267, - "step": 11453 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2206, - "step": 11454 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2244, - "step": 11455 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2267, - "step": 11456 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2333, - "step": 11457 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2342, - "step": 11458 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2366, - "step": 11459 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.227, - "step": 11460 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2361, - "step": 11461 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2357, - "step": 11462 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2257, - "step": 11463 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2444, - "step": 11464 - }, - { - "epoch": 1.41, - "learning_rate": 0.0003, - "loss": 0.2236, - "step": 11465 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2178, - "step": 11466 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2284, - "step": 11467 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2382, - "step": 11468 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2397, - "step": 11469 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.232, - "step": 11470 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2521, - "step": 11471 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2225, - "step": 11472 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2366, - "step": 11473 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2344, - "step": 11474 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2285, - "step": 11475 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2416, - "step": 11476 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.223, - "step": 11477 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2319, - "step": 11478 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2494, - "step": 11479 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2361, - "step": 11480 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2464, - "step": 11481 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2326, - "step": 11482 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2445, - "step": 11483 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2282, - "step": 11484 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2378, - "step": 11485 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2465, - "step": 11486 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2164, - "step": 11487 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.229, - "step": 11488 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2249, - "step": 11489 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2352, - "step": 11490 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2273, - "step": 11491 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2416, - "step": 11492 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.203, - "step": 11493 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2247, - "step": 11494 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2267, - "step": 11495 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2509, - "step": 11496 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2263, - "step": 11497 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2293, - "step": 11498 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2333, - "step": 11499 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2328, - "step": 11500 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.222, - "step": 11501 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2258, - "step": 11502 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2128, - "step": 11503 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2332, - "step": 11504 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2191, - "step": 11505 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2312, - "step": 11506 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2328, - "step": 11507 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2191, - "step": 11508 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2363, - "step": 11509 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2415, - "step": 11510 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2413, - "step": 11511 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2325, - "step": 11512 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2377, - "step": 11513 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2454, - "step": 11514 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2236, - "step": 11515 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2286, - "step": 11516 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2196, - "step": 11517 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2496, - "step": 11518 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2368, - "step": 11519 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2353, - "step": 11520 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2411, - "step": 11521 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2532, - "step": 11522 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2296, - "step": 11523 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2397, - "step": 11524 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2284, - "step": 11525 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2338, - "step": 11526 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2359, - "step": 11527 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2284, - "step": 11528 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2429, - "step": 11529 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2456, - "step": 11530 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2324, - "step": 11531 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2318, - "step": 11532 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2323, - "step": 11533 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2417, - "step": 11534 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.221, - "step": 11535 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.237, - "step": 11536 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2239, - "step": 11537 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2305, - "step": 11538 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2497, - "step": 11539 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.233, - "step": 11540 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2486, - "step": 11541 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2206, - "step": 11542 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2309, - "step": 11543 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2285, - "step": 11544 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.257, - "step": 11545 - }, - { - "epoch": 1.42, - "learning_rate": 0.0003, - "loss": 0.2339, - "step": 11546 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2188, - "step": 11547 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2243, - "step": 11548 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2393, - "step": 11549 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2253, - "step": 11550 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2156, - "step": 11551 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2154, - "step": 11552 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2317, - "step": 11553 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2336, - "step": 11554 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.243, - "step": 11555 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2425, - "step": 11556 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2291, - "step": 11557 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2266, - "step": 11558 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2196, - "step": 11559 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2168, - "step": 11560 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2349, - "step": 11561 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2426, - "step": 11562 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2263, - "step": 11563 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2403, - "step": 11564 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2432, - "step": 11565 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2229, - "step": 11566 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2243, - "step": 11567 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2363, - "step": 11568 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2292, - "step": 11569 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2411, - "step": 11570 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2583, - "step": 11571 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.232, - "step": 11572 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2387, - "step": 11573 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2201, - "step": 11574 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2351, - "step": 11575 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2244, - "step": 11576 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2413, - "step": 11577 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2272, - "step": 11578 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.226, - "step": 11579 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2418, - "step": 11580 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2403, - "step": 11581 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2363, - "step": 11582 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.229, - "step": 11583 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2241, - "step": 11584 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2326, - "step": 11585 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2453, - "step": 11586 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.246, - "step": 11587 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2241, - "step": 11588 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2379, - "step": 11589 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.215, - "step": 11590 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2144, - "step": 11591 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2304, - "step": 11592 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2555, - "step": 11593 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2346, - "step": 11594 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2226, - "step": 11595 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2186, - "step": 11596 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2295, - "step": 11597 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2354, - "step": 11598 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2282, - "step": 11599 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.232, - "step": 11600 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2281, - "step": 11601 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2129, - "step": 11602 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2404, - "step": 11603 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2289, - "step": 11604 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2583, - "step": 11605 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2392, - "step": 11606 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2165, - "step": 11607 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2292, - "step": 11608 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2178, - "step": 11609 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2203, - "step": 11610 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2162, - "step": 11611 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2485, - "step": 11612 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2362, - "step": 11613 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2554, - "step": 11614 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2392, - "step": 11615 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2225, - "step": 11616 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2367, - "step": 11617 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2254, - "step": 11618 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2342, - "step": 11619 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2299, - "step": 11620 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2314, - "step": 11621 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.227, - "step": 11622 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.244, - "step": 11623 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2345, - "step": 11624 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2312, - "step": 11625 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2448, - "step": 11626 - }, - { - "epoch": 1.43, - "learning_rate": 0.0003, - "loss": 0.2321, - "step": 11627 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2373, - "step": 11628 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2171, - "step": 11629 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2285, - "step": 11630 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2318, - "step": 11631 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2316, - "step": 11632 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2329, - "step": 11633 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.229, - "step": 11634 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2344, - "step": 11635 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2264, - "step": 11636 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2193, - "step": 11637 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2262, - "step": 11638 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2175, - "step": 11639 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2377, - "step": 11640 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2493, - "step": 11641 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2337, - "step": 11642 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2418, - "step": 11643 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2334, - "step": 11644 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2161, - "step": 11645 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2322, - "step": 11646 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2296, - "step": 11647 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2238, - "step": 11648 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2327, - "step": 11649 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.243, - "step": 11650 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2299, - "step": 11651 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2235, - "step": 11652 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2174, - "step": 11653 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2219, - "step": 11654 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2238, - "step": 11655 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2206, - "step": 11656 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2285, - "step": 11657 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2228, - "step": 11658 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2393, - "step": 11659 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2427, - "step": 11660 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2324, - "step": 11661 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2173, - "step": 11662 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2375, - "step": 11663 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2313, - "step": 11664 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2356, - "step": 11665 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2202, - "step": 11666 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2285, - "step": 11667 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2312, - "step": 11668 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2346, - "step": 11669 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2395, - "step": 11670 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2309, - "step": 11671 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2472, - "step": 11672 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2398, - "step": 11673 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2373, - "step": 11674 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2343, - "step": 11675 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2465, - "step": 11676 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2254, - "step": 11677 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2365, - "step": 11678 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2227, - "step": 11679 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2349, - "step": 11680 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2348, - "step": 11681 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2362, - "step": 11682 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.228, - "step": 11683 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2446, - "step": 11684 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2335, - "step": 11685 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.243, - "step": 11686 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2347, - "step": 11687 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2311, - "step": 11688 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2251, - "step": 11689 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2378, - "step": 11690 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.221, - "step": 11691 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2357, - "step": 11692 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2267, - "step": 11693 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2437, - "step": 11694 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2368, - "step": 11695 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2266, - "step": 11696 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2597, - "step": 11697 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2454, - "step": 11698 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.219, - "step": 11699 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2343, - "step": 11700 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2432, - "step": 11701 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2218, - "step": 11702 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2409, - "step": 11703 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2449, - "step": 11704 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2388, - "step": 11705 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.241, - "step": 11706 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2196, - "step": 11707 - }, - { - "epoch": 1.44, - "learning_rate": 0.0003, - "loss": 0.2387, - "step": 11708 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2338, - "step": 11709 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2302, - "step": 11710 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2359, - "step": 11711 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2402, - "step": 11712 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2348, - "step": 11713 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2188, - "step": 11714 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2318, - "step": 11715 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.227, - "step": 11716 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2404, - "step": 11717 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2243, - "step": 11718 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2315, - "step": 11719 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2456, - "step": 11720 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2185, - "step": 11721 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.24, - "step": 11722 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2243, - "step": 11723 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2229, - "step": 11724 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2318, - "step": 11725 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2387, - "step": 11726 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2343, - "step": 11727 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2111, - "step": 11728 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.236, - "step": 11729 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2316, - "step": 11730 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2224, - "step": 11731 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2473, - "step": 11732 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2172, - "step": 11733 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2262, - "step": 11734 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2141, - "step": 11735 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2241, - "step": 11736 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2224, - "step": 11737 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2294, - "step": 11738 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2279, - "step": 11739 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2389, - "step": 11740 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2266, - "step": 11741 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2317, - "step": 11742 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2305, - "step": 11743 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2341, - "step": 11744 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2247, - "step": 11745 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2189, - "step": 11746 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2281, - "step": 11747 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2319, - "step": 11748 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2353, - "step": 11749 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2326, - "step": 11750 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2347, - "step": 11751 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2208, - "step": 11752 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2415, - "step": 11753 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2264, - "step": 11754 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2208, - "step": 11755 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2152, - "step": 11756 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2374, - "step": 11757 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2296, - "step": 11758 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2433, - "step": 11759 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.223, - "step": 11760 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2315, - "step": 11761 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2213, - "step": 11762 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2434, - "step": 11763 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2276, - "step": 11764 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2207, - "step": 11765 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2502, - "step": 11766 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2211, - "step": 11767 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2068, - "step": 11768 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2281, - "step": 11769 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2399, - "step": 11770 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2381, - "step": 11771 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.24, - "step": 11772 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2288, - "step": 11773 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2431, - "step": 11774 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2342, - "step": 11775 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2333, - "step": 11776 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2279, - "step": 11777 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2497, - "step": 11778 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2498, - "step": 11779 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.221, - "step": 11780 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2373, - "step": 11781 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2379, - "step": 11782 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.24, - "step": 11783 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.239, - "step": 11784 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2112, - "step": 11785 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2255, - "step": 11786 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2214, - "step": 11787 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2263, - "step": 11788 - }, - { - "epoch": 1.45, - "learning_rate": 0.0003, - "loss": 0.2381, - "step": 11789 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2196, - "step": 11790 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.257, - "step": 11791 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2294, - "step": 11792 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2288, - "step": 11793 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2462, - "step": 11794 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2232, - "step": 11795 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2427, - "step": 11796 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2241, - "step": 11797 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.211, - "step": 11798 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2207, - "step": 11799 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2246, - "step": 11800 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2403, - "step": 11801 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2331, - "step": 11802 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2405, - "step": 11803 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2284, - "step": 11804 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2392, - "step": 11805 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2229, - "step": 11806 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2538, - "step": 11807 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2299, - "step": 11808 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2373, - "step": 11809 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2262, - "step": 11810 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2559, - "step": 11811 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2388, - "step": 11812 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2464, - "step": 11813 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2369, - "step": 11814 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2327, - "step": 11815 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2438, - "step": 11816 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2171, - "step": 11817 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2202, - "step": 11818 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2396, - "step": 11819 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2344, - "step": 11820 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2293, - "step": 11821 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2128, - "step": 11822 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2307, - "step": 11823 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.232, - "step": 11824 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2309, - "step": 11825 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2352, - "step": 11826 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.24, - "step": 11827 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2404, - "step": 11828 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.224, - "step": 11829 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2165, - "step": 11830 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2267, - "step": 11831 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2439, - "step": 11832 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2237, - "step": 11833 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.232, - "step": 11834 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2173, - "step": 11835 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2349, - "step": 11836 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.24, - "step": 11837 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2326, - "step": 11838 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2205, - "step": 11839 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2155, - "step": 11840 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2321, - "step": 11841 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2306, - "step": 11842 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2444, - "step": 11843 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2233, - "step": 11844 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2527, - "step": 11845 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2454, - "step": 11846 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2236, - "step": 11847 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2342, - "step": 11848 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2187, - "step": 11849 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2288, - "step": 11850 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2398, - "step": 11851 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2375, - "step": 11852 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2184, - "step": 11853 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2399, - "step": 11854 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2158, - "step": 11855 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2251, - "step": 11856 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2292, - "step": 11857 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2205, - "step": 11858 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2358, - "step": 11859 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2273, - "step": 11860 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2213, - "step": 11861 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2293, - "step": 11862 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.1985, - "step": 11863 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2224, - "step": 11864 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2284, - "step": 11865 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2249, - "step": 11866 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2328, - "step": 11867 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2264, - "step": 11868 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2106, - "step": 11869 - }, - { - "epoch": 1.46, - "learning_rate": 0.0003, - "loss": 0.2328, - "step": 11870 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2341, - "step": 11871 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2246, - "step": 11872 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2189, - "step": 11873 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2276, - "step": 11874 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2431, - "step": 11875 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2296, - "step": 11876 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2272, - "step": 11877 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2374, - "step": 11878 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2351, - "step": 11879 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2192, - "step": 11880 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2256, - "step": 11881 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2151, - "step": 11882 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2267, - "step": 11883 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2274, - "step": 11884 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2287, - "step": 11885 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2322, - "step": 11886 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2338, - "step": 11887 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.226, - "step": 11888 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2203, - "step": 11889 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2198, - "step": 11890 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2429, - "step": 11891 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2303, - "step": 11892 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.236, - "step": 11893 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2339, - "step": 11894 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2314, - "step": 11895 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2212, - "step": 11896 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2464, - "step": 11897 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2239, - "step": 11898 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2097, - "step": 11899 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2313, - "step": 11900 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.234, - "step": 11901 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2102, - "step": 11902 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2347, - "step": 11903 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2511, - "step": 11904 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2165, - "step": 11905 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.234, - "step": 11906 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2199, - "step": 11907 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2114, - "step": 11908 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2381, - "step": 11909 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2389, - "step": 11910 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2245, - "step": 11911 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2446, - "step": 11912 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2103, - "step": 11913 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2388, - "step": 11914 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2301, - "step": 11915 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2237, - "step": 11916 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2343, - "step": 11917 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2276, - "step": 11918 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2178, - "step": 11919 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2346, - "step": 11920 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2226, - "step": 11921 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2285, - "step": 11922 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2272, - "step": 11923 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2183, - "step": 11924 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2307, - "step": 11925 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.225, - "step": 11926 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2296, - "step": 11927 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2318, - "step": 11928 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2334, - "step": 11929 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2314, - "step": 11930 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2412, - "step": 11931 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2354, - "step": 11932 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.211, - "step": 11933 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2244, - "step": 11934 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.255, - "step": 11935 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2306, - "step": 11936 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2269, - "step": 11937 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2281, - "step": 11938 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2278, - "step": 11939 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2336, - "step": 11940 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2166, - "step": 11941 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2277, - "step": 11942 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2319, - "step": 11943 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2226, - "step": 11944 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2435, - "step": 11945 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2396, - "step": 11946 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2207, - "step": 11947 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2323, - "step": 11948 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2107, - "step": 11949 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2242, - "step": 11950 - }, - { - "epoch": 1.47, - "learning_rate": 0.0003, - "loss": 0.2444, - "step": 11951 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2199, - "step": 11952 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2129, - "step": 11953 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2227, - "step": 11954 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2376, - "step": 11955 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.229, - "step": 11956 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2255, - "step": 11957 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.229, - "step": 11958 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2237, - "step": 11959 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2303, - "step": 11960 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2349, - "step": 11961 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2368, - "step": 11962 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2365, - "step": 11963 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2236, - "step": 11964 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2251, - "step": 11965 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2433, - "step": 11966 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2427, - "step": 11967 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.227, - "step": 11968 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2297, - "step": 11969 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2405, - "step": 11970 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2175, - "step": 11971 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.228, - "step": 11972 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2337, - "step": 11973 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2315, - "step": 11974 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2367, - "step": 11975 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2262, - "step": 11976 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2288, - "step": 11977 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2534, - "step": 11978 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2288, - "step": 11979 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2368, - "step": 11980 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2429, - "step": 11981 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2279, - "step": 11982 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2406, - "step": 11983 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2311, - "step": 11984 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2279, - "step": 11985 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2226, - "step": 11986 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2261, - "step": 11987 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2242, - "step": 11988 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2378, - "step": 11989 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2175, - "step": 11990 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2314, - "step": 11991 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2403, - "step": 11992 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2297, - "step": 11993 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2219, - "step": 11994 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2205, - "step": 11995 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2314, - "step": 11996 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2118, - "step": 11997 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2279, - "step": 11998 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2453, - "step": 11999 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2161, - "step": 12000 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2172, - "step": 12001 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2297, - "step": 12002 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2309, - "step": 12003 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2289, - "step": 12004 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2382, - "step": 12005 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2249, - "step": 12006 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.213, - "step": 12007 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2179, - "step": 12008 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2305, - "step": 12009 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2161, - "step": 12010 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.235, - "step": 12011 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2421, - "step": 12012 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.233, - "step": 12013 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2376, - "step": 12014 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2381, - "step": 12015 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2393, - "step": 12016 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2307, - "step": 12017 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2472, - "step": 12018 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2311, - "step": 12019 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2175, - "step": 12020 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2348, - "step": 12021 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2233, - "step": 12022 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2232, - "step": 12023 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.235, - "step": 12024 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2374, - "step": 12025 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2378, - "step": 12026 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2393, - "step": 12027 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2388, - "step": 12028 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.229, - "step": 12029 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2413, - "step": 12030 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2282, - "step": 12031 - }, - { - "epoch": 1.48, - "learning_rate": 0.0003, - "loss": 0.2243, - "step": 12032 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2199, - "step": 12033 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2238, - "step": 12034 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2279, - "step": 12035 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.219, - "step": 12036 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2473, - "step": 12037 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2145, - "step": 12038 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.252, - "step": 12039 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2413, - "step": 12040 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2156, - "step": 12041 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2117, - "step": 12042 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2426, - "step": 12043 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2401, - "step": 12044 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.235, - "step": 12045 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2379, - "step": 12046 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2327, - "step": 12047 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.234, - "step": 12048 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2334, - "step": 12049 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2257, - "step": 12050 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2248, - "step": 12051 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2366, - "step": 12052 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2287, - "step": 12053 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2175, - "step": 12054 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2301, - "step": 12055 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2232, - "step": 12056 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2213, - "step": 12057 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2386, - "step": 12058 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2155, - "step": 12059 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.214, - "step": 12060 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2409, - "step": 12061 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2399, - "step": 12062 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2355, - "step": 12063 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2243, - "step": 12064 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2365, - "step": 12065 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2336, - "step": 12066 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2245, - "step": 12067 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2185, - "step": 12068 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2375, - "step": 12069 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2298, - "step": 12070 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2126, - "step": 12071 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2302, - "step": 12072 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2272, - "step": 12073 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2368, - "step": 12074 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2226, - "step": 12075 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.206, - "step": 12076 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2309, - "step": 12077 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2275, - "step": 12078 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2277, - "step": 12079 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2336, - "step": 12080 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.243, - "step": 12081 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2275, - "step": 12082 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2156, - "step": 12083 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2269, - "step": 12084 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2352, - "step": 12085 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2359, - "step": 12086 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2172, - "step": 12087 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2422, - "step": 12088 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2357, - "step": 12089 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2306, - "step": 12090 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2304, - "step": 12091 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.218, - "step": 12092 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2082, - "step": 12093 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.25, - "step": 12094 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2344, - "step": 12095 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2254, - "step": 12096 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2356, - "step": 12097 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2311, - "step": 12098 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2332, - "step": 12099 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2358, - "step": 12100 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2194, - "step": 12101 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2385, - "step": 12102 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2316, - "step": 12103 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2186, - "step": 12104 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2391, - "step": 12105 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2424, - "step": 12106 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2201, - "step": 12107 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2279, - "step": 12108 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.21, - "step": 12109 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2523, - "step": 12110 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2326, - "step": 12111 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2381, - "step": 12112 - }, - { - "epoch": 1.49, - "learning_rate": 0.0003, - "loss": 0.2251, - "step": 12113 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2262, - "step": 12114 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.231, - "step": 12115 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2233, - "step": 12116 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2347, - "step": 12117 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2195, - "step": 12118 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2252, - "step": 12119 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2269, - "step": 12120 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2301, - "step": 12121 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.217, - "step": 12122 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2131, - "step": 12123 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2318, - "step": 12124 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2301, - "step": 12125 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2284, - "step": 12126 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2268, - "step": 12127 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2313, - "step": 12128 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2268, - "step": 12129 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2349, - "step": 12130 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.226, - "step": 12131 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2236, - "step": 12132 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2267, - "step": 12133 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2259, - "step": 12134 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2129, - "step": 12135 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2285, - "step": 12136 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2243, - "step": 12137 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2233, - "step": 12138 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2068, - "step": 12139 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2196, - "step": 12140 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2285, - "step": 12141 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2342, - "step": 12142 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2361, - "step": 12143 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2459, - "step": 12144 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2436, - "step": 12145 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2377, - "step": 12146 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2151, - "step": 12147 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2456, - "step": 12148 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2164, - "step": 12149 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2482, - "step": 12150 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2462, - "step": 12151 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2257, - "step": 12152 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2197, - "step": 12153 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2211, - "step": 12154 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2232, - "step": 12155 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2158, - "step": 12156 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.225, - "step": 12157 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2246, - "step": 12158 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2444, - "step": 12159 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2238, - "step": 12160 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2489, - "step": 12161 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2226, - "step": 12162 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2337, - "step": 12163 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2412, - "step": 12164 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2351, - "step": 12165 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2308, - "step": 12166 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2229, - "step": 12167 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2257, - "step": 12168 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2188, - "step": 12169 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2349, - "step": 12170 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2291, - "step": 12171 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2251, - "step": 12172 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.236, - "step": 12173 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2263, - "step": 12174 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2252, - "step": 12175 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2198, - "step": 12176 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2297, - "step": 12177 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2439, - "step": 12178 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2234, - "step": 12179 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2191, - "step": 12180 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2196, - "step": 12181 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2378, - "step": 12182 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2244, - "step": 12183 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2419, - "step": 12184 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2362, - "step": 12185 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2173, - "step": 12186 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2246, - "step": 12187 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.234, - "step": 12188 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2331, - "step": 12189 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2229, - "step": 12190 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2307, - "step": 12191 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2329, - "step": 12192 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2242, - "step": 12193 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2303, - "step": 12194 - }, - { - "epoch": 1.5, - "learning_rate": 0.0003, - "loss": 0.2436, - "step": 12195 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2223, - "step": 12196 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.235, - "step": 12197 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.221, - "step": 12198 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2383, - "step": 12199 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2363, - "step": 12200 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2204, - "step": 12201 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2267, - "step": 12202 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2343, - "step": 12203 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2307, - "step": 12204 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2591, - "step": 12205 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2538, - "step": 12206 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2205, - "step": 12207 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2455, - "step": 12208 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2421, - "step": 12209 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2242, - "step": 12210 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2333, - "step": 12211 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2178, - "step": 12212 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2279, - "step": 12213 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2289, - "step": 12214 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2066, - "step": 12215 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2191, - "step": 12216 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2477, - "step": 12217 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2231, - "step": 12218 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2343, - "step": 12219 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2368, - "step": 12220 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.223, - "step": 12221 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2136, - "step": 12222 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2365, - "step": 12223 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2237, - "step": 12224 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2235, - "step": 12225 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2082, - "step": 12226 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2252, - "step": 12227 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2218, - "step": 12228 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2471, - "step": 12229 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2356, - "step": 12230 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2299, - "step": 12231 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2312, - "step": 12232 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2378, - "step": 12233 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2303, - "step": 12234 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2282, - "step": 12235 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.232, - "step": 12236 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2225, - "step": 12237 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2536, - "step": 12238 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2187, - "step": 12239 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2357, - "step": 12240 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2377, - "step": 12241 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.226, - "step": 12242 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2247, - "step": 12243 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2219, - "step": 12244 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2349, - "step": 12245 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2284, - "step": 12246 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2322, - "step": 12247 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2348, - "step": 12248 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.227, - "step": 12249 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2308, - "step": 12250 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2262, - "step": 12251 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2304, - "step": 12252 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2417, - "step": 12253 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.214, - "step": 12254 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2127, - "step": 12255 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2242, - "step": 12256 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2332, - "step": 12257 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2407, - "step": 12258 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2276, - "step": 12259 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2341, - "step": 12260 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2181, - "step": 12261 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2034, - "step": 12262 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2277, - "step": 12263 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2288, - "step": 12264 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2301, - "step": 12265 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.225, - "step": 12266 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2334, - "step": 12267 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.213, - "step": 12268 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2236, - "step": 12269 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2341, - "step": 12270 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2223, - "step": 12271 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2222, - "step": 12272 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2294, - "step": 12273 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2347, - "step": 12274 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.2318, - "step": 12275 - }, - { - "epoch": 1.51, - "learning_rate": 0.0003, - "loss": 0.228, - "step": 12276 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2272, - "step": 12277 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2278, - "step": 12278 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2282, - "step": 12279 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2234, - "step": 12280 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2358, - "step": 12281 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2295, - "step": 12282 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2251, - "step": 12283 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.23, - "step": 12284 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2175, - "step": 12285 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2086, - "step": 12286 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2424, - "step": 12287 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2156, - "step": 12288 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2347, - "step": 12289 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2337, - "step": 12290 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2341, - "step": 12291 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.227, - "step": 12292 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.226, - "step": 12293 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2232, - "step": 12294 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2294, - "step": 12295 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2313, - "step": 12296 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2285, - "step": 12297 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2362, - "step": 12298 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2381, - "step": 12299 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.237, - "step": 12300 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2314, - "step": 12301 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2478, - "step": 12302 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2189, - "step": 12303 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2229, - "step": 12304 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2212, - "step": 12305 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2416, - "step": 12306 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2363, - "step": 12307 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2401, - "step": 12308 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2251, - "step": 12309 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.249, - "step": 12310 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2326, - "step": 12311 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2298, - "step": 12312 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2204, - "step": 12313 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2437, - "step": 12314 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2177, - "step": 12315 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2322, - "step": 12316 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2098, - "step": 12317 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2222, - "step": 12318 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2358, - "step": 12319 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2456, - "step": 12320 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2211, - "step": 12321 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2408, - "step": 12322 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2267, - "step": 12323 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2415, - "step": 12324 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.234, - "step": 12325 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2493, - "step": 12326 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2384, - "step": 12327 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2173, - "step": 12328 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2356, - "step": 12329 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2197, - "step": 12330 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2263, - "step": 12331 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2304, - "step": 12332 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2378, - "step": 12333 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2438, - "step": 12334 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2327, - "step": 12335 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2254, - "step": 12336 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2223, - "step": 12337 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2311, - "step": 12338 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2383, - "step": 12339 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2211, - "step": 12340 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2141, - "step": 12341 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2376, - "step": 12342 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2183, - "step": 12343 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.231, - "step": 12344 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2236, - "step": 12345 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2244, - "step": 12346 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2282, - "step": 12347 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2301, - "step": 12348 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2228, - "step": 12349 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2378, - "step": 12350 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2392, - "step": 12351 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2212, - "step": 12352 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2241, - "step": 12353 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2173, - "step": 12354 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2381, - "step": 12355 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2248, - "step": 12356 - }, - { - "epoch": 1.52, - "learning_rate": 0.0003, - "loss": 0.2195, - "step": 12357 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2251, - "step": 12358 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2365, - "step": 12359 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2367, - "step": 12360 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2414, - "step": 12361 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.235, - "step": 12362 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2313, - "step": 12363 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2289, - "step": 12364 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2268, - "step": 12365 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2134, - "step": 12366 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2196, - "step": 12367 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2261, - "step": 12368 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2367, - "step": 12369 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2417, - "step": 12370 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2204, - "step": 12371 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.224, - "step": 12372 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2364, - "step": 12373 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2243, - "step": 12374 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2099, - "step": 12375 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2177, - "step": 12376 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2249, - "step": 12377 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2227, - "step": 12378 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2191, - "step": 12379 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2481, - "step": 12380 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2288, - "step": 12381 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2403, - "step": 12382 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2213, - "step": 12383 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2338, - "step": 12384 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2348, - "step": 12385 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2306, - "step": 12386 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2146, - "step": 12387 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2156, - "step": 12388 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2078, - "step": 12389 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2289, - "step": 12390 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2215, - "step": 12391 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2294, - "step": 12392 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2308, - "step": 12393 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2317, - "step": 12394 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2342, - "step": 12395 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2446, - "step": 12396 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2144, - "step": 12397 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2294, - "step": 12398 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2271, - "step": 12399 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2258, - "step": 12400 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2254, - "step": 12401 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.215, - "step": 12402 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2245, - "step": 12403 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2345, - "step": 12404 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2111, - "step": 12405 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2311, - "step": 12406 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2242, - "step": 12407 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2344, - "step": 12408 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2289, - "step": 12409 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2215, - "step": 12410 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2297, - "step": 12411 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2236, - "step": 12412 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.229, - "step": 12413 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2261, - "step": 12414 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2229, - "step": 12415 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2162, - "step": 12416 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2201, - "step": 12417 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2193, - "step": 12418 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2435, - "step": 12419 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2298, - "step": 12420 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2169, - "step": 12421 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2432, - "step": 12422 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2165, - "step": 12423 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2266, - "step": 12424 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2542, - "step": 12425 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2234, - "step": 12426 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2235, - "step": 12427 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2268, - "step": 12428 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2277, - "step": 12429 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2281, - "step": 12430 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2174, - "step": 12431 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2242, - "step": 12432 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2311, - "step": 12433 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2317, - "step": 12434 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2203, - "step": 12435 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.223, - "step": 12436 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2303, - "step": 12437 - }, - { - "epoch": 1.53, - "learning_rate": 0.0003, - "loss": 0.2297, - "step": 12438 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.22, - "step": 12439 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2303, - "step": 12440 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2319, - "step": 12441 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2278, - "step": 12442 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2255, - "step": 12443 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2348, - "step": 12444 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2318, - "step": 12445 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.211, - "step": 12446 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2294, - "step": 12447 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2222, - "step": 12448 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2412, - "step": 12449 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2247, - "step": 12450 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2246, - "step": 12451 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2112, - "step": 12452 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2148, - "step": 12453 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2323, - "step": 12454 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.213, - "step": 12455 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2465, - "step": 12456 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2158, - "step": 12457 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2325, - "step": 12458 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2447, - "step": 12459 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2178, - "step": 12460 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2338, - "step": 12461 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2236, - "step": 12462 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2259, - "step": 12463 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.214, - "step": 12464 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2237, - "step": 12465 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2328, - "step": 12466 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2293, - "step": 12467 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2285, - "step": 12468 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.227, - "step": 12469 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2333, - "step": 12470 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2368, - "step": 12471 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.245, - "step": 12472 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2266, - "step": 12473 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.225, - "step": 12474 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2106, - "step": 12475 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2262, - "step": 12476 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2358, - "step": 12477 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2204, - "step": 12478 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2436, - "step": 12479 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2307, - "step": 12480 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2142, - "step": 12481 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2227, - "step": 12482 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2374, - "step": 12483 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2406, - "step": 12484 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.216, - "step": 12485 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2155, - "step": 12486 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2119, - "step": 12487 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.226, - "step": 12488 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2321, - "step": 12489 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2153, - "step": 12490 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.237, - "step": 12491 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2236, - "step": 12492 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2295, - "step": 12493 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2316, - "step": 12494 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2252, - "step": 12495 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2271, - "step": 12496 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2122, - "step": 12497 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2334, - "step": 12498 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2154, - "step": 12499 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2283, - "step": 12500 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2183, - "step": 12501 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2201, - "step": 12502 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2312, - "step": 12503 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2189, - "step": 12504 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2195, - "step": 12505 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2244, - "step": 12506 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2283, - "step": 12507 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2229, - "step": 12508 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.224, - "step": 12509 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2294, - "step": 12510 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2177, - "step": 12511 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2323, - "step": 12512 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.218, - "step": 12513 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2239, - "step": 12514 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2345, - "step": 12515 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2341, - "step": 12516 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2221, - "step": 12517 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2241, - "step": 12518 - }, - { - "epoch": 1.54, - "learning_rate": 0.0003, - "loss": 0.2239, - "step": 12519 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2149, - "step": 12520 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2234, - "step": 12521 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.232, - "step": 12522 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2287, - "step": 12523 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2439, - "step": 12524 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2351, - "step": 12525 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2136, - "step": 12526 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2211, - "step": 12527 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2277, - "step": 12528 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2299, - "step": 12529 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2361, - "step": 12530 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2396, - "step": 12531 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2402, - "step": 12532 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2105, - "step": 12533 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2354, - "step": 12534 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2345, - "step": 12535 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2318, - "step": 12536 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.228, - "step": 12537 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2094, - "step": 12538 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2415, - "step": 12539 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2479, - "step": 12540 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2312, - "step": 12541 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2366, - "step": 12542 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2442, - "step": 12543 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2287, - "step": 12544 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2225, - "step": 12545 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2225, - "step": 12546 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2315, - "step": 12547 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2199, - "step": 12548 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2292, - "step": 12549 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2404, - "step": 12550 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2359, - "step": 12551 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2077, - "step": 12552 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2077, - "step": 12553 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2201, - "step": 12554 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2205, - "step": 12555 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2298, - "step": 12556 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2348, - "step": 12557 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2158, - "step": 12558 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2118, - "step": 12559 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.234, - "step": 12560 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2305, - "step": 12561 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2143, - "step": 12562 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2229, - "step": 12563 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.227, - "step": 12564 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.218, - "step": 12565 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2427, - "step": 12566 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2311, - "step": 12567 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2097, - "step": 12568 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2251, - "step": 12569 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2291, - "step": 12570 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2274, - "step": 12571 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2352, - "step": 12572 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2264, - "step": 12573 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2308, - "step": 12574 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2315, - "step": 12575 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2166, - "step": 12576 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2183, - "step": 12577 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.237, - "step": 12578 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.225, - "step": 12579 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2417, - "step": 12580 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2319, - "step": 12581 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2109, - "step": 12582 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.231, - "step": 12583 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2389, - "step": 12584 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2278, - "step": 12585 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.248, - "step": 12586 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.236, - "step": 12587 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2311, - "step": 12588 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2164, - "step": 12589 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2026, - "step": 12590 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2304, - "step": 12591 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2212, - "step": 12592 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2303, - "step": 12593 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2513, - "step": 12594 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2236, - "step": 12595 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2275, - "step": 12596 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2178, - "step": 12597 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2326, - "step": 12598 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.2278, - "step": 12599 - }, - { - "epoch": 1.55, - "learning_rate": 0.0003, - "loss": 0.224, - "step": 12600 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2478, - "step": 12601 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2407, - "step": 12602 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2344, - "step": 12603 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2244, - "step": 12604 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2108, - "step": 12605 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2271, - "step": 12606 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2313, - "step": 12607 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2212, - "step": 12608 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2153, - "step": 12609 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2292, - "step": 12610 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.234, - "step": 12611 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.228, - "step": 12612 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.212, - "step": 12613 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2199, - "step": 12614 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2384, - "step": 12615 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2435, - "step": 12616 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2486, - "step": 12617 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2326, - "step": 12618 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2384, - "step": 12619 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2451, - "step": 12620 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2091, - "step": 12621 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2328, - "step": 12622 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2176, - "step": 12623 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.24, - "step": 12624 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2252, - "step": 12625 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2211, - "step": 12626 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2373, - "step": 12627 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2235, - "step": 12628 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2469, - "step": 12629 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2182, - "step": 12630 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2272, - "step": 12631 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2375, - "step": 12632 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2309, - "step": 12633 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2291, - "step": 12634 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2231, - "step": 12635 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2204, - "step": 12636 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.214, - "step": 12637 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.228, - "step": 12638 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2239, - "step": 12639 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.24, - "step": 12640 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2391, - "step": 12641 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2349, - "step": 12642 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2211, - "step": 12643 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2349, - "step": 12644 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2382, - "step": 12645 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2214, - "step": 12646 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.221, - "step": 12647 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2224, - "step": 12648 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2162, - "step": 12649 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2427, - "step": 12650 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2256, - "step": 12651 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2276, - "step": 12652 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2331, - "step": 12653 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.208, - "step": 12654 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2205, - "step": 12655 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2186, - "step": 12656 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2327, - "step": 12657 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2305, - "step": 12658 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2337, - "step": 12659 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2284, - "step": 12660 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2374, - "step": 12661 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2186, - "step": 12662 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2284, - "step": 12663 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2318, - "step": 12664 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2292, - "step": 12665 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2405, - "step": 12666 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.231, - "step": 12667 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2337, - "step": 12668 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2066, - "step": 12669 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2112, - "step": 12670 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2309, - "step": 12671 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2276, - "step": 12672 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2272, - "step": 12673 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2369, - "step": 12674 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2048, - "step": 12675 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2422, - "step": 12676 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2272, - "step": 12677 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2179, - "step": 12678 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2301, - "step": 12679 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.224, - "step": 12680 - }, - { - "epoch": 1.56, - "learning_rate": 0.0003, - "loss": 0.2164, - "step": 12681 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2285, - "step": 12682 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.229, - "step": 12683 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2217, - "step": 12684 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2218, - "step": 12685 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2371, - "step": 12686 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2218, - "step": 12687 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2137, - "step": 12688 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2274, - "step": 12689 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2366, - "step": 12690 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2199, - "step": 12691 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2308, - "step": 12692 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2139, - "step": 12693 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2259, - "step": 12694 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2179, - "step": 12695 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2031, - "step": 12696 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2285, - "step": 12697 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2298, - "step": 12698 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2245, - "step": 12699 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2336, - "step": 12700 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2337, - "step": 12701 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2346, - "step": 12702 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2178, - "step": 12703 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2201, - "step": 12704 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2212, - "step": 12705 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2215, - "step": 12706 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2329, - "step": 12707 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2084, - "step": 12708 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2317, - "step": 12709 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2414, - "step": 12710 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2176, - "step": 12711 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2236, - "step": 12712 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2356, - "step": 12713 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2249, - "step": 12714 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2368, - "step": 12715 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2324, - "step": 12716 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2194, - "step": 12717 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2182, - "step": 12718 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2316, - "step": 12719 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2362, - "step": 12720 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2171, - "step": 12721 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2322, - "step": 12722 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2395, - "step": 12723 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.24, - "step": 12724 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2252, - "step": 12725 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2246, - "step": 12726 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2309, - "step": 12727 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2311, - "step": 12728 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2316, - "step": 12729 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2342, - "step": 12730 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2288, - "step": 12731 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2184, - "step": 12732 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2239, - "step": 12733 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2259, - "step": 12734 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2311, - "step": 12735 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2302, - "step": 12736 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2349, - "step": 12737 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2299, - "step": 12738 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2141, - "step": 12739 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2349, - "step": 12740 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2157, - "step": 12741 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.224, - "step": 12742 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2287, - "step": 12743 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.215, - "step": 12744 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2293, - "step": 12745 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2355, - "step": 12746 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2295, - "step": 12747 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2322, - "step": 12748 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2279, - "step": 12749 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2399, - "step": 12750 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2207, - "step": 12751 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2088, - "step": 12752 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2164, - "step": 12753 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.233, - "step": 12754 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2294, - "step": 12755 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2294, - "step": 12756 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2303, - "step": 12757 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2298, - "step": 12758 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2136, - "step": 12759 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2115, - "step": 12760 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2303, - "step": 12761 - }, - { - "epoch": 1.57, - "learning_rate": 0.0003, - "loss": 0.2389, - "step": 12762 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2245, - "step": 12763 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2301, - "step": 12764 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2276, - "step": 12765 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2359, - "step": 12766 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2322, - "step": 12767 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2312, - "step": 12768 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2462, - "step": 12769 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2297, - "step": 12770 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.225, - "step": 12771 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2281, - "step": 12772 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2207, - "step": 12773 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2324, - "step": 12774 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2164, - "step": 12775 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2199, - "step": 12776 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2224, - "step": 12777 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2362, - "step": 12778 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2243, - "step": 12779 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2256, - "step": 12780 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2171, - "step": 12781 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2334, - "step": 12782 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2254, - "step": 12783 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2283, - "step": 12784 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2369, - "step": 12785 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.234, - "step": 12786 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2226, - "step": 12787 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2301, - "step": 12788 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2346, - "step": 12789 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2291, - "step": 12790 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2346, - "step": 12791 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2304, - "step": 12792 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2199, - "step": 12793 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2164, - "step": 12794 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2346, - "step": 12795 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2221, - "step": 12796 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2152, - "step": 12797 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2326, - "step": 12798 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2199, - "step": 12799 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2338, - "step": 12800 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2132, - "step": 12801 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2267, - "step": 12802 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2267, - "step": 12803 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.239, - "step": 12804 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2107, - "step": 12805 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2375, - "step": 12806 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.243, - "step": 12807 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2325, - "step": 12808 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2293, - "step": 12809 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2365, - "step": 12810 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2321, - "step": 12811 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2148, - "step": 12812 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2449, - "step": 12813 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2282, - "step": 12814 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2227, - "step": 12815 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2525, - "step": 12816 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2344, - "step": 12817 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2276, - "step": 12818 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2393, - "step": 12819 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2329, - "step": 12820 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2302, - "step": 12821 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2267, - "step": 12822 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2398, - "step": 12823 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2382, - "step": 12824 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2317, - "step": 12825 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2253, - "step": 12826 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2082, - "step": 12827 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2122, - "step": 12828 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2162, - "step": 12829 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2315, - "step": 12830 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2397, - "step": 12831 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2288, - "step": 12832 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2254, - "step": 12833 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.222, - "step": 12834 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2269, - "step": 12835 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2111, - "step": 12836 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2302, - "step": 12837 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2401, - "step": 12838 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2245, - "step": 12839 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2238, - "step": 12840 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2241, - "step": 12841 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2231, - "step": 12842 - }, - { - "epoch": 1.58, - "learning_rate": 0.0003, - "loss": 0.2362, - "step": 12843 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2134, - "step": 12844 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2415, - "step": 12845 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2317, - "step": 12846 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2143, - "step": 12847 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2261, - "step": 12848 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2301, - "step": 12849 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2324, - "step": 12850 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2101, - "step": 12851 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2422, - "step": 12852 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.231, - "step": 12853 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2125, - "step": 12854 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2247, - "step": 12855 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2267, - "step": 12856 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2415, - "step": 12857 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2309, - "step": 12858 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2292, - "step": 12859 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2098, - "step": 12860 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2334, - "step": 12861 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2273, - "step": 12862 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2227, - "step": 12863 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2211, - "step": 12864 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2215, - "step": 12865 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2332, - "step": 12866 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2379, - "step": 12867 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2176, - "step": 12868 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2165, - "step": 12869 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2234, - "step": 12870 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2118, - "step": 12871 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2254, - "step": 12872 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2324, - "step": 12873 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2279, - "step": 12874 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2318, - "step": 12875 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2426, - "step": 12876 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2299, - "step": 12877 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.213, - "step": 12878 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.221, - "step": 12879 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2207, - "step": 12880 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2285, - "step": 12881 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.222, - "step": 12882 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2066, - "step": 12883 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2264, - "step": 12884 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.1974, - "step": 12885 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2315, - "step": 12886 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2199, - "step": 12887 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2297, - "step": 12888 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2305, - "step": 12889 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2307, - "step": 12890 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2389, - "step": 12891 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2261, - "step": 12892 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2242, - "step": 12893 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2085, - "step": 12894 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2163, - "step": 12895 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2263, - "step": 12896 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2341, - "step": 12897 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.227, - "step": 12898 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2256, - "step": 12899 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2362, - "step": 12900 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2393, - "step": 12901 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2368, - "step": 12902 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2227, - "step": 12903 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2098, - "step": 12904 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2309, - "step": 12905 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2205, - "step": 12906 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2269, - "step": 12907 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2182, - "step": 12908 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2211, - "step": 12909 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2297, - "step": 12910 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2342, - "step": 12911 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2314, - "step": 12912 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2443, - "step": 12913 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2173, - "step": 12914 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.218, - "step": 12915 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2387, - "step": 12916 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2293, - "step": 12917 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2047, - "step": 12918 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2417, - "step": 12919 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.224, - "step": 12920 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2174, - "step": 12921 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2379, - "step": 12922 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2337, - "step": 12923 - }, - { - "epoch": 1.59, - "learning_rate": 0.0003, - "loss": 0.2319, - "step": 12924 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2069, - "step": 12925 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2227, - "step": 12926 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2258, - "step": 12927 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2261, - "step": 12928 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2296, - "step": 12929 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2134, - "step": 12930 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2358, - "step": 12931 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2411, - "step": 12932 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2374, - "step": 12933 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2282, - "step": 12934 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2266, - "step": 12935 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.236, - "step": 12936 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2271, - "step": 12937 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2403, - "step": 12938 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2454, - "step": 12939 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2381, - "step": 12940 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2317, - "step": 12941 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2097, - "step": 12942 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2428, - "step": 12943 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2282, - "step": 12944 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2316, - "step": 12945 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2316, - "step": 12946 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2309, - "step": 12947 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.209, - "step": 12948 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2316, - "step": 12949 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2376, - "step": 12950 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2289, - "step": 12951 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2349, - "step": 12952 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2247, - "step": 12953 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2234, - "step": 12954 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2096, - "step": 12955 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.219, - "step": 12956 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2277, - "step": 12957 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2162, - "step": 12958 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.228, - "step": 12959 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2235, - "step": 12960 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2242, - "step": 12961 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2126, - "step": 12962 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2327, - "step": 12963 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2274, - "step": 12964 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2097, - "step": 12965 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2323, - "step": 12966 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2244, - "step": 12967 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.231, - "step": 12968 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2389, - "step": 12969 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2261, - "step": 12970 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.234, - "step": 12971 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2252, - "step": 12972 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2168, - "step": 12973 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.22, - "step": 12974 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2208, - "step": 12975 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2343, - "step": 12976 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2239, - "step": 12977 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2299, - "step": 12978 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2248, - "step": 12979 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2361, - "step": 12980 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2354, - "step": 12981 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2307, - "step": 12982 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2168, - "step": 12983 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2352, - "step": 12984 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2253, - "step": 12985 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2235, - "step": 12986 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2258, - "step": 12987 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2262, - "step": 12988 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2132, - "step": 12989 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2175, - "step": 12990 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2334, - "step": 12991 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2315, - "step": 12992 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2342, - "step": 12993 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2309, - "step": 12994 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2058, - "step": 12995 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2325, - "step": 12996 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2344, - "step": 12997 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2302, - "step": 12998 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2359, - "step": 12999 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2316, - "step": 13000 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2269, - "step": 13001 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.206, - "step": 13002 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2229, - "step": 13003 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2258, - "step": 13004 - }, - { - "epoch": 1.6, - "learning_rate": 0.0003, - "loss": 0.2301, - "step": 13005 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2313, - "step": 13006 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2255, - "step": 13007 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2171, - "step": 13008 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2311, - "step": 13009 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2234, - "step": 13010 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2276, - "step": 13011 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2303, - "step": 13012 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2269, - "step": 13013 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2168, - "step": 13014 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2208, - "step": 13015 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2114, - "step": 13016 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2173, - "step": 13017 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2187, - "step": 13018 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2347, - "step": 13019 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2187, - "step": 13020 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2387, - "step": 13021 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2307, - "step": 13022 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2386, - "step": 13023 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2295, - "step": 13024 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2235, - "step": 13025 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2237, - "step": 13026 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2176, - "step": 13027 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2165, - "step": 13028 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.225, - "step": 13029 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2238, - "step": 13030 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2273, - "step": 13031 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2217, - "step": 13032 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2268, - "step": 13033 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2304, - "step": 13034 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2404, - "step": 13035 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2178, - "step": 13036 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2216, - "step": 13037 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2094, - "step": 13038 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2426, - "step": 13039 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2308, - "step": 13040 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.22, - "step": 13041 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2064, - "step": 13042 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2374, - "step": 13043 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2295, - "step": 13044 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2288, - "step": 13045 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2315, - "step": 13046 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2168, - "step": 13047 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.235, - "step": 13048 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2227, - "step": 13049 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2391, - "step": 13050 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2247, - "step": 13051 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2246, - "step": 13052 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2179, - "step": 13053 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2346, - "step": 13054 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2221, - "step": 13055 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2281, - "step": 13056 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2334, - "step": 13057 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2282, - "step": 13058 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2386, - "step": 13059 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.23, - "step": 13060 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2241, - "step": 13061 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2149, - "step": 13062 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2343, - "step": 13063 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2243, - "step": 13064 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2217, - "step": 13065 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2209, - "step": 13066 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2309, - "step": 13067 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2234, - "step": 13068 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2297, - "step": 13069 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2324, - "step": 13070 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2358, - "step": 13071 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2332, - "step": 13072 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2449, - "step": 13073 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2396, - "step": 13074 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2281, - "step": 13075 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2207, - "step": 13076 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2174, - "step": 13077 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2422, - "step": 13078 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2235, - "step": 13079 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.222, - "step": 13080 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2191, - "step": 13081 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2215, - "step": 13082 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2241, - "step": 13083 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2283, - "step": 13084 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2183, - "step": 13085 - }, - { - "epoch": 1.61, - "learning_rate": 0.0003, - "loss": 0.2344, - "step": 13086 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2253, - "step": 13087 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2223, - "step": 13088 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2174, - "step": 13089 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2347, - "step": 13090 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2101, - "step": 13091 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2291, - "step": 13092 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2102, - "step": 13093 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2187, - "step": 13094 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.217, - "step": 13095 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2331, - "step": 13096 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2291, - "step": 13097 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.218, - "step": 13098 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2141, - "step": 13099 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2214, - "step": 13100 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2244, - "step": 13101 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2232, - "step": 13102 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2341, - "step": 13103 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2228, - "step": 13104 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2184, - "step": 13105 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2354, - "step": 13106 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2384, - "step": 13107 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.245, - "step": 13108 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2373, - "step": 13109 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2278, - "step": 13110 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2384, - "step": 13111 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2142, - "step": 13112 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2308, - "step": 13113 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2225, - "step": 13114 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2236, - "step": 13115 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2146, - "step": 13116 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.231, - "step": 13117 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2221, - "step": 13118 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2323, - "step": 13119 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.219, - "step": 13120 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2321, - "step": 13121 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2226, - "step": 13122 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2214, - "step": 13123 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2175, - "step": 13124 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2414, - "step": 13125 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2176, - "step": 13126 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2399, - "step": 13127 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2269, - "step": 13128 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2322, - "step": 13129 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2432, - "step": 13130 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.233, - "step": 13131 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2339, - "step": 13132 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2221, - "step": 13133 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2109, - "step": 13134 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2261, - "step": 13135 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.228, - "step": 13136 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2222, - "step": 13137 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.219, - "step": 13138 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2403, - "step": 13139 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2265, - "step": 13140 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2179, - "step": 13141 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2252, - "step": 13142 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2245, - "step": 13143 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2398, - "step": 13144 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2326, - "step": 13145 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2328, - "step": 13146 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2318, - "step": 13147 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2162, - "step": 13148 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2254, - "step": 13149 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2215, - "step": 13150 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2145, - "step": 13151 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2304, - "step": 13152 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2156, - "step": 13153 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2096, - "step": 13154 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2489, - "step": 13155 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2439, - "step": 13156 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2029, - "step": 13157 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.223, - "step": 13158 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2255, - "step": 13159 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2193, - "step": 13160 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2264, - "step": 13161 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2201, - "step": 13162 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2443, - "step": 13163 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2175, - "step": 13164 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2237, - "step": 13165 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.223, - "step": 13166 - }, - { - "epoch": 1.62, - "learning_rate": 0.0003, - "loss": 0.2257, - "step": 13167 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2419, - "step": 13168 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2425, - "step": 13169 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2374, - "step": 13170 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2156, - "step": 13171 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2331, - "step": 13172 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2177, - "step": 13173 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2043, - "step": 13174 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2178, - "step": 13175 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2286, - "step": 13176 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2245, - "step": 13177 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2191, - "step": 13178 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2078, - "step": 13179 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2195, - "step": 13180 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2431, - "step": 13181 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.227, - "step": 13182 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2292, - "step": 13183 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2274, - "step": 13184 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2322, - "step": 13185 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2338, - "step": 13186 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2437, - "step": 13187 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2524, - "step": 13188 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2267, - "step": 13189 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2249, - "step": 13190 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2161, - "step": 13191 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2316, - "step": 13192 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2317, - "step": 13193 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2445, - "step": 13194 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2191, - "step": 13195 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2247, - "step": 13196 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.232, - "step": 13197 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2378, - "step": 13198 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.218, - "step": 13199 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2163, - "step": 13200 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2344, - "step": 13201 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2055, - "step": 13202 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.217, - "step": 13203 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2256, - "step": 13204 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2091, - "step": 13205 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2433, - "step": 13206 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2164, - "step": 13207 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2336, - "step": 13208 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2267, - "step": 13209 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2436, - "step": 13210 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2208, - "step": 13211 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2412, - "step": 13212 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.218, - "step": 13213 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2307, - "step": 13214 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2291, - "step": 13215 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2375, - "step": 13216 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2311, - "step": 13217 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2371, - "step": 13218 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2262, - "step": 13219 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2295, - "step": 13220 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2346, - "step": 13221 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2265, - "step": 13222 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2276, - "step": 13223 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2232, - "step": 13224 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2308, - "step": 13225 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.235, - "step": 13226 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2327, - "step": 13227 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2222, - "step": 13228 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2387, - "step": 13229 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2258, - "step": 13230 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2414, - "step": 13231 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2262, - "step": 13232 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2257, - "step": 13233 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2306, - "step": 13234 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2226, - "step": 13235 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2139, - "step": 13236 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2236, - "step": 13237 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2217, - "step": 13238 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2201, - "step": 13239 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2289, - "step": 13240 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2318, - "step": 13241 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.234, - "step": 13242 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2055, - "step": 13243 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2321, - "step": 13244 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2115, - "step": 13245 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2286, - "step": 13246 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.218, - "step": 13247 - }, - { - "epoch": 1.63, - "learning_rate": 0.0003, - "loss": 0.2388, - "step": 13248 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2284, - "step": 13249 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2404, - "step": 13250 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2335, - "step": 13251 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2188, - "step": 13252 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2272, - "step": 13253 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2295, - "step": 13254 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2434, - "step": 13255 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2166, - "step": 13256 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2179, - "step": 13257 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2499, - "step": 13258 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2108, - "step": 13259 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2253, - "step": 13260 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2282, - "step": 13261 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2355, - "step": 13262 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2203, - "step": 13263 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2321, - "step": 13264 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2219, - "step": 13265 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2176, - "step": 13266 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2266, - "step": 13267 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2287, - "step": 13268 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2287, - "step": 13269 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2335, - "step": 13270 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2186, - "step": 13271 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2301, - "step": 13272 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2166, - "step": 13273 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2372, - "step": 13274 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2326, - "step": 13275 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2081, - "step": 13276 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.237, - "step": 13277 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2265, - "step": 13278 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2231, - "step": 13279 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2295, - "step": 13280 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2239, - "step": 13281 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2219, - "step": 13282 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2188, - "step": 13283 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2107, - "step": 13284 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2344, - "step": 13285 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2465, - "step": 13286 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2128, - "step": 13287 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2282, - "step": 13288 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2053, - "step": 13289 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.226, - "step": 13290 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2278, - "step": 13291 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.246, - "step": 13292 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2278, - "step": 13293 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2247, - "step": 13294 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2135, - "step": 13295 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2309, - "step": 13296 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2156, - "step": 13297 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2306, - "step": 13298 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2313, - "step": 13299 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2337, - "step": 13300 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2068, - "step": 13301 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2167, - "step": 13302 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2273, - "step": 13303 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2114, - "step": 13304 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2325, - "step": 13305 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2235, - "step": 13306 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2271, - "step": 13307 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.22, - "step": 13308 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2252, - "step": 13309 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2216, - "step": 13310 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2141, - "step": 13311 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2182, - "step": 13312 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2293, - "step": 13313 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2229, - "step": 13314 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2186, - "step": 13315 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2392, - "step": 13316 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2329, - "step": 13317 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2385, - "step": 13318 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2198, - "step": 13319 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2168, - "step": 13320 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2339, - "step": 13321 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2357, - "step": 13322 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2405, - "step": 13323 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2342, - "step": 13324 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2238, - "step": 13325 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2222, - "step": 13326 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.236, - "step": 13327 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2245, - "step": 13328 - }, - { - "epoch": 1.64, - "learning_rate": 0.0003, - "loss": 0.2249, - "step": 13329 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2212, - "step": 13330 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2276, - "step": 13331 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2145, - "step": 13332 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2212, - "step": 13333 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2238, - "step": 13334 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2162, - "step": 13335 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2333, - "step": 13336 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2277, - "step": 13337 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2195, - "step": 13338 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2334, - "step": 13339 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2038, - "step": 13340 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2024, - "step": 13341 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2292, - "step": 13342 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2277, - "step": 13343 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2323, - "step": 13344 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2337, - "step": 13345 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.231, - "step": 13346 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2246, - "step": 13347 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2336, - "step": 13348 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2258, - "step": 13349 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2347, - "step": 13350 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2171, - "step": 13351 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2227, - "step": 13352 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2282, - "step": 13353 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2306, - "step": 13354 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.225, - "step": 13355 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2181, - "step": 13356 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2274, - "step": 13357 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.219, - "step": 13358 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2344, - "step": 13359 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2222, - "step": 13360 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2268, - "step": 13361 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2149, - "step": 13362 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2162, - "step": 13363 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2268, - "step": 13364 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2277, - "step": 13365 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2338, - "step": 13366 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2288, - "step": 13367 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2203, - "step": 13368 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2234, - "step": 13369 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.224, - "step": 13370 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2456, - "step": 13371 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2309, - "step": 13372 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2297, - "step": 13373 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2229, - "step": 13374 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2185, - "step": 13375 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2227, - "step": 13376 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2312, - "step": 13377 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2347, - "step": 13378 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2319, - "step": 13379 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2343, - "step": 13380 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2311, - "step": 13381 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2238, - "step": 13382 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2142, - "step": 13383 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2244, - "step": 13384 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2222, - "step": 13385 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2319, - "step": 13386 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2336, - "step": 13387 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2218, - "step": 13388 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2219, - "step": 13389 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2378, - "step": 13390 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2207, - "step": 13391 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2086, - "step": 13392 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2306, - "step": 13393 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2136, - "step": 13394 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2296, - "step": 13395 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2255, - "step": 13396 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2194, - "step": 13397 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2263, - "step": 13398 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.224, - "step": 13399 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2383, - "step": 13400 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2064, - "step": 13401 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2334, - "step": 13402 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.227, - "step": 13403 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2176, - "step": 13404 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2329, - "step": 13405 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2165, - "step": 13406 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2119, - "step": 13407 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2148, - "step": 13408 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2268, - "step": 13409 - }, - { - "epoch": 1.65, - "learning_rate": 0.0003, - "loss": 0.2314, - "step": 13410 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.235, - "step": 13411 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2286, - "step": 13412 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2339, - "step": 13413 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2358, - "step": 13414 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2129, - "step": 13415 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2192, - "step": 13416 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2214, - "step": 13417 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2214, - "step": 13418 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2105, - "step": 13419 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2139, - "step": 13420 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2171, - "step": 13421 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2128, - "step": 13422 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2131, - "step": 13423 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2042, - "step": 13424 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2215, - "step": 13425 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.221, - "step": 13426 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2186, - "step": 13427 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2093, - "step": 13428 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2239, - "step": 13429 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2202, - "step": 13430 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2254, - "step": 13431 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2196, - "step": 13432 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2355, - "step": 13433 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2352, - "step": 13434 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2346, - "step": 13435 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.233, - "step": 13436 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2228, - "step": 13437 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2355, - "step": 13438 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2122, - "step": 13439 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2297, - "step": 13440 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2132, - "step": 13441 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2302, - "step": 13442 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2188, - "step": 13443 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2269, - "step": 13444 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2142, - "step": 13445 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2448, - "step": 13446 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2523, - "step": 13447 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2019, - "step": 13448 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2099, - "step": 13449 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2307, - "step": 13450 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.219, - "step": 13451 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2218, - "step": 13452 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2095, - "step": 13453 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2346, - "step": 13454 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2094, - "step": 13455 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.236, - "step": 13456 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2317, - "step": 13457 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2141, - "step": 13458 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.23, - "step": 13459 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2365, - "step": 13460 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2291, - "step": 13461 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2281, - "step": 13462 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.218, - "step": 13463 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2292, - "step": 13464 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2326, - "step": 13465 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2248, - "step": 13466 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2076, - "step": 13467 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2238, - "step": 13468 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2161, - "step": 13469 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2173, - "step": 13470 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2093, - "step": 13471 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.218, - "step": 13472 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2098, - "step": 13473 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2307, - "step": 13474 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2278, - "step": 13475 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2199, - "step": 13476 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2279, - "step": 13477 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2115, - "step": 13478 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2214, - "step": 13479 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2123, - "step": 13480 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2046, - "step": 13481 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.218, - "step": 13482 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2278, - "step": 13483 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2247, - "step": 13484 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2234, - "step": 13485 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2255, - "step": 13486 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2274, - "step": 13487 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.232, - "step": 13488 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2169, - "step": 13489 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2097, - "step": 13490 - }, - { - "epoch": 1.66, - "learning_rate": 0.0003, - "loss": 0.2261, - "step": 13491 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.246, - "step": 13492 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2418, - "step": 13493 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2254, - "step": 13494 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2414, - "step": 13495 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.227, - "step": 13496 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2208, - "step": 13497 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2259, - "step": 13498 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2139, - "step": 13499 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2385, - "step": 13500 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2323, - "step": 13501 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2159, - "step": 13502 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.227, - "step": 13503 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2107, - "step": 13504 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2266, - "step": 13505 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2222, - "step": 13506 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2071, - "step": 13507 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2185, - "step": 13508 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.23, - "step": 13509 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2161, - "step": 13510 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2208, - "step": 13511 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2375, - "step": 13512 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2144, - "step": 13513 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2164, - "step": 13514 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2284, - "step": 13515 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2176, - "step": 13516 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2357, - "step": 13517 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2379, - "step": 13518 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2416, - "step": 13519 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2364, - "step": 13520 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2375, - "step": 13521 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.231, - "step": 13522 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2198, - "step": 13523 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.229, - "step": 13524 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2308, - "step": 13525 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2287, - "step": 13526 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2198, - "step": 13527 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2221, - "step": 13528 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2226, - "step": 13529 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2429, - "step": 13530 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2219, - "step": 13531 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2246, - "step": 13532 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2195, - "step": 13533 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2401, - "step": 13534 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.226, - "step": 13535 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2308, - "step": 13536 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2337, - "step": 13537 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2111, - "step": 13538 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2227, - "step": 13539 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2298, - "step": 13540 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2119, - "step": 13541 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2321, - "step": 13542 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2271, - "step": 13543 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2238, - "step": 13544 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2341, - "step": 13545 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2282, - "step": 13546 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2314, - "step": 13547 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.215, - "step": 13548 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2098, - "step": 13549 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2175, - "step": 13550 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2256, - "step": 13551 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2326, - "step": 13552 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2111, - "step": 13553 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.212, - "step": 13554 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2401, - "step": 13555 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2046, - "step": 13556 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2357, - "step": 13557 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.224, - "step": 13558 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2133, - "step": 13559 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2197, - "step": 13560 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.232, - "step": 13561 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.233, - "step": 13562 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2232, - "step": 13563 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2291, - "step": 13564 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2363, - "step": 13565 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2252, - "step": 13566 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2093, - "step": 13567 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2177, - "step": 13568 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2223, - "step": 13569 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2313, - "step": 13570 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.225, - "step": 13571 - }, - { - "epoch": 1.67, - "learning_rate": 0.0003, - "loss": 0.2271, - "step": 13572 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.218, - "step": 13573 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2289, - "step": 13574 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2248, - "step": 13575 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2224, - "step": 13576 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.214, - "step": 13577 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2208, - "step": 13578 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2015, - "step": 13579 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2221, - "step": 13580 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.214, - "step": 13581 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2341, - "step": 13582 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2279, - "step": 13583 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.241, - "step": 13584 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2288, - "step": 13585 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2263, - "step": 13586 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.227, - "step": 13587 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2346, - "step": 13588 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2221, - "step": 13589 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2195, - "step": 13590 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.216, - "step": 13591 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.22, - "step": 13592 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2293, - "step": 13593 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.225, - "step": 13594 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2266, - "step": 13595 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2346, - "step": 13596 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2266, - "step": 13597 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2093, - "step": 13598 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2366, - "step": 13599 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2337, - "step": 13600 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2228, - "step": 13601 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2286, - "step": 13602 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2278, - "step": 13603 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2251, - "step": 13604 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2261, - "step": 13605 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2177, - "step": 13606 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2193, - "step": 13607 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2296, - "step": 13608 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2368, - "step": 13609 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2125, - "step": 13610 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2093, - "step": 13611 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2333, - "step": 13612 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2284, - "step": 13613 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2352, - "step": 13614 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2392, - "step": 13615 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.213, - "step": 13616 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2106, - "step": 13617 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2337, - "step": 13618 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2181, - "step": 13619 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.233, - "step": 13620 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2225, - "step": 13621 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2267, - "step": 13622 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2376, - "step": 13623 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2211, - "step": 13624 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2305, - "step": 13625 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2214, - "step": 13626 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2143, - "step": 13627 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2342, - "step": 13628 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2193, - "step": 13629 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2268, - "step": 13630 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2177, - "step": 13631 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.218, - "step": 13632 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2237, - "step": 13633 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.227, - "step": 13634 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2371, - "step": 13635 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2157, - "step": 13636 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2306, - "step": 13637 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2178, - "step": 13638 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2121, - "step": 13639 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2327, - "step": 13640 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2228, - "step": 13641 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2295, - "step": 13642 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2264, - "step": 13643 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2172, - "step": 13644 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2249, - "step": 13645 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2216, - "step": 13646 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2257, - "step": 13647 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2288, - "step": 13648 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2303, - "step": 13649 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2409, - "step": 13650 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2334, - "step": 13651 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2333, - "step": 13652 - }, - { - "epoch": 1.68, - "learning_rate": 0.0003, - "loss": 0.2187, - "step": 13653 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2303, - "step": 13654 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2465, - "step": 13655 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2012, - "step": 13656 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2198, - "step": 13657 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2336, - "step": 13658 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2228, - "step": 13659 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2175, - "step": 13660 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2345, - "step": 13661 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2139, - "step": 13662 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.21, - "step": 13663 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2118, - "step": 13664 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2213, - "step": 13665 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2399, - "step": 13666 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2249, - "step": 13667 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.235, - "step": 13668 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.215, - "step": 13669 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2262, - "step": 13670 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2285, - "step": 13671 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2164, - "step": 13672 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2265, - "step": 13673 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2332, - "step": 13674 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2198, - "step": 13675 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2221, - "step": 13676 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2278, - "step": 13677 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2245, - "step": 13678 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2306, - "step": 13679 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2222, - "step": 13680 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2295, - "step": 13681 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.21, - "step": 13682 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.237, - "step": 13683 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2442, - "step": 13684 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2206, - "step": 13685 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2249, - "step": 13686 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2193, - "step": 13687 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2317, - "step": 13688 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2324, - "step": 13689 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2247, - "step": 13690 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2191, - "step": 13691 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2317, - "step": 13692 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.218, - "step": 13693 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2231, - "step": 13694 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2357, - "step": 13695 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2307, - "step": 13696 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2363, - "step": 13697 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2335, - "step": 13698 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2251, - "step": 13699 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2105, - "step": 13700 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2219, - "step": 13701 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2173, - "step": 13702 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2177, - "step": 13703 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2212, - "step": 13704 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2253, - "step": 13705 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2122, - "step": 13706 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2265, - "step": 13707 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2209, - "step": 13708 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2322, - "step": 13709 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2231, - "step": 13710 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2144, - "step": 13711 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2248, - "step": 13712 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2371, - "step": 13713 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2181, - "step": 13714 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2212, - "step": 13715 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2291, - "step": 13716 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.225, - "step": 13717 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2244, - "step": 13718 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2239, - "step": 13719 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2215, - "step": 13720 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.231, - "step": 13721 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2199, - "step": 13722 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2488, - "step": 13723 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2293, - "step": 13724 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2138, - "step": 13725 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2177, - "step": 13726 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2278, - "step": 13727 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.239, - "step": 13728 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2208, - "step": 13729 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2187, - "step": 13730 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2004, - "step": 13731 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2264, - "step": 13732 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2392, - "step": 13733 - }, - { - "epoch": 1.69, - "learning_rate": 0.0003, - "loss": 0.2246, - "step": 13734 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2345, - "step": 13735 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2255, - "step": 13736 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2361, - "step": 13737 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2314, - "step": 13738 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2243, - "step": 13739 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2318, - "step": 13740 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2209, - "step": 13741 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2121, - "step": 13742 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2282, - "step": 13743 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2342, - "step": 13744 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2052, - "step": 13745 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2063, - "step": 13746 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2208, - "step": 13747 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.22, - "step": 13748 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2284, - "step": 13749 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2277, - "step": 13750 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2338, - "step": 13751 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2214, - "step": 13752 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.232, - "step": 13753 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2039, - "step": 13754 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2301, - "step": 13755 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2167, - "step": 13756 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2246, - "step": 13757 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2295, - "step": 13758 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2231, - "step": 13759 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2214, - "step": 13760 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2211, - "step": 13761 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2085, - "step": 13762 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2212, - "step": 13763 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2196, - "step": 13764 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2228, - "step": 13765 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2447, - "step": 13766 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2329, - "step": 13767 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2171, - "step": 13768 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2379, - "step": 13769 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2159, - "step": 13770 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2241, - "step": 13771 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2246, - "step": 13772 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2572, - "step": 13773 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2217, - "step": 13774 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.226, - "step": 13775 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2258, - "step": 13776 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2193, - "step": 13777 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2189, - "step": 13778 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2161, - "step": 13779 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2231, - "step": 13780 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2208, - "step": 13781 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2255, - "step": 13782 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2197, - "step": 13783 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2191, - "step": 13784 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2226, - "step": 13785 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2205, - "step": 13786 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2363, - "step": 13787 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2321, - "step": 13788 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.211, - "step": 13789 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2297, - "step": 13790 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2236, - "step": 13791 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2432, - "step": 13792 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2383, - "step": 13793 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2356, - "step": 13794 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2216, - "step": 13795 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.209, - "step": 13796 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2214, - "step": 13797 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2166, - "step": 13798 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2316, - "step": 13799 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2312, - "step": 13800 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.229, - "step": 13801 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2306, - "step": 13802 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2203, - "step": 13803 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2246, - "step": 13804 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2122, - "step": 13805 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2241, - "step": 13806 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.213, - "step": 13807 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2085, - "step": 13808 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.212, - "step": 13809 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2362, - "step": 13810 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2428, - "step": 13811 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.2134, - "step": 13812 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.224, - "step": 13813 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.23, - "step": 13814 - }, - { - "epoch": 1.7, - "learning_rate": 0.0003, - "loss": 0.233, - "step": 13815 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2081, - "step": 13816 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2172, - "step": 13817 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2279, - "step": 13818 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2233, - "step": 13819 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.226, - "step": 13820 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2183, - "step": 13821 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2196, - "step": 13822 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2104, - "step": 13823 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2099, - "step": 13824 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2212, - "step": 13825 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.223, - "step": 13826 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2175, - "step": 13827 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.223, - "step": 13828 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2173, - "step": 13829 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2161, - "step": 13830 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2269, - "step": 13831 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2296, - "step": 13832 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2147, - "step": 13833 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2265, - "step": 13834 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2335, - "step": 13835 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2184, - "step": 13836 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2154, - "step": 13837 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2158, - "step": 13838 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2154, - "step": 13839 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2201, - "step": 13840 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2106, - "step": 13841 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2156, - "step": 13842 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2138, - "step": 13843 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2372, - "step": 13844 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2321, - "step": 13845 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2239, - "step": 13846 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2056, - "step": 13847 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.232, - "step": 13848 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2194, - "step": 13849 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2344, - "step": 13850 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2045, - "step": 13851 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2162, - "step": 13852 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2239, - "step": 13853 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2158, - "step": 13854 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2205, - "step": 13855 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.224, - "step": 13856 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2307, - "step": 13857 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.216, - "step": 13858 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2332, - "step": 13859 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2177, - "step": 13860 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2347, - "step": 13861 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2263, - "step": 13862 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2298, - "step": 13863 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2227, - "step": 13864 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2169, - "step": 13865 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2318, - "step": 13866 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.218, - "step": 13867 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2254, - "step": 13868 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2337, - "step": 13869 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2298, - "step": 13870 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2272, - "step": 13871 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2163, - "step": 13872 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2288, - "step": 13873 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.234, - "step": 13874 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.22, - "step": 13875 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2234, - "step": 13876 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2309, - "step": 13877 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.206, - "step": 13878 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2346, - "step": 13879 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2277, - "step": 13880 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2438, - "step": 13881 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2077, - "step": 13882 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2187, - "step": 13883 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2444, - "step": 13884 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2293, - "step": 13885 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2201, - "step": 13886 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2116, - "step": 13887 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2156, - "step": 13888 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2103, - "step": 13889 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2235, - "step": 13890 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2248, - "step": 13891 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2309, - "step": 13892 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2335, - "step": 13893 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2273, - "step": 13894 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2313, - "step": 13895 - }, - { - "epoch": 1.71, - "learning_rate": 0.0003, - "loss": 0.2298, - "step": 13896 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2182, - "step": 13897 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2147, - "step": 13898 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.208, - "step": 13899 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2372, - "step": 13900 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2178, - "step": 13901 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2207, - "step": 13902 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.236, - "step": 13903 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2226, - "step": 13904 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.225, - "step": 13905 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2259, - "step": 13906 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2183, - "step": 13907 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2213, - "step": 13908 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2082, - "step": 13909 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2121, - "step": 13910 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2293, - "step": 13911 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2374, - "step": 13912 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2288, - "step": 13913 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2259, - "step": 13914 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2304, - "step": 13915 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2284, - "step": 13916 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2241, - "step": 13917 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2243, - "step": 13918 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2191, - "step": 13919 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2322, - "step": 13920 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2214, - "step": 13921 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2226, - "step": 13922 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2191, - "step": 13923 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2143, - "step": 13924 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2141, - "step": 13925 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2321, - "step": 13926 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2359, - "step": 13927 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2261, - "step": 13928 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2267, - "step": 13929 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2329, - "step": 13930 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2355, - "step": 13931 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2136, - "step": 13932 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2207, - "step": 13933 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2225, - "step": 13934 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2108, - "step": 13935 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2184, - "step": 13936 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2076, - "step": 13937 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2334, - "step": 13938 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2157, - "step": 13939 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2288, - "step": 13940 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2109, - "step": 13941 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2208, - "step": 13942 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2115, - "step": 13943 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2206, - "step": 13944 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2396, - "step": 13945 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2194, - "step": 13946 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2227, - "step": 13947 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2187, - "step": 13948 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2109, - "step": 13949 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2375, - "step": 13950 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2325, - "step": 13951 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2153, - "step": 13952 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2213, - "step": 13953 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2359, - "step": 13954 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2379, - "step": 13955 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2225, - "step": 13956 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2153, - "step": 13957 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2194, - "step": 13958 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2205, - "step": 13959 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2322, - "step": 13960 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2267, - "step": 13961 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2262, - "step": 13962 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2332, - "step": 13963 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2285, - "step": 13964 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2353, - "step": 13965 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2369, - "step": 13966 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2202, - "step": 13967 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2207, - "step": 13968 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2216, - "step": 13969 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2197, - "step": 13970 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2193, - "step": 13971 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2104, - "step": 13972 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2242, - "step": 13973 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.209, - "step": 13974 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2268, - "step": 13975 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.2227, - "step": 13976 - }, - { - "epoch": 1.72, - "learning_rate": 0.0003, - "loss": 0.221, - "step": 13977 - }, - { - "epoch": 1.73, - "learning_rate": 0.0003, - "loss": 0.2173, - "step": 13978 - }, - { - "epoch": 1.73, - "learning_rate": 0.0003, - "loss": 0.2259, - "step": 13979 - }, - { - "epoch": 1.73, - "learning_rate": 0.0003, - "loss": 0.2203, - "step": 13980 - }, - { - "epoch": 1.73, - "learning_rate": 0.0003, - "loss": 0.2305, - "step": 13981 - }, - { - "epoch": 1.73, - "learning_rate": 0.0003, - "loss": 0.2332, - "step": 13982 - }, - { - "epoch": 1.73, - "learning_rate": 0.0003, - "loss": 0.2137, - "step": 13983 - }, - { - "epoch": 1.73, - "learning_rate": 0.0003, - "loss": 0.2215, - "step": 13984 - }, - { - "epoch": 1.73, - "learning_rate": 0.0003, - "loss": 0.2222, - "step": 13985 - }, - { - "epoch": 1.73, - "learning_rate": 0.0003, - "loss": 0.211, - "step": 13986 - }, - { - "epoch": 1.73, - "learning_rate": 0.0003, - "loss": 0.2189, - "step": 13987 - }, - { - "epoch": 1.73, - "learning_rate": 0.0003, - "loss": 0.2366, - "step": 13988 - }, - { - "epoch": 1.73, - "learning_rate": 0.0003, - "loss": 0.2279, - "step": 13989 - }, - { - "epoch": 1.73, - "learning_rate": 0.0003, - "loss": 0.2286, - "step": 13990 - }, - { - "epoch": 1.73, - "learning_rate": 0.0003, - "loss": 0.2163, - "step": 13991 - }, - { - "epoch": 1.73, - "learning_rate": 0.0003, - "loss": 0.2124, - "step": 13992 - }, - { - "epoch": 1.73, - "learning_rate": 0.0003, - "loss": 0.2318, - "step": 13993 - }, - { - "epoch": 1.73, - "learning_rate": 0.0003, - "loss": 0.2321, - "step": 13994 - }, - { - "epoch": 1.73, - "learning_rate": 0.0003, - "loss": 0.2186, - "step": 13995 - }, - { - "epoch": 1.73, - "learning_rate": 0.0003, - "loss": 0.2066, - "step": 13996 - }, - { - "epoch": 1.73, - "learning_rate": 0.0003, - "loss": 0.2248, - "step": 13997 - }, - { - "epoch": 1.73, - "learning_rate": 0.0003, - "loss": 0.233, - "step": 13998 - }, - { - "epoch": 1.73, - "learning_rate": 0.0003, - "loss": 0.2162, - "step": 13999 - }, - { - "epoch": 1.73, - "learning_rate": 0.0003, - "loss": 0.2361, - "step": 14000 } ], "logging_steps": 1.0, - "max_steps": 16206, - "num_train_epochs": 2, - "save_steps": 200, + "max_steps": 762, + "num_train_epochs": 1, + "save_steps": 50, "total_flos": 0.0, "trial_name": null, "trial_params": null