{ "best_metric": 1.011842966079712, "best_model_checkpoint": "ai-light-dance_drums_ft_pretrain_wav2vec2-base-new-v3/checkpoint-198", "epoch": 99.69565217391305, "global_step": 200, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.7, "eval_loss": 65.68504333496094, "eval_runtime": 2.5882, "eval_samples_per_second": 6.568, "eval_steps_per_second": 1.159, "eval_wer": 0.9201430274135876, "step": 2 }, { "epoch": 1.7, "eval_loss": 65.31504821777344, "eval_runtime": 2.8243, "eval_samples_per_second": 6.019, "eval_steps_per_second": 1.062, "eval_wer": 0.9165673420738975, "step": 4 }, { "epoch": 2.7, "eval_loss": 63.401397705078125, "eval_runtime": 2.7045, "eval_samples_per_second": 6.286, "eval_steps_per_second": 1.109, "eval_wer": 0.8986889153754469, "step": 6 }, { "epoch": 3.7, "eval_loss": 61.84690856933594, "eval_runtime": 2.7848, "eval_samples_per_second": 6.105, "eval_steps_per_second": 1.077, "eval_wer": 0.8700834326579261, "step": 8 }, { "epoch": 4.7, "learning_rate": 0.00010499999999999999, "loss": 20.497, "step": 10 }, { "epoch": 4.7, "eval_loss": 57.46735382080078, "eval_runtime": 2.7178, "eval_samples_per_second": 6.255, "eval_steps_per_second": 1.104, "eval_wer": 0.8557806912991657, "step": 10 }, { "epoch": 5.7, "eval_loss": 51.37147903442383, "eval_runtime": 2.7102, "eval_samples_per_second": 6.273, "eval_steps_per_second": 1.107, "eval_wer": 0.9356376638855781, "step": 12 }, { "epoch": 6.7, "eval_loss": 43.46580123901367, "eval_runtime": 2.6418, "eval_samples_per_second": 6.435, "eval_steps_per_second": 1.136, "eval_wer": 0.9868891537544696, "step": 14 }, { "epoch": 7.7, "eval_loss": 33.7960319519043, "eval_runtime": 2.6634, "eval_samples_per_second": 6.383, "eval_steps_per_second": 1.126, "eval_wer": 1.0, "step": 16 }, { "epoch": 8.7, "eval_loss": 22.868000030517578, "eval_runtime": 2.6558, "eval_samples_per_second": 6.401, "eval_steps_per_second": 1.13, "eval_wer": 1.0, "step": 18 }, { "epoch": 9.7, "learning_rate": 0.00025499999999999996, "loss": 13.2039, "step": 20 }, { "epoch": 9.7, "eval_loss": 12.010748863220215, "eval_runtime": 2.6219, "eval_samples_per_second": 6.484, "eval_steps_per_second": 1.144, "eval_wer": 1.0, "step": 20 }, { "epoch": 10.7, "eval_loss": 4.675407886505127, "eval_runtime": 2.566, "eval_samples_per_second": 6.625, "eval_steps_per_second": 1.169, "eval_wer": 1.0, "step": 22 }, { "epoch": 11.7, "eval_loss": 2.5355348587036133, "eval_runtime": 2.5403, "eval_samples_per_second": 6.692, "eval_steps_per_second": 1.181, "eval_wer": 1.0, "step": 24 }, { "epoch": 12.7, "eval_loss": 2.2340898513793945, "eval_runtime": 2.5381, "eval_samples_per_second": 6.698, "eval_steps_per_second": 1.182, "eval_wer": 1.0, "step": 26 }, { "epoch": 13.7, "eval_loss": 2.8692574501037598, "eval_runtime": 2.5952, "eval_samples_per_second": 6.55, "eval_steps_per_second": 1.156, "eval_wer": 1.0, "step": 28 }, { "epoch": 14.7, "learning_rate": 0.0002883333333333333, "loss": 3.0397, "step": 30 }, { "epoch": 14.7, "eval_loss": 3.508324384689331, "eval_runtime": 2.5954, "eval_samples_per_second": 6.55, "eval_steps_per_second": 1.156, "eval_wer": 1.0, "step": 30 }, { "epoch": 15.7, "eval_loss": 3.1664485931396484, "eval_runtime": 2.587, "eval_samples_per_second": 6.571, "eval_steps_per_second": 1.16, "eval_wer": 1.0, "step": 32 }, { "epoch": 16.7, "eval_loss": 2.6171875, "eval_runtime": 2.5928, "eval_samples_per_second": 6.557, "eval_steps_per_second": 1.157, "eval_wer": 1.0, "step": 34 }, { "epoch": 17.7, "eval_loss": 2.2690131664276123, "eval_runtime": 2.5759, "eval_samples_per_second": 6.6, "eval_steps_per_second": 1.165, "eval_wer": 1.0, "step": 36 }, { "epoch": 18.7, "eval_loss": 2.380885124206543, "eval_runtime": 2.5845, "eval_samples_per_second": 6.578, "eval_steps_per_second": 1.161, "eval_wer": 1.0, "step": 38 }, { "epoch": 19.7, "learning_rate": 0.00027166666666666664, "loss": 2.133, "step": 40 }, { "epoch": 19.7, "eval_loss": 2.2537014484405518, "eval_runtime": 2.5569, "eval_samples_per_second": 6.649, "eval_steps_per_second": 1.173, "eval_wer": 1.0, "step": 40 }, { "epoch": 20.7, "eval_loss": 1.9851531982421875, "eval_runtime": 2.532, "eval_samples_per_second": 6.714, "eval_steps_per_second": 1.185, "eval_wer": 1.0, "step": 42 }, { "epoch": 21.7, "eval_loss": 2.072378396987915, "eval_runtime": 2.6203, "eval_samples_per_second": 6.488, "eval_steps_per_second": 1.145, "eval_wer": 1.0, "step": 44 }, { "epoch": 22.7, "eval_loss": 2.00761342048645, "eval_runtime": 2.532, "eval_samples_per_second": 6.714, "eval_steps_per_second": 1.185, "eval_wer": 1.0, "step": 46 }, { "epoch": 23.7, "eval_loss": 1.94607675075531, "eval_runtime": 2.5261, "eval_samples_per_second": 6.73, "eval_steps_per_second": 1.188, "eval_wer": 1.0, "step": 48 }, { "epoch": 24.7, "learning_rate": 0.00025499999999999996, "loss": 1.8964, "step": 50 }, { "epoch": 24.7, "eval_loss": 2.0850636959075928, "eval_runtime": 2.5842, "eval_samples_per_second": 6.578, "eval_steps_per_second": 1.161, "eval_wer": 1.0, "step": 50 }, { "epoch": 25.7, "eval_loss": 2.0501198768615723, "eval_runtime": 2.5619, "eval_samples_per_second": 6.636, "eval_steps_per_second": 1.171, "eval_wer": 1.0, "step": 52 }, { "epoch": 26.7, "eval_loss": 1.8149293661117554, "eval_runtime": 2.5646, "eval_samples_per_second": 6.629, "eval_steps_per_second": 1.17, "eval_wer": 1.0, "step": 54 }, { "epoch": 27.7, "eval_loss": 1.8059440851211548, "eval_runtime": 2.5604, "eval_samples_per_second": 6.64, "eval_steps_per_second": 1.172, "eval_wer": 1.0, "step": 56 }, { "epoch": 28.7, "eval_loss": 1.9727060794830322, "eval_runtime": 2.5065, "eval_samples_per_second": 6.782, "eval_steps_per_second": 1.197, "eval_wer": 1.0, "step": 58 }, { "epoch": 29.7, "learning_rate": 0.0002383333333333333, "loss": 1.8599, "step": 60 }, { "epoch": 29.7, "eval_loss": 1.7996188402175903, "eval_runtime": 2.5606, "eval_samples_per_second": 6.639, "eval_steps_per_second": 1.172, "eval_wer": 1.0, "step": 60 }, { "epoch": 30.7, "eval_loss": 1.64518141746521, "eval_runtime": 2.5395, "eval_samples_per_second": 6.694, "eval_steps_per_second": 1.181, "eval_wer": 1.0, "step": 62 }, { "epoch": 31.7, "eval_loss": 1.8070778846740723, "eval_runtime": 2.5418, "eval_samples_per_second": 6.688, "eval_steps_per_second": 1.18, "eval_wer": 1.0, "step": 64 }, { "epoch": 32.7, "eval_loss": 1.7773442268371582, "eval_runtime": 2.5825, "eval_samples_per_second": 6.583, "eval_steps_per_second": 1.162, "eval_wer": 1.0, "step": 66 }, { "epoch": 33.7, "eval_loss": 1.6233692169189453, "eval_runtime": 2.5954, "eval_samples_per_second": 6.55, "eval_steps_per_second": 1.156, "eval_wer": 1.0, "step": 68 }, { "epoch": 34.7, "learning_rate": 0.00022166666666666667, "loss": 1.7166, "step": 70 }, { "epoch": 34.7, "eval_loss": 1.6564326286315918, "eval_runtime": 2.5596, "eval_samples_per_second": 6.642, "eval_steps_per_second": 1.172, "eval_wer": 1.0, "step": 70 }, { "epoch": 35.7, "eval_loss": 1.6549872159957886, "eval_runtime": 2.5502, "eval_samples_per_second": 6.666, "eval_steps_per_second": 1.176, "eval_wer": 1.0, "step": 72 }, { "epoch": 36.7, "eval_loss": 1.565232753753662, "eval_runtime": 2.5958, "eval_samples_per_second": 6.549, "eval_steps_per_second": 1.156, "eval_wer": 1.0, "step": 74 }, { "epoch": 37.7, "eval_loss": 1.5213314294815063, "eval_runtime": 2.6219, "eval_samples_per_second": 6.484, "eval_steps_per_second": 1.144, "eval_wer": 0.9952324195470799, "step": 76 }, { "epoch": 38.7, "eval_loss": 1.47950279712677, "eval_runtime": 2.6468, "eval_samples_per_second": 6.423, "eval_steps_per_second": 1.133, "eval_wer": 0.9856972586412396, "step": 78 }, { "epoch": 39.7, "learning_rate": 0.000205, "loss": 1.4764, "step": 80 }, { "epoch": 39.7, "eval_loss": 1.4402477741241455, "eval_runtime": 2.6428, "eval_samples_per_second": 6.433, "eval_steps_per_second": 1.135, "eval_wer": 0.9868891537544696, "step": 80 }, { "epoch": 40.7, "eval_loss": 1.4424933195114136, "eval_runtime": 2.631, "eval_samples_per_second": 6.461, "eval_steps_per_second": 1.14, "eval_wer": 0.9415971394517283, "step": 82 }, { "epoch": 41.7, "eval_loss": 1.4473284482955933, "eval_runtime": 2.6449, "eval_samples_per_second": 6.427, "eval_steps_per_second": 1.134, "eval_wer": 0.8462455303933254, "step": 84 }, { "epoch": 42.7, "eval_loss": 1.3785685300827026, "eval_runtime": 2.6492, "eval_samples_per_second": 6.417, "eval_steps_per_second": 1.132, "eval_wer": 0.899880810488677, "step": 86 }, { "epoch": 43.7, "eval_loss": 1.460979700088501, "eval_runtime": 2.6782, "eval_samples_per_second": 6.348, "eval_steps_per_second": 1.12, "eval_wer": 0.8486293206197855, "step": 88 }, { "epoch": 44.7, "learning_rate": 0.00018833333333333332, "loss": 1.3782, "step": 90 }, { "epoch": 44.7, "eval_loss": 1.6983370780944824, "eval_runtime": 2.6416, "eval_samples_per_second": 6.436, "eval_steps_per_second": 1.136, "eval_wer": 0.8498212157330155, "step": 90 }, { "epoch": 45.7, "eval_loss": 1.5572391748428345, "eval_runtime": 2.6072, "eval_samples_per_second": 6.52, "eval_steps_per_second": 1.151, "eval_wer": 0.9129916567342073, "step": 92 }, { "epoch": 46.7, "eval_loss": 1.6036518812179565, "eval_runtime": 2.6041, "eval_samples_per_second": 6.528, "eval_steps_per_second": 1.152, "eval_wer": 0.8128724672228844, "step": 94 }, { "epoch": 47.7, "eval_loss": 1.6874778270721436, "eval_runtime": 2.5174, "eval_samples_per_second": 6.753, "eval_steps_per_second": 1.192, "eval_wer": 0.7151370679380215, "step": 96 }, { "epoch": 48.7, "eval_loss": 1.6261805295944214, "eval_runtime": 2.5248, "eval_samples_per_second": 6.733, "eval_steps_per_second": 1.188, "eval_wer": 0.7783075089392133, "step": 98 }, { "epoch": 49.7, "learning_rate": 0.00017166666666666665, "loss": 1.3406, "step": 100 }, { "epoch": 49.7, "eval_loss": 1.6008760929107666, "eval_runtime": 2.5052, "eval_samples_per_second": 6.786, "eval_steps_per_second": 1.197, "eval_wer": 0.7306317044100119, "step": 100 }, { "epoch": 50.7, "eval_loss": 1.5744612216949463, "eval_runtime": 2.5272, "eval_samples_per_second": 6.727, "eval_steps_per_second": 1.187, "eval_wer": 0.6758045292014303, "step": 102 }, { "epoch": 51.7, "eval_loss": 1.5347764492034912, "eval_runtime": 2.562, "eval_samples_per_second": 6.636, "eval_steps_per_second": 1.171, "eval_wer": 0.6805721096543504, "step": 104 }, { "epoch": 52.7, "eval_loss": 1.5455317497253418, "eval_runtime": 2.5351, "eval_samples_per_second": 6.706, "eval_steps_per_second": 1.183, "eval_wer": 0.6591179976162098, "step": 106 }, { "epoch": 53.7, "eval_loss": 1.4915562868118286, "eval_runtime": 2.5349, "eval_samples_per_second": 6.706, "eval_steps_per_second": 1.183, "eval_wer": 0.6293206197854588, "step": 108 }, { "epoch": 54.7, "learning_rate": 0.000155, "loss": 1.1939, "step": 110 }, { "epoch": 54.7, "eval_loss": 1.399192214012146, "eval_runtime": 2.5718, "eval_samples_per_second": 6.61, "eval_steps_per_second": 1.166, "eval_wer": 0.6317044100119189, "step": 110 }, { "epoch": 55.7, "eval_loss": 1.3632481098175049, "eval_runtime": 2.531, "eval_samples_per_second": 6.717, "eval_steps_per_second": 1.185, "eval_wer": 0.6078665077473182, "step": 112 }, { "epoch": 56.7, "eval_loss": 1.297105073928833, "eval_runtime": 2.5234, "eval_samples_per_second": 6.737, "eval_steps_per_second": 1.189, "eval_wer": 0.6126340882002383, "step": 114 }, { "epoch": 57.7, "eval_loss": 1.2397348880767822, "eval_runtime": 2.589, "eval_samples_per_second": 6.566, "eval_steps_per_second": 1.159, "eval_wer": 0.6257449344457687, "step": 116 }, { "epoch": 58.7, "eval_loss": 1.2213208675384521, "eval_runtime": 2.5427, "eval_samples_per_second": 6.686, "eval_steps_per_second": 1.18, "eval_wer": 0.6114421930870083, "step": 118 }, { "epoch": 59.7, "learning_rate": 0.00013833333333333333, "loss": 1.2298, "step": 120 }, { "epoch": 59.7, "eval_loss": 1.270306944847107, "eval_runtime": 2.5565, "eval_samples_per_second": 6.65, "eval_steps_per_second": 1.173, "eval_wer": 0.600715137067938, "step": 120 }, { "epoch": 60.7, "eval_loss": 1.328464388847351, "eval_runtime": 2.5828, "eval_samples_per_second": 6.582, "eval_steps_per_second": 1.162, "eval_wer": 0.5935637663885578, "step": 122 }, { "epoch": 61.7, "eval_loss": 1.4112215042114258, "eval_runtime": 2.5426, "eval_samples_per_second": 6.686, "eval_steps_per_second": 1.18, "eval_wer": 0.599523241954708, "step": 124 }, { "epoch": 62.7, "eval_loss": 1.4663811922073364, "eval_runtime": 2.5264, "eval_samples_per_second": 6.729, "eval_steps_per_second": 1.187, "eval_wer": 0.599523241954708, "step": 126 }, { "epoch": 63.7, "eval_loss": 1.5034104585647583, "eval_runtime": 2.5056, "eval_samples_per_second": 6.785, "eval_steps_per_second": 1.197, "eval_wer": 0.6042908224076281, "step": 128 }, { "epoch": 64.7, "learning_rate": 0.00012166666666666665, "loss": 1.1321, "step": 130 }, { "epoch": 64.7, "eval_loss": 1.4717862606048584, "eval_runtime": 2.5441, "eval_samples_per_second": 6.682, "eval_steps_per_second": 1.179, "eval_wer": 0.6126340882002383, "step": 130 }, { "epoch": 65.7, "eval_loss": 1.4656554460525513, "eval_runtime": 2.5454, "eval_samples_per_second": 6.679, "eval_steps_per_second": 1.179, "eval_wer": 0.6293206197854588, "step": 132 }, { "epoch": 66.7, "eval_loss": 1.4940413236618042, "eval_runtime": 2.5574, "eval_samples_per_second": 6.647, "eval_steps_per_second": 1.173, "eval_wer": 0.600715137067938, "step": 134 }, { "epoch": 67.7, "eval_loss": 1.5150542259216309, "eval_runtime": 2.5242, "eval_samples_per_second": 6.735, "eval_steps_per_second": 1.189, "eval_wer": 0.5899880810488677, "step": 136 }, { "epoch": 68.7, "eval_loss": 1.4332056045532227, "eval_runtime": 2.5934, "eval_samples_per_second": 6.555, "eval_steps_per_second": 1.157, "eval_wer": 0.601907032181168, "step": 138 }, { "epoch": 69.7, "learning_rate": 0.00010499999999999999, "loss": 1.068, "step": 140 }, { "epoch": 69.7, "eval_loss": 1.317719578742981, "eval_runtime": 2.5535, "eval_samples_per_second": 6.658, "eval_steps_per_second": 1.175, "eval_wer": 0.6138259833134684, "step": 140 }, { "epoch": 70.7, "eval_loss": 1.2635740041732788, "eval_runtime": 2.5266, "eval_samples_per_second": 6.728, "eval_steps_per_second": 1.187, "eval_wer": 0.6138259833134684, "step": 142 }, { "epoch": 71.7, "eval_loss": 1.2209337949752808, "eval_runtime": 2.5438, "eval_samples_per_second": 6.683, "eval_steps_per_second": 1.179, "eval_wer": 0.600715137067938, "step": 144 }, { "epoch": 72.7, "eval_loss": 1.1463706493377686, "eval_runtime": 2.5299, "eval_samples_per_second": 6.72, "eval_steps_per_second": 1.186, "eval_wer": 0.601907032181168, "step": 146 }, { "epoch": 73.7, "eval_loss": 1.0894441604614258, "eval_runtime": 2.5089, "eval_samples_per_second": 6.776, "eval_steps_per_second": 1.196, "eval_wer": 0.6245530393325387, "step": 148 }, { "epoch": 74.7, "learning_rate": 8.833333333333333e-05, "loss": 1.0462, "step": 150 }, { "epoch": 74.7, "eval_loss": 1.0838207006454468, "eval_runtime": 2.5093, "eval_samples_per_second": 6.775, "eval_steps_per_second": 1.196, "eval_wer": 0.6245530393325387, "step": 150 }, { "epoch": 75.7, "eval_loss": 1.0775409936904907, "eval_runtime": 2.5517, "eval_samples_per_second": 6.662, "eval_steps_per_second": 1.176, "eval_wer": 0.6221692491060786, "step": 152 }, { "epoch": 76.7, "eval_loss": 1.0624889135360718, "eval_runtime": 2.5824, "eval_samples_per_second": 6.583, "eval_steps_per_second": 1.162, "eval_wer": 0.6114421930870083, "step": 154 }, { "epoch": 77.7, "eval_loss": 1.052101492881775, "eval_runtime": 2.5652, "eval_samples_per_second": 6.627, "eval_steps_per_second": 1.17, "eval_wer": 0.6042908224076281, "step": 156 }, { "epoch": 78.7, "eval_loss": 1.045043706893921, "eval_runtime": 2.5323, "eval_samples_per_second": 6.713, "eval_steps_per_second": 1.185, "eval_wer": 0.599523241954708, "step": 158 }, { "epoch": 79.7, "learning_rate": 7.166666666666667e-05, "loss": 1.0199, "step": 160 }, { "epoch": 79.7, "eval_loss": 1.0607061386108398, "eval_runtime": 2.5995, "eval_samples_per_second": 6.54, "eval_steps_per_second": 1.154, "eval_wer": 0.5947556615017878, "step": 160 }, { "epoch": 80.7, "eval_loss": 1.0569047927856445, "eval_runtime": 2.5398, "eval_samples_per_second": 6.694, "eval_steps_per_second": 1.181, "eval_wer": 0.5923718712753278, "step": 162 }, { "epoch": 81.7, "eval_loss": 1.0500773191452026, "eval_runtime": 2.5189, "eval_samples_per_second": 6.749, "eval_steps_per_second": 1.191, "eval_wer": 0.5911799761620977, "step": 164 }, { "epoch": 82.7, "eval_loss": 1.051140546798706, "eval_runtime": 2.5362, "eval_samples_per_second": 6.703, "eval_steps_per_second": 1.183, "eval_wer": 0.5887961859356377, "step": 166 }, { "epoch": 83.7, "eval_loss": 1.0690089464187622, "eval_runtime": 2.5428, "eval_samples_per_second": 6.686, "eval_steps_per_second": 1.18, "eval_wer": 0.5828367103694875, "step": 168 }, { "epoch": 84.7, "learning_rate": 5.499999999999999e-05, "loss": 0.9651, "step": 170 }, { "epoch": 84.7, "eval_loss": 1.0684703588485718, "eval_runtime": 2.5471, "eval_samples_per_second": 6.674, "eval_steps_per_second": 1.178, "eval_wer": 0.5804529201430274, "step": 170 }, { "epoch": 85.7, "eval_loss": 1.0487909317016602, "eval_runtime": 2.4883, "eval_samples_per_second": 6.832, "eval_steps_per_second": 1.206, "eval_wer": 0.5864123957091776, "step": 172 }, { "epoch": 86.7, "eval_loss": 1.031644344329834, "eval_runtime": 2.5435, "eval_samples_per_second": 6.684, "eval_steps_per_second": 1.179, "eval_wer": 0.5899880810488677, "step": 174 }, { "epoch": 87.7, "eval_loss": 1.0346258878707886, "eval_runtime": 2.5551, "eval_samples_per_second": 6.653, "eval_steps_per_second": 1.174, "eval_wer": 0.5899880810488677, "step": 176 }, { "epoch": 88.7, "eval_loss": 1.0490374565124512, "eval_runtime": 2.5304, "eval_samples_per_second": 6.718, "eval_steps_per_second": 1.186, "eval_wer": 0.5828367103694875, "step": 178 }, { "epoch": 89.7, "learning_rate": 3.833333333333333e-05, "loss": 0.9867, "step": 180 }, { "epoch": 89.7, "eval_loss": 1.046677827835083, "eval_runtime": 2.5362, "eval_samples_per_second": 6.703, "eval_steps_per_second": 1.183, "eval_wer": 0.5828367103694875, "step": 180 }, { "epoch": 90.7, "eval_loss": 1.0315073728561401, "eval_runtime": 2.5361, "eval_samples_per_second": 6.703, "eval_steps_per_second": 1.183, "eval_wer": 0.5887961859356377, "step": 182 }, { "epoch": 91.7, "eval_loss": 1.0205892324447632, "eval_runtime": 2.5305, "eval_samples_per_second": 6.718, "eval_steps_per_second": 1.186, "eval_wer": 0.5911799761620977, "step": 184 }, { "epoch": 92.7, "eval_loss": 1.0165022611618042, "eval_runtime": 2.5148, "eval_samples_per_second": 6.76, "eval_steps_per_second": 1.193, "eval_wer": 0.5923718712753278, "step": 186 }, { "epoch": 93.7, "eval_loss": 1.0147016048431396, "eval_runtime": 2.5058, "eval_samples_per_second": 6.784, "eval_steps_per_second": 1.197, "eval_wer": 0.5899880810488677, "step": 188 }, { "epoch": 94.7, "learning_rate": 2.1666666666666664e-05, "loss": 0.9332, "step": 190 }, { "epoch": 94.7, "eval_loss": 1.0174245834350586, "eval_runtime": 2.538, "eval_samples_per_second": 6.698, "eval_steps_per_second": 1.182, "eval_wer": 0.5876042908224076, "step": 190 }, { "epoch": 95.7, "eval_loss": 1.0195481777191162, "eval_runtime": 2.5587, "eval_samples_per_second": 6.644, "eval_steps_per_second": 1.172, "eval_wer": 0.5852205005959475, "step": 192 }, { "epoch": 96.7, "eval_loss": 1.0195115804672241, "eval_runtime": 2.5251, "eval_samples_per_second": 6.732, "eval_steps_per_second": 1.188, "eval_wer": 0.5840286054827175, "step": 194 }, { "epoch": 97.7, "eval_loss": 1.015172004699707, "eval_runtime": 2.5398, "eval_samples_per_second": 6.694, "eval_steps_per_second": 1.181, "eval_wer": 0.5840286054827175, "step": 196 }, { "epoch": 98.7, "eval_loss": 1.011842966079712, "eval_runtime": 2.6053, "eval_samples_per_second": 6.525, "eval_steps_per_second": 1.151, "eval_wer": 0.5852205005959475, "step": 198 }, { "epoch": 99.7, "learning_rate": 4.9999999999999996e-06, "loss": 0.9299, "step": 200 }, { "epoch": 99.7, "eval_loss": 1.0128355026245117, "eval_runtime": 2.5227, "eval_samples_per_second": 6.739, "eval_steps_per_second": 1.189, "eval_wer": 0.5852205005959475, "step": 200 }, { "epoch": 99.7, "step": 200, "total_flos": 1.8368228141544445e+18, "train_loss": 2.952321643829346, "train_runtime": 3905.0975, "train_samples_per_second": 4.584, "train_steps_per_second": 0.051 } ], "max_steps": 200, "num_train_epochs": 100, "total_flos": 1.8368228141544445e+18, "trial_name": null, "trial_params": null }