{ "best_metric": null, "best_model_checkpoint": null, "epoch": 60.0, "global_step": 7440, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.81, "learning_rate": 1.3172043010752688e-05, "loss": 13.9663, "step": 100 }, { "epoch": 0.81, "eval_loss": 15.575762748718262, "eval_runtime": 98.9721, "eval_samples_per_second": 18.632, "eval_steps_per_second": 2.334, "eval_wer": 1.0, "step": 100 }, { "epoch": 1.61, "learning_rate": 2.6344086021505376e-05, "loss": 6.7623, "step": 200 }, { "epoch": 1.61, "eval_loss": 3.259247064590454, "eval_runtime": 99.4059, "eval_samples_per_second": 18.55, "eval_steps_per_second": 2.324, "eval_wer": 1.0, "step": 200 }, { "epoch": 2.42, "learning_rate": 3.978494623655914e-05, "loss": 3.0242, "step": 300 }, { "epoch": 2.42, "eval_loss": 2.9369125366210938, "eval_runtime": 98.1481, "eval_samples_per_second": 18.788, "eval_steps_per_second": 2.354, "eval_wer": 1.0, "step": 300 }, { "epoch": 3.23, "learning_rate": 5.32258064516129e-05, "loss": 2.8806, "step": 400 }, { "epoch": 3.23, "eval_loss": 2.8887438774108887, "eval_runtime": 97.5774, "eval_samples_per_second": 18.898, "eval_steps_per_second": 2.367, "eval_wer": 1.0, "step": 400 }, { "epoch": 4.03, "learning_rate": 6.666666666666667e-05, "loss": 2.8344, "step": 500 }, { "epoch": 4.03, "eval_loss": 2.8125975131988525, "eval_runtime": 97.5647, "eval_samples_per_second": 18.9, "eval_steps_per_second": 2.368, "eval_wer": 1.0, "step": 500 }, { "epoch": 4.84, "learning_rate": 8.010752688172043e-05, "loss": 2.7158, "step": 600 }, { "epoch": 4.84, "eval_loss": 2.304689884185791, "eval_runtime": 97.2319, "eval_samples_per_second": 18.965, "eval_steps_per_second": 2.376, "eval_wer": 1.003542793212754, "step": 600 }, { "epoch": 5.65, "learning_rate": 9.35483870967742e-05, "loss": 1.7164, "step": 700 }, { "epoch": 5.65, "eval_loss": 0.7104876041412354, "eval_runtime": 96.4932, "eval_samples_per_second": 19.11, "eval_steps_per_second": 2.394, "eval_wer": 0.7594629871340668, "step": 700 }, { "epoch": 6.45, "learning_rate": 0.0001, "loss": 1.0757, "step": 800 }, { "epoch": 6.45, "eval_loss": 0.5160450339317322, "eval_runtime": 97.694, "eval_samples_per_second": 18.875, "eval_steps_per_second": 2.365, "eval_wer": 0.6501025545403692, "step": 800 }, { "epoch": 7.26, "learning_rate": 0.0001, "loss": 0.9208, "step": 900 }, { "epoch": 7.26, "eval_loss": 0.43188726902008057, "eval_runtime": 101.9111, "eval_samples_per_second": 18.094, "eval_steps_per_second": 2.267, "eval_wer": 0.5842811859034123, "step": 900 }, { "epoch": 8.06, "learning_rate": 0.0001, "loss": 0.8012, "step": 1000 }, { "epoch": 8.06, "eval_loss": 0.39437660574913025, "eval_runtime": 97.2792, "eval_samples_per_second": 18.956, "eval_steps_per_second": 2.375, "eval_wer": 0.5456833861644602, "step": 1000 }, { "epoch": 8.87, "learning_rate": 0.0001, "loss": 0.7334, "step": 1100 }, { "epoch": 8.87, "eval_loss": 0.36806735396385193, "eval_runtime": 97.7448, "eval_samples_per_second": 18.865, "eval_steps_per_second": 2.363, "eval_wer": 0.5120268506432967, "step": 1100 }, { "epoch": 9.68, "learning_rate": 0.0001, "loss": 0.6839, "step": 1200 }, { "epoch": 9.68, "eval_loss": 0.35295596718788147, "eval_runtime": 104.7228, "eval_samples_per_second": 17.608, "eval_steps_per_second": 2.206, "eval_wer": 0.49822860339362296, "step": 1200 }, { "epoch": 10.48, "learning_rate": 0.0001, "loss": 0.6599, "step": 1300 }, { "epoch": 10.48, "eval_loss": 0.34405317902565, "eval_runtime": 100.6994, "eval_samples_per_second": 18.312, "eval_steps_per_second": 2.294, "eval_wer": 0.49561812418422524, "step": 1300 }, { "epoch": 11.29, "learning_rate": 0.0001, "loss": 0.6101, "step": 1400 }, { "epoch": 11.29, "eval_loss": 0.3226686716079712, "eval_runtime": 97.8943, "eval_samples_per_second": 18.837, "eval_steps_per_second": 2.36, "eval_wer": 0.4828454223382435, "step": 1400 }, { "epoch": 12.1, "learning_rate": 0.0001, "loss": 0.5844, "step": 1500 }, { "epoch": 12.1, "eval_loss": 0.34125906229019165, "eval_runtime": 98.6933, "eval_samples_per_second": 18.684, "eval_steps_per_second": 2.341, "eval_wer": 0.47445459630803655, "step": 1500 }, { "epoch": 12.9, "learning_rate": 0.0001, "loss": 0.5754, "step": 1600 }, { "epoch": 12.9, "eval_loss": 0.33336642384529114, "eval_runtime": 99.0007, "eval_samples_per_second": 18.626, "eval_steps_per_second": 2.333, "eval_wer": 0.46140220026104795, "step": 1600 }, { "epoch": 13.71, "learning_rate": 0.0001, "loss": 0.5611, "step": 1700 }, { "epoch": 13.71, "eval_loss": 0.30597391724586487, "eval_runtime": 101.2827, "eval_samples_per_second": 18.206, "eval_steps_per_second": 2.281, "eval_wer": 0.4672757784821928, "step": 1700 }, { "epoch": 14.52, "learning_rate": 0.0001, "loss": 0.5476, "step": 1800 }, { "epoch": 14.52, "eval_loss": 0.3194342851638794, "eval_runtime": 105.7302, "eval_samples_per_second": 17.441, "eval_steps_per_second": 2.185, "eval_wer": 0.44881596121573747, "step": 1800 }, { "epoch": 15.32, "learning_rate": 0.0001, "loss": 0.526, "step": 1900 }, { "epoch": 15.32, "eval_loss": 0.30019786953926086, "eval_runtime": 96.396, "eval_samples_per_second": 19.129, "eval_steps_per_second": 2.396, "eval_wer": 0.4449934738019765, "step": 1900 }, { "epoch": 16.13, "learning_rate": 0.0001, "loss": 0.5267, "step": 2000 }, { "epoch": 16.13, "eval_loss": 0.3249629735946655, "eval_runtime": 105.1317, "eval_samples_per_second": 17.54, "eval_steps_per_second": 2.197, "eval_wer": 0.43660264777176955, "step": 2000 }, { "epoch": 16.94, "learning_rate": 0.0001, "loss": 0.49, "step": 2100 }, { "epoch": 16.94, "eval_loss": 0.2999746799468994, "eval_runtime": 97.027, "eval_samples_per_second": 19.005, "eval_steps_per_second": 2.381, "eval_wer": 0.4337124743613649, "step": 2100 }, { "epoch": 17.74, "learning_rate": 0.0001, "loss": 0.4945, "step": 2200 }, { "epoch": 17.74, "eval_loss": 0.30671271681785583, "eval_runtime": 96.8855, "eval_samples_per_second": 19.033, "eval_steps_per_second": 2.384, "eval_wer": 0.43100876375163155, "step": 2200 }, { "epoch": 18.55, "learning_rate": 0.0001, "loss": 0.485, "step": 2300 }, { "epoch": 18.55, "eval_loss": 0.3134038746356964, "eval_runtime": 98.1951, "eval_samples_per_second": 18.779, "eval_steps_per_second": 2.352, "eval_wer": 0.43706880477344767, "step": 2300 }, { "epoch": 19.35, "learning_rate": 0.0001, "loss": 0.486, "step": 2400 }, { "epoch": 19.35, "eval_loss": 0.3182927072048187, "eval_runtime": 100.6349, "eval_samples_per_second": 18.324, "eval_steps_per_second": 2.295, "eval_wer": 0.43044937534961775, "step": 2400 }, { "epoch": 20.16, "learning_rate": 0.0001, "loss": 0.4617, "step": 2500 }, { "epoch": 20.16, "eval_loss": 0.3004864752292633, "eval_runtime": 102.1006, "eval_samples_per_second": 18.061, "eval_steps_per_second": 2.262, "eval_wer": 0.4238299459257878, "step": 2500 }, { "epoch": 20.97, "learning_rate": 0.0001, "loss": 0.465, "step": 2600 }, { "epoch": 20.97, "eval_loss": 0.313532292842865, "eval_runtime": 101.2873, "eval_samples_per_second": 18.206, "eval_steps_per_second": 2.281, "eval_wer": 0.4311019951519672, "step": 2600 }, { "epoch": 21.77, "learning_rate": 0.0001, "loss": 0.4414, "step": 2700 }, { "epoch": 21.77, "eval_loss": 0.3118414580821991, "eval_runtime": 97.4069, "eval_samples_per_second": 18.931, "eval_steps_per_second": 2.371, "eval_wer": 0.4256013425321648, "step": 2700 }, { "epoch": 22.58, "learning_rate": 0.0001, "loss": 0.4424, "step": 2800 }, { "epoch": 22.58, "eval_loss": 0.3086116313934326, "eval_runtime": 97.4809, "eval_samples_per_second": 18.917, "eval_steps_per_second": 2.37, "eval_wer": 0.4160917396979303, "step": 2800 }, { "epoch": 23.39, "learning_rate": 0.0001, "loss": 0.4352, "step": 2900 }, { "epoch": 23.39, "eval_loss": 0.3213385045528412, "eval_runtime": 96.5991, "eval_samples_per_second": 19.089, "eval_steps_per_second": 2.391, "eval_wer": 0.41879545030766363, "step": 2900 }, { "epoch": 24.19, "learning_rate": 0.0001, "loss": 0.4324, "step": 3000 }, { "epoch": 24.19, "eval_loss": 0.3011772036552429, "eval_runtime": 97.1915, "eval_samples_per_second": 18.973, "eval_steps_per_second": 2.377, "eval_wer": 0.4236434831251165, "step": 3000 }, { "epoch": 25.0, "learning_rate": 0.0001, "loss": 0.4246, "step": 3100 }, { "epoch": 25.0, "eval_loss": 0.30194172263145447, "eval_runtime": 100.0292, "eval_samples_per_second": 18.435, "eval_steps_per_second": 2.309, "eval_wer": 0.4165578966996084, "step": 3100 }, { "epoch": 25.81, "learning_rate": 0.0001, "loss": 0.4132, "step": 3200 }, { "epoch": 25.81, "eval_loss": 0.299437552690506, "eval_runtime": 97.7952, "eval_samples_per_second": 18.856, "eval_steps_per_second": 2.362, "eval_wer": 0.4160917396979303, "step": 3200 }, { "epoch": 26.61, "learning_rate": 0.0001, "loss": 0.4074, "step": 3300 }, { "epoch": 26.61, "eval_loss": 0.31787610054016113, "eval_runtime": 97.3925, "eval_samples_per_second": 18.934, "eval_steps_per_second": 2.372, "eval_wer": 0.41795636770464295, "step": 3300 }, { "epoch": 27.42, "learning_rate": 0.0001, "loss": 0.4031, "step": 3400 }, { "epoch": 27.42, "eval_loss": 0.296748548746109, "eval_runtime": 101.7762, "eval_samples_per_second": 18.118, "eval_steps_per_second": 2.27, "eval_wer": 0.40760768226738764, "step": 3400 }, { "epoch": 28.23, "learning_rate": 0.0001, "loss": 0.4082, "step": 3500 }, { "epoch": 28.23, "eval_loss": 0.31329259276390076, "eval_runtime": 102.7944, "eval_samples_per_second": 17.939, "eval_steps_per_second": 2.247, "eval_wer": 0.41310833488719, "step": 3500 }, { "epoch": 29.03, "learning_rate": 0.0001, "loss": 0.3912, "step": 3600 }, { "epoch": 29.03, "eval_loss": 0.3259478509426117, "eval_runtime": 98.5616, "eval_samples_per_second": 18.709, "eval_steps_per_second": 2.344, "eval_wer": 0.41133693828081297, "step": 3600 }, { "epoch": 29.84, "learning_rate": 0.0001, "loss": 0.3922, "step": 3700 }, { "epoch": 29.84, "eval_loss": 0.32406386733055115, "eval_runtime": 96.8005, "eval_samples_per_second": 19.049, "eval_steps_per_second": 2.386, "eval_wer": 0.41226925228416933, "step": 3700 }, { "epoch": 30.65, "learning_rate": 9.795698924731184e-05, "loss": 0.3851, "step": 3800 }, { "epoch": 30.65, "eval_loss": 0.29852330684661865, "eval_runtime": 105.0804, "eval_samples_per_second": 17.548, "eval_steps_per_second": 2.198, "eval_wer": 0.41133693828081297, "step": 3800 }, { "epoch": 31.45, "learning_rate": 9.526881720430108e-05, "loss": 0.3768, "step": 3900 }, { "epoch": 31.45, "eval_loss": 0.3223101794719696, "eval_runtime": 97.6458, "eval_samples_per_second": 18.885, "eval_steps_per_second": 2.366, "eval_wer": 0.41040462427745666, "step": 3900 }, { "epoch": 32.26, "learning_rate": 9.258064516129033e-05, "loss": 0.3728, "step": 4000 }, { "epoch": 32.26, "eval_loss": 0.3212699890136719, "eval_runtime": 100.4336, "eval_samples_per_second": 18.36, "eval_steps_per_second": 2.3, "eval_wer": 0.40770091366772326, "step": 4000 }, { "epoch": 33.06, "learning_rate": 8.989247311827958e-05, "loss": 0.3646, "step": 4100 }, { "epoch": 33.06, "eval_loss": 0.31770506501197815, "eval_runtime": 97.2462, "eval_samples_per_second": 18.962, "eval_steps_per_second": 2.375, "eval_wer": 0.4116166324818199, "step": 4100 }, { "epoch": 33.87, "learning_rate": 8.720430107526883e-05, "loss": 0.3681, "step": 4200 }, { "epoch": 33.87, "eval_loss": 0.3010982871055603, "eval_runtime": 99.148, "eval_samples_per_second": 18.598, "eval_steps_per_second": 2.33, "eval_wer": 0.4105910870781279, "step": 4200 }, { "epoch": 34.68, "learning_rate": 8.451612903225808e-05, "loss": 0.3634, "step": 4300 }, { "epoch": 34.68, "eval_loss": 0.3075733780860901, "eval_runtime": 99.8799, "eval_samples_per_second": 18.462, "eval_steps_per_second": 2.313, "eval_wer": 0.4069550624650382, "step": 4300 }, { "epoch": 35.48, "learning_rate": 8.182795698924732e-05, "loss": 0.3471, "step": 4400 }, { "epoch": 35.48, "eval_loss": 0.31304171681404114, "eval_runtime": 99.6768, "eval_samples_per_second": 18.5, "eval_steps_per_second": 2.317, "eval_wer": 0.40266641804959913, "step": 4400 }, { "epoch": 36.29, "learning_rate": 7.913978494623657e-05, "loss": 0.3398, "step": 4500 }, { "epoch": 36.29, "eval_loss": 0.306076318025589, "eval_runtime": 103.5936, "eval_samples_per_second": 17.8, "eval_steps_per_second": 2.23, "eval_wer": 0.4037851948536267, "step": 4500 }, { "epoch": 37.1, "learning_rate": 7.645161290322582e-05, "loss": 0.3394, "step": 4600 }, { "epoch": 37.1, "eval_loss": 0.31049424409866333, "eval_runtime": 98.5424, "eval_samples_per_second": 18.713, "eval_steps_per_second": 2.344, "eval_wer": 0.4037851948536267, "step": 4600 }, { "epoch": 37.9, "learning_rate": 7.376344086021507e-05, "loss": 0.331, "step": 4700 }, { "epoch": 37.9, "eval_loss": 0.3191221058368683, "eval_runtime": 102.0886, "eval_samples_per_second": 18.063, "eval_steps_per_second": 2.263, "eval_wer": 0.3992168562371807, "step": 4700 }, { "epoch": 38.71, "learning_rate": 7.10752688172043e-05, "loss": 0.3221, "step": 4800 }, { "epoch": 38.71, "eval_loss": 0.3119024336338043, "eval_runtime": 99.689, "eval_samples_per_second": 18.498, "eval_steps_per_second": 2.317, "eval_wer": 0.39958978183852323, "step": 4800 }, { "epoch": 39.52, "learning_rate": 6.838709677419355e-05, "loss": 0.3207, "step": 4900 }, { "epoch": 39.52, "eval_loss": 0.3276441991329193, "eval_runtime": 96.7884, "eval_samples_per_second": 19.052, "eval_steps_per_second": 2.387, "eval_wer": 0.40313257505127725, "step": 4900 }, { "epoch": 40.32, "learning_rate": 6.56989247311828e-05, "loss": 0.3186, "step": 5000 }, { "epoch": 40.32, "eval_loss": 0.3335840106010437, "eval_runtime": 98.1942, "eval_samples_per_second": 18.779, "eval_steps_per_second": 2.352, "eval_wer": 0.4032258064516129, "step": 5000 }, { "epoch": 41.13, "learning_rate": 6.301075268817205e-05, "loss": 0.3152, "step": 5100 }, { "epoch": 41.13, "eval_loss": 0.3129470944404602, "eval_runtime": 99.396, "eval_samples_per_second": 18.552, "eval_steps_per_second": 2.324, "eval_wer": 0.3941823606190565, "step": 5100 }, { "epoch": 41.94, "learning_rate": 6.0322580645161295e-05, "loss": 0.3093, "step": 5200 }, { "epoch": 41.94, "eval_loss": 0.31502029299736023, "eval_runtime": 97.1686, "eval_samples_per_second": 18.977, "eval_steps_per_second": 2.377, "eval_wer": 0.3930635838150289, "step": 5200 }, { "epoch": 42.74, "learning_rate": 5.763440860215054e-05, "loss": 0.2949, "step": 5300 }, { "epoch": 42.74, "eval_loss": 0.3235335052013397, "eval_runtime": 102.899, "eval_samples_per_second": 17.92, "eval_steps_per_second": 2.245, "eval_wer": 0.3953011374230841, "step": 5300 }, { "epoch": 43.55, "learning_rate": 5.494623655913979e-05, "loss": 0.3013, "step": 5400 }, { "epoch": 43.55, "eval_loss": 0.3291964530944824, "eval_runtime": 97.4704, "eval_samples_per_second": 18.919, "eval_steps_per_second": 2.37, "eval_wer": 0.3934365094163714, "step": 5400 }, { "epoch": 44.35, "learning_rate": 5.225806451612903e-05, "loss": 0.3092, "step": 5500 }, { "epoch": 44.35, "eval_loss": 0.3066520392894745, "eval_runtime": 96.9166, "eval_samples_per_second": 19.027, "eval_steps_per_second": 2.383, "eval_wer": 0.38616446019019207, "step": 5500 }, { "epoch": 45.16, "learning_rate": 4.956989247311828e-05, "loss": 0.2938, "step": 5600 }, { "epoch": 45.16, "eval_loss": 0.32365530729293823, "eval_runtime": 98.8953, "eval_samples_per_second": 18.646, "eval_steps_per_second": 2.336, "eval_wer": 0.38756293119522656, "step": 5600 }, { "epoch": 45.97, "learning_rate": 4.688172043010753e-05, "loss": 0.2985, "step": 5700 }, { "epoch": 45.97, "eval_loss": 0.3358381390571594, "eval_runtime": 96.7245, "eval_samples_per_second": 19.064, "eval_steps_per_second": 2.388, "eval_wer": 0.3876561625955622, "step": 5700 }, { "epoch": 46.77, "learning_rate": 4.4193548387096775e-05, "loss": 0.2943, "step": 5800 }, { "epoch": 46.77, "eval_loss": 0.3283197283744812, "eval_runtime": 98.5499, "eval_samples_per_second": 18.711, "eval_steps_per_second": 2.344, "eval_wer": 0.3928771210143576, "step": 5800 }, { "epoch": 47.58, "learning_rate": 4.1505376344086025e-05, "loss": 0.2754, "step": 5900 }, { "epoch": 47.58, "eval_loss": 0.33124613761901855, "eval_runtime": 97.2557, "eval_samples_per_second": 18.96, "eval_steps_per_second": 2.375, "eval_wer": 0.38952079060227485, "step": 5900 }, { "epoch": 48.39, "learning_rate": 3.881720430107527e-05, "loss": 0.2906, "step": 6000 }, { "epoch": 48.39, "eval_loss": 0.33012691140174866, "eval_runtime": 99.7418, "eval_samples_per_second": 18.488, "eval_steps_per_second": 2.316, "eval_wer": 0.39045310460563115, "step": 6000 }, { "epoch": 49.19, "learning_rate": 3.612903225806452e-05, "loss": 0.2751, "step": 6100 }, { "epoch": 49.19, "eval_loss": 0.3261188566684723, "eval_runtime": 98.7276, "eval_samples_per_second": 18.678, "eval_steps_per_second": 2.34, "eval_wer": 0.3873764683945553, "step": 6100 }, { "epoch": 50.0, "learning_rate": 3.344086021505377e-05, "loss": 0.2825, "step": 6200 }, { "epoch": 50.0, "eval_loss": 0.3322080671787262, "eval_runtime": 97.0188, "eval_samples_per_second": 19.007, "eval_steps_per_second": 2.381, "eval_wer": 0.38700354279321275, "step": 6200 }, { "epoch": 50.81, "learning_rate": 3.075268817204301e-05, "loss": 0.2727, "step": 6300 }, { "epoch": 50.81, "eval_loss": 0.3448057770729065, "eval_runtime": 98.9754, "eval_samples_per_second": 18.631, "eval_steps_per_second": 2.334, "eval_wer": 0.3928771210143576, "step": 6300 }, { "epoch": 51.61, "learning_rate": 2.806451612903226e-05, "loss": 0.2896, "step": 6400 }, { "epoch": 51.61, "eval_loss": 0.33276790380477905, "eval_runtime": 96.9108, "eval_samples_per_second": 19.028, "eval_steps_per_second": 2.384, "eval_wer": 0.38858847659891854, "step": 6400 }, { "epoch": 52.42, "learning_rate": 2.537634408602151e-05, "loss": 0.2753, "step": 6500 }, { "epoch": 52.42, "eval_loss": 0.32856670022010803, "eval_runtime": 105.68, "eval_samples_per_second": 17.449, "eval_steps_per_second": 2.186, "eval_wer": 0.3876561625955622, "step": 6500 }, { "epoch": 53.23, "learning_rate": 2.268817204301075e-05, "loss": 0.271, "step": 6600 }, { "epoch": 53.23, "eval_loss": 0.3287724256515503, "eval_runtime": 100.7427, "eval_samples_per_second": 18.304, "eval_steps_per_second": 2.293, "eval_wer": 0.3876561625955622, "step": 6600 }, { "epoch": 54.03, "learning_rate": 2e-05, "loss": 0.2664, "step": 6700 }, { "epoch": 54.03, "eval_loss": 0.3290824890136719, "eval_runtime": 98.5577, "eval_samples_per_second": 18.71, "eval_steps_per_second": 2.344, "eval_wer": 0.3893343278016036, "step": 6700 }, { "epoch": 54.84, "learning_rate": 1.7311827956989248e-05, "loss": 0.2491, "step": 6800 }, { "epoch": 54.84, "eval_loss": 0.33568552136421204, "eval_runtime": 103.2565, "eval_samples_per_second": 17.858, "eval_steps_per_second": 2.237, "eval_wer": 0.388215550997576, "step": 6800 }, { "epoch": 55.65, "learning_rate": 1.4623655913978495e-05, "loss": 0.2569, "step": 6900 }, { "epoch": 55.65, "eval_loss": 0.3253258466720581, "eval_runtime": 104.0214, "eval_samples_per_second": 17.727, "eval_steps_per_second": 2.221, "eval_wer": 0.3876561625955622, "step": 6900 }, { "epoch": 56.45, "learning_rate": 1.1935483870967743e-05, "loss": 0.2568, "step": 7000 }, { "epoch": 56.45, "eval_loss": 0.3199854791164398, "eval_runtime": 103.944, "eval_samples_per_second": 17.74, "eval_steps_per_second": 2.222, "eval_wer": 0.3868170799925415, "step": 7000 }, { "epoch": 57.26, "learning_rate": 9.24731182795699e-06, "loss": 0.2668, "step": 7100 }, { "epoch": 57.26, "eval_loss": 0.32368558645248413, "eval_runtime": 103.5633, "eval_samples_per_second": 17.806, "eval_steps_per_second": 2.231, "eval_wer": 0.3862576915905277, "step": 7100 }, { "epoch": 58.06, "learning_rate": 6.586021505376344e-06, "loss": 0.253, "step": 7200 }, { "epoch": 58.06, "eval_loss": 0.3248105049133301, "eval_runtime": 103.7822, "eval_samples_per_second": 17.768, "eval_steps_per_second": 2.226, "eval_wer": 0.38504568338616446, "step": 7200 }, { "epoch": 58.87, "learning_rate": 3.8978494623655915e-06, "loss": 0.2621, "step": 7300 }, { "epoch": 58.87, "eval_loss": 0.3238443434238434, "eval_runtime": 97.9464, "eval_samples_per_second": 18.827, "eval_steps_per_second": 2.358, "eval_wer": 0.38448629498415066, "step": 7300 }, { "epoch": 59.68, "learning_rate": 1.2096774193548388e-06, "loss": 0.2571, "step": 7400 }, { "epoch": 59.68, "eval_loss": 0.3273279666900635, "eval_runtime": 101.5169, "eval_samples_per_second": 18.164, "eval_steps_per_second": 2.275, "eval_wer": 0.3852321461868357, "step": 7400 }, { "epoch": 60.0, "step": 7440, "total_flos": 2.7388066347434852e+19, "train_loss": 0.8272683016715511, "train_runtime": 19767.0967, "train_samples_per_second": 12.035, "train_steps_per_second": 0.376 } ], "max_steps": 7440, "num_train_epochs": 60, "total_flos": 2.7388066347434852e+19, "trial_name": null, "trial_params": null }