{ "best_metric": null, "best_model_checkpoint": null, "epoch": 5.0, "global_step": 11395, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.04, "eval_loss": Infinity, "eval_runtime": 762.0088, "eval_samples_per_second": 19.376, "eval_steps_per_second": 2.423, "eval_wer": 1.0, "step": 100 }, { "epoch": 0.09, "eval_loss": Infinity, "eval_runtime": 760.7665, "eval_samples_per_second": 19.408, "eval_steps_per_second": 2.427, "eval_wer": 0.9983381717130623, "step": 200 }, { "epoch": 0.13, "eval_loss": Infinity, "eval_runtime": 758.492, "eval_samples_per_second": 19.466, "eval_steps_per_second": 2.434, "eval_wer": 0.7671578598961529, "step": 300 }, { "epoch": 0.18, "eval_loss": Infinity, "eval_runtime": 763.9298, "eval_samples_per_second": 19.328, "eval_steps_per_second": 2.416, "eval_wer": 0.6919342715882527, "step": 400 }, { "epoch": 0.22, "learning_rate": 0.000996, "loss": 2.9929, "step": 500 }, { "epoch": 0.22, "eval_loss": Infinity, "eval_runtime": 771.5199, "eval_samples_per_second": 19.138, "eval_steps_per_second": 2.393, "eval_wer": 0.6265920108122272, "step": 500 }, { "epoch": 0.26, "eval_loss": Infinity, "eval_runtime": 768.8673, "eval_samples_per_second": 19.204, "eval_steps_per_second": 2.401, "eval_wer": 0.5512649892084595, "step": 600 }, { "epoch": 0.31, "eval_loss": Infinity, "eval_runtime": 774.562, "eval_samples_per_second": 19.062, "eval_steps_per_second": 2.383, "eval_wer": 0.508133304831714, "step": 700 }, { "epoch": 0.35, "eval_loss": Infinity, "eval_runtime": 770.4155, "eval_samples_per_second": 19.165, "eval_steps_per_second": 2.396, "eval_wer": 0.4944870053302625, "step": 800 }, { "epoch": 0.39, "eval_loss": Infinity, "eval_runtime": 769.5888, "eval_samples_per_second": 19.186, "eval_steps_per_second": 2.399, "eval_wer": 0.4720419801270161, "step": 900 }, { "epoch": 0.44, "learning_rate": 0.0009542909591555759, "loss": 0.5311, "step": 1000 }, { "epoch": 0.44, "eval_loss": Infinity, "eval_runtime": 772.8626, "eval_samples_per_second": 19.104, "eval_steps_per_second": 2.389, "eval_wer": 0.4387433544107405, "step": 1000 }, { "epoch": 0.48, "eval_loss": Infinity, "eval_runtime": 769.5289, "eval_samples_per_second": 19.187, "eval_steps_per_second": 2.399, "eval_wer": 0.4410533646851146, "step": 1100 }, { "epoch": 0.53, "eval_loss": Infinity, "eval_runtime": 780.8054, "eval_samples_per_second": 18.91, "eval_steps_per_second": 2.364, "eval_wer": 0.44290826845767167, "step": 1200 }, { "epoch": 0.57, "eval_loss": Infinity, "eval_runtime": 774.2302, "eval_samples_per_second": 19.071, "eval_steps_per_second": 2.384, "eval_wer": 0.43216499679356785, "step": 1300 }, { "epoch": 0.61, "eval_loss": Infinity, "eval_runtime": 768.9729, "eval_samples_per_second": 19.201, "eval_steps_per_second": 2.401, "eval_wer": 0.4531826425138428, "step": 1400 }, { "epoch": 0.66, "learning_rate": 0.0009083983478659936, "loss": 0.4654, "step": 1500 }, { "epoch": 0.66, "eval_loss": Infinity, "eval_runtime": 777.4905, "eval_samples_per_second": 18.991, "eval_steps_per_second": 2.374, "eval_wer": 0.44915563952806836, "step": 1500 }, { "epoch": 0.7, "eval_loss": Infinity, "eval_runtime": 773.9985, "eval_samples_per_second": 19.076, "eval_steps_per_second": 2.385, "eval_wer": 0.3878817550561643, "step": 1600 }, { "epoch": 0.75, "eval_loss": Infinity, "eval_runtime": 773.8841, "eval_samples_per_second": 19.079, "eval_steps_per_second": 2.385, "eval_wer": 0.3835927210541922, "step": 1700 }, { "epoch": 0.79, "eval_loss": Infinity, "eval_runtime": 773.515, "eval_samples_per_second": 19.088, "eval_steps_per_second": 2.387, "eval_wer": 0.37425614221388626, "step": 1800 }, { "epoch": 0.83, "eval_loss": Infinity, "eval_runtime": 774.3742, "eval_samples_per_second": 19.067, "eval_steps_per_second": 2.384, "eval_wer": 0.36867074423704155, "step": 1900 }, { "epoch": 0.88, "learning_rate": 0.0008625975217989904, "loss": 0.4254, "step": 2000 }, { "epoch": 0.88, "eval_loss": Infinity, "eval_runtime": 774.0591, "eval_samples_per_second": 19.075, "eval_steps_per_second": 2.385, "eval_wer": 0.3792830003930465, "step": 2000 }, { "epoch": 0.92, "eval_loss": Infinity, "eval_runtime": 768.0215, "eval_samples_per_second": 19.225, "eval_steps_per_second": 2.404, "eval_wer": 0.3766006302535495, "step": 2100 }, { "epoch": 0.97, "eval_loss": Infinity, "eval_runtime": 772.2372, "eval_samples_per_second": 19.12, "eval_steps_per_second": 2.39, "eval_wer": 0.3705256480095986, "step": 2200 }, { "epoch": 1.01, "eval_loss": Infinity, "eval_runtime": 767.2028, "eval_samples_per_second": 19.245, "eval_steps_per_second": 2.406, "eval_wer": 0.3271802014880604, "step": 2300 }, { "epoch": 1.05, "eval_loss": Infinity, "eval_runtime": 768.4281, "eval_samples_per_second": 19.215, "eval_steps_per_second": 2.402, "eval_wer": 0.31850559574130644, "step": 2400 }, { "epoch": 1.1, "learning_rate": 0.000816704910509408, "loss": 0.3997, "step": 2500 }, { "epoch": 1.1, "eval_loss": Infinity, "eval_runtime": 767.2666, "eval_samples_per_second": 19.244, "eval_steps_per_second": 2.406, "eval_wer": 0.3244426669241006, "step": 2500 }, { "epoch": 1.14, "eval_loss": Infinity, "eval_runtime": 767.2447, "eval_samples_per_second": 19.244, "eval_steps_per_second": 2.406, "eval_wer": 0.30816916170761477, "step": 2600 }, { "epoch": 1.18, "eval_loss": Infinity, "eval_runtime": 771.1785, "eval_samples_per_second": 19.146, "eval_steps_per_second": 2.394, "eval_wer": 0.30403872542597277, "step": 2700 }, { "epoch": 1.23, "eval_loss": Infinity, "eval_runtime": 761.2544, "eval_samples_per_second": 19.396, "eval_steps_per_second": 2.425, "eval_wer": 0.30282510808779417, "step": 2800 }, { "epoch": 1.27, "eval_loss": Infinity, "eval_runtime": 770.9042, "eval_samples_per_second": 19.153, "eval_steps_per_second": 2.395, "eval_wer": 0.3112101006061191, "step": 2900 }, { "epoch": 1.32, "learning_rate": 0.0007709040844424048, "loss": 0.3668, "step": 3000 }, { "epoch": 1.32, "eval_loss": Infinity, "eval_runtime": 763.6174, "eval_samples_per_second": 19.336, "eval_steps_per_second": 2.417, "eval_wer": 0.31098944290826847, "step": 3000 }, { "epoch": 1.36, "eval_loss": Infinity, "eval_runtime": 765.7415, "eval_samples_per_second": 19.282, "eval_steps_per_second": 2.411, "eval_wer": 0.3066521400348915, "step": 3100 }, { "epoch": 1.4, "eval_loss": Infinity, "eval_runtime": 762.1465, "eval_samples_per_second": 19.373, "eval_steps_per_second": 2.422, "eval_wer": 0.29612952606863835, "step": 3200 }, { "epoch": 1.45, "eval_loss": Infinity, "eval_runtime": 764.1293, "eval_samples_per_second": 19.323, "eval_steps_per_second": 2.416, "eval_wer": 0.3080933106239786, "step": 3300 }, { "epoch": 1.49, "eval_loss": Infinity, "eval_runtime": 764.6533, "eval_samples_per_second": 19.309, "eval_steps_per_second": 2.414, "eval_wer": 0.2936195447555871, "step": 3400 }, { "epoch": 1.54, "learning_rate": 0.0007250114731528225, "loss": 0.3645, "step": 3500 }, { "epoch": 1.54, "eval_loss": Infinity, "eval_runtime": 762.2683, "eval_samples_per_second": 19.37, "eval_steps_per_second": 2.422, "eval_wer": 0.30368015666696546, "step": 3500 }, { "epoch": 1.58, "eval_loss": Infinity, "eval_runtime": 760.0026, "eval_samples_per_second": 19.428, "eval_steps_per_second": 2.429, "eval_wer": 0.2973914122782218, "step": 3600 }, { "epoch": 1.62, "eval_loss": Infinity, "eval_runtime": 760.5942, "eval_samples_per_second": 19.412, "eval_steps_per_second": 2.427, "eval_wer": 0.30096330876217925, "step": 3700 }, { "epoch": 1.67, "eval_loss": Infinity, "eval_runtime": 761.2356, "eval_samples_per_second": 19.396, "eval_steps_per_second": 2.425, "eval_wer": 0.2985498651919377, "step": 3800 }, { "epoch": 1.71, "eval_loss": Infinity, "eval_runtime": 767.0946, "eval_samples_per_second": 19.248, "eval_steps_per_second": 2.406, "eval_wer": 0.2975775922107833, "step": 3900 }, { "epoch": 1.76, "learning_rate": 0.00067911886186324, "loss": 0.3624, "step": 4000 }, { "epoch": 1.76, "eval_loss": Infinity, "eval_runtime": 764.3373, "eval_samples_per_second": 19.317, "eval_steps_per_second": 2.415, "eval_wer": 0.292757600623358, "step": 4000 }, { "epoch": 1.8, "eval_loss": Infinity, "eval_runtime": 778.1044, "eval_samples_per_second": 18.976, "eval_steps_per_second": 2.372, "eval_wer": 0.2859516897552768, "step": 4100 }, { "epoch": 1.84, "eval_loss": Infinity, "eval_runtime": 780.7174, "eval_samples_per_second": 18.912, "eval_steps_per_second": 2.364, "eval_wer": 0.29222664303790485, "step": 4200 }, { "epoch": 1.89, "eval_loss": Infinity, "eval_runtime": 778.463, "eval_samples_per_second": 18.967, "eval_steps_per_second": 2.371, "eval_wer": 0.2865929761896553, "step": 4300 }, { "epoch": 1.93, "eval_loss": Infinity, "eval_runtime": 777.1309, "eval_samples_per_second": 18.999, "eval_steps_per_second": 2.375, "eval_wer": 0.2775529061308362, "step": 4400 }, { "epoch": 1.97, "learning_rate": 0.0006332262505736577, "loss": 0.3527, "step": 4500 }, { "epoch": 1.97, "eval_loss": Infinity, "eval_runtime": 776.0915, "eval_samples_per_second": 19.025, "eval_steps_per_second": 2.379, "eval_wer": 0.27924921218306314, "step": 4500 }, { "epoch": 2.02, "eval_loss": Infinity, "eval_runtime": 777.8615, "eval_samples_per_second": 18.982, "eval_steps_per_second": 2.373, "eval_wer": 0.2857655098227153, "step": 4600 }, { "epoch": 2.06, "eval_loss": Infinity, "eval_runtime": 779.7088, "eval_samples_per_second": 18.937, "eval_steps_per_second": 2.368, "eval_wer": 0.27665648423331796, "step": 4700 }, { "epoch": 2.11, "eval_loss": Infinity, "eval_runtime": 780.5896, "eval_samples_per_second": 18.915, "eval_steps_per_second": 2.365, "eval_wer": 0.28240047993049283, "step": 4800 }, { "epoch": 2.15, "eval_loss": Infinity, "eval_runtime": 781.7435, "eval_samples_per_second": 18.887, "eval_steps_per_second": 2.361, "eval_wer": 0.27986291640521027, "step": 4900 }, { "epoch": 2.19, "learning_rate": 0.0005873336392840752, "loss": 0.3162, "step": 5000 }, { "epoch": 2.19, "eval_loss": Infinity, "eval_runtime": 785.7508, "eval_samples_per_second": 18.791, "eval_steps_per_second": 2.349, "eval_wer": 0.26727853207466507, "step": 5000 }, { "epoch": 2.24, "eval_loss": Infinity, "eval_runtime": 789.097, "eval_samples_per_second": 18.711, "eval_steps_per_second": 2.339, "eval_wer": 0.2961915860461588, "step": 5100 }, { "epoch": 2.28, "eval_loss": Infinity, "eval_runtime": 782.4986, "eval_samples_per_second": 18.869, "eval_steps_per_second": 2.359, "eval_wer": 0.2735948586756401, "step": 5200 }, { "epoch": 2.33, "eval_loss": Infinity, "eval_runtime": 780.5596, "eval_samples_per_second": 18.916, "eval_steps_per_second": 2.365, "eval_wer": 0.2651547017328525, "step": 5300 }, { "epoch": 2.37, "eval_loss": Infinity, "eval_runtime": 782.8773, "eval_samples_per_second": 18.86, "eval_steps_per_second": 2.358, "eval_wer": 0.2550527165031271, "step": 5400 }, { "epoch": 2.41, "learning_rate": 0.0005414410279944929, "loss": 0.3063, "step": 5500 }, { "epoch": 2.41, "eval_loss": Infinity, "eval_runtime": 779.9742, "eval_samples_per_second": 18.93, "eval_steps_per_second": 2.367, "eval_wer": 0.26804393846408453, "step": 5500 }, { "epoch": 2.46, "eval_loss": Infinity, "eval_runtime": 783.4711, "eval_samples_per_second": 18.846, "eval_steps_per_second": 2.356, "eval_wer": 0.2557767495741996, "step": 5600 }, { "epoch": 2.5, "eval_loss": Infinity, "eval_runtime": 792.9653, "eval_samples_per_second": 18.62, "eval_steps_per_second": 2.328, "eval_wer": 0.2597830659008006, "step": 5700 }, { "epoch": 2.54, "eval_loss": Infinity, "eval_runtime": 788.5494, "eval_samples_per_second": 18.724, "eval_steps_per_second": 2.341, "eval_wer": 0.25175664214148297, "step": 5800 }, { "epoch": 2.59, "eval_loss": Infinity, "eval_runtime": 777.5477, "eval_samples_per_second": 18.989, "eval_steps_per_second": 2.374, "eval_wer": 0.254149399052551, "step": 5900 }, { "epoch": 2.63, "learning_rate": 0.0004955484167049105, "loss": 0.2913, "step": 6000 }, { "epoch": 2.63, "eval_loss": Infinity, "eval_runtime": 785.1255, "eval_samples_per_second": 18.806, "eval_steps_per_second": 2.351, "eval_wer": 0.2507361002889237, "step": 6000 }, { "epoch": 2.68, "eval_loss": Infinity, "eval_runtime": 785.3479, "eval_samples_per_second": 18.801, "eval_steps_per_second": 2.351, "eval_wer": 0.24998448500561987, "step": 6100 }, { "epoch": 2.72, "eval_loss": Infinity, "eval_runtime": 781.3987, "eval_samples_per_second": 18.896, "eval_steps_per_second": 2.362, "eval_wer": 0.24352335179043036, "step": 6200 }, { "epoch": 2.76, "eval_loss": Infinity, "eval_runtime": 781.4686, "eval_samples_per_second": 18.894, "eval_steps_per_second": 2.362, "eval_wer": 0.23755180284234698, "step": 6300 }, { "epoch": 2.81, "eval_loss": Infinity, "eval_runtime": 775.7634, "eval_samples_per_second": 19.033, "eval_steps_per_second": 2.38, "eval_wer": 0.23476599940698245, "step": 6400 }, { "epoch": 2.85, "learning_rate": 0.0004497475906379073, "loss": 0.2797, "step": 6500 }, { "epoch": 2.85, "eval_loss": Infinity, "eval_runtime": 772.9219, "eval_samples_per_second": 19.103, "eval_steps_per_second": 2.388, "eval_wer": 0.2512049978968563, "step": 6500 }, { "epoch": 2.9, "eval_loss": Infinity, "eval_runtime": 771.2336, "eval_samples_per_second": 19.145, "eval_steps_per_second": 2.394, "eval_wer": 0.23818619372366762, "step": 6600 }, { "epoch": 2.94, "eval_loss": Infinity, "eval_runtime": 777.0185, "eval_samples_per_second": 19.002, "eval_steps_per_second": 2.376, "eval_wer": 0.2523082863861096, "step": 6700 }, { "epoch": 2.98, "eval_loss": Infinity, "eval_runtime": 773.6017, "eval_samples_per_second": 19.086, "eval_steps_per_second": 2.386, "eval_wer": 0.25221864419635776, "step": 6800 }, { "epoch": 3.03, "eval_loss": Infinity, "eval_runtime": 780.1394, "eval_samples_per_second": 18.926, "eval_steps_per_second": 2.366, "eval_wer": 0.24091683273456949, "step": 6900 }, { "epoch": 3.07, "learning_rate": 0.0004038549793483249, "loss": 0.2766, "step": 7000 }, { "epoch": 3.07, "eval_loss": Infinity, "eval_runtime": 783.1904, "eval_samples_per_second": 18.852, "eval_steps_per_second": 2.357, "eval_wer": 0.24534377779769825, "step": 7000 }, { "epoch": 3.12, "eval_loss": Infinity, "eval_runtime": 777.1186, "eval_samples_per_second": 19.0, "eval_steps_per_second": 2.375, "eval_wer": 0.2326076912998807, "step": 7100 }, { "epoch": 3.16, "eval_loss": Infinity, "eval_runtime": 781.1613, "eval_samples_per_second": 18.901, "eval_steps_per_second": 2.363, "eval_wer": 0.22860137497327973, "step": 7200 }, { "epoch": 3.2, "eval_loss": Infinity, "eval_runtime": 786.2675, "eval_samples_per_second": 18.779, "eval_steps_per_second": 2.348, "eval_wer": 0.23420745960929795, "step": 7300 }, { "epoch": 3.25, "eval_loss": Infinity, "eval_runtime": 781.7233, "eval_samples_per_second": 18.888, "eval_steps_per_second": 2.361, "eval_wer": 0.23047006985195248, "step": 7400 }, { "epoch": 3.29, "learning_rate": 0.0003579623680587425, "loss": 0.2468, "step": 7500 }, { "epoch": 3.29, "eval_loss": Infinity, "eval_runtime": 777.7207, "eval_samples_per_second": 18.985, "eval_steps_per_second": 2.374, "eval_wer": 0.2238089655980858, "step": 7500 }, { "epoch": 3.33, "eval_loss": Infinity, "eval_runtime": 786.7846, "eval_samples_per_second": 18.766, "eval_steps_per_second": 2.346, "eval_wer": 0.23211121147971672, "step": 7600 }, { "epoch": 3.38, "eval_loss": Infinity, "eval_runtime": 784.5553, "eval_samples_per_second": 18.82, "eval_steps_per_second": 2.353, "eval_wer": 0.23048386095806814, "step": 7700 }, { "epoch": 3.42, "eval_loss": Infinity, "eval_runtime": 776.8796, "eval_samples_per_second": 19.006, "eval_steps_per_second": 2.376, "eval_wer": 0.21740989236041677, "step": 7800 }, { "epoch": 3.47, "eval_loss": Infinity, "eval_runtime": 778.8968, "eval_samples_per_second": 18.956, "eval_steps_per_second": 2.37, "eval_wer": 0.22008536694685596, "step": 7900 }, { "epoch": 3.51, "learning_rate": 0.00031206975676916014, "loss": 0.2439, "step": 8000 }, { "epoch": 3.51, "eval_loss": Infinity, "eval_runtime": 785.8625, "eval_samples_per_second": 18.788, "eval_steps_per_second": 2.349, "eval_wer": 0.21332772495017963, "step": 8000 }, { "epoch": 3.55, "eval_loss": Infinity, "eval_runtime": 778.9388, "eval_samples_per_second": 18.955, "eval_steps_per_second": 2.37, "eval_wer": 0.22168513525627323, "step": 8100 }, { "epoch": 3.6, "eval_loss": Infinity, "eval_runtime": 779.3965, "eval_samples_per_second": 18.944, "eval_steps_per_second": 2.368, "eval_wer": 0.21885106294950388, "step": 8200 }, { "epoch": 3.64, "eval_loss": Infinity, "eval_runtime": 786.4104, "eval_samples_per_second": 18.775, "eval_steps_per_second": 2.347, "eval_wer": 0.2105212348556416, "step": 8300 }, { "epoch": 3.69, "eval_loss": Infinity, "eval_runtime": 784.1132, "eval_samples_per_second": 18.83, "eval_steps_per_second": 2.354, "eval_wer": 0.21176932995910938, "step": 8400 }, { "epoch": 3.73, "learning_rate": 0.0002661771454795778, "loss": 0.2357, "step": 8500 }, { "epoch": 3.73, "eval_loss": Infinity, "eval_runtime": 776.0702, "eval_samples_per_second": 19.025, "eval_steps_per_second": 2.379, "eval_wer": 0.20932830417663648, "step": 8500 }, { "epoch": 3.77, "eval_loss": Infinity, "eval_runtime": 777.6609, "eval_samples_per_second": 18.986, "eval_steps_per_second": 2.374, "eval_wer": 0.21030747271084876, "step": 8600 }, { "epoch": 3.82, "eval_loss": Infinity, "eval_runtime": 773.9787, "eval_samples_per_second": 19.077, "eval_steps_per_second": 2.385, "eval_wer": 0.20353603960805677, "step": 8700 }, { "epoch": 3.86, "eval_loss": Infinity, "eval_runtime": 780.5659, "eval_samples_per_second": 18.916, "eval_steps_per_second": 2.365, "eval_wer": 0.2019362712986395, "step": 8800 }, { "epoch": 3.91, "eval_loss": Infinity, "eval_runtime": 779.996, "eval_samples_per_second": 18.93, "eval_steps_per_second": 2.367, "eval_wer": 0.20323953082656995, "step": 8900 }, { "epoch": 3.95, "learning_rate": 0.0002203763194125746, "loss": 0.2217, "step": 9000 }, { "epoch": 3.95, "eval_loss": Infinity, "eval_runtime": 778.6538, "eval_samples_per_second": 18.962, "eval_steps_per_second": 2.371, "eval_wer": 0.20561849663152232, "step": 9000 }, { "epoch": 3.99, "eval_loss": Infinity, "eval_runtime": 778.3405, "eval_samples_per_second": 18.97, "eval_steps_per_second": 2.372, "eval_wer": 0.20215003344343233, "step": 9100 }, { "epoch": 4.04, "eval_loss": Infinity, "eval_runtime": 787.2038, "eval_samples_per_second": 18.756, "eval_steps_per_second": 2.345, "eval_wer": 0.19324787444576993, "step": 9200 }, { "epoch": 4.08, "eval_loss": Infinity, "eval_runtime": 775.7143, "eval_samples_per_second": 19.034, "eval_steps_per_second": 2.38, "eval_wer": 0.19350300990890976, "step": 9300 }, { "epoch": 4.12, "eval_loss": Infinity, "eval_runtime": 773.9153, "eval_samples_per_second": 19.078, "eval_steps_per_second": 2.385, "eval_wer": 0.1905655043062729, "step": 9400 }, { "epoch": 4.17, "learning_rate": 0.0001744837081229922, "loss": 0.2025, "step": 9500 }, { "epoch": 4.17, "eval_loss": Infinity, "eval_runtime": 779.0392, "eval_samples_per_second": 18.953, "eval_steps_per_second": 2.37, "eval_wer": 0.18794519414429633, "step": 9500 }, { "epoch": 4.21, "eval_loss": Infinity, "eval_runtime": 779.0747, "eval_samples_per_second": 18.952, "eval_steps_per_second": 2.369, "eval_wer": 0.18824859847884098, "step": 9600 }, { "epoch": 4.26, "eval_loss": Infinity, "eval_runtime": 777.6573, "eval_samples_per_second": 18.987, "eval_steps_per_second": 2.374, "eval_wer": 0.18538004840678246, "step": 9700 }, { "epoch": 4.3, "eval_loss": Infinity, "eval_runtime": 772.7615, "eval_samples_per_second": 19.107, "eval_steps_per_second": 2.389, "eval_wer": 0.18654539687355626, "step": 9800 }, { "epoch": 4.34, "eval_loss": Infinity, "eval_runtime": 778.0179, "eval_samples_per_second": 18.978, "eval_steps_per_second": 2.373, "eval_wer": 0.18438708876645452, "step": 9900 }, { "epoch": 4.39, "learning_rate": 0.00012859109683340984, "loss": 0.1869, "step": 10000 }, { "epoch": 4.39, "eval_loss": Infinity, "eval_runtime": 778.8028, "eval_samples_per_second": 18.959, "eval_steps_per_second": 2.37, "eval_wer": 0.1821667206818323, "step": 10000 }, { "epoch": 4.43, "eval_loss": Infinity, "eval_runtime": 777.366, "eval_samples_per_second": 18.994, "eval_steps_per_second": 2.375, "eval_wer": 0.1815461209066273, "step": 10100 }, { "epoch": 4.48, "eval_loss": Infinity, "eval_runtime": 781.9611, "eval_samples_per_second": 18.882, "eval_steps_per_second": 2.361, "eval_wer": 0.18118755214762, "step": 10200 }, { "epoch": 4.52, "eval_loss": Infinity, "eval_runtime": 760.9314, "eval_samples_per_second": 19.404, "eval_steps_per_second": 2.426, "eval_wer": 0.17923611063225325, "step": 10300 }, { "epoch": 4.56, "eval_loss": Infinity, "eval_runtime": 761.9088, "eval_samples_per_second": 19.379, "eval_steps_per_second": 2.423, "eval_wer": 0.17967742602795458, "step": 10400 }, { "epoch": 4.61, "learning_rate": 8.269848554382745e-05, "loss": 0.1863, "step": 10500 }, { "epoch": 4.61, "eval_loss": Infinity, "eval_runtime": 760.7934, "eval_samples_per_second": 19.407, "eval_steps_per_second": 2.426, "eval_wer": 0.1773812068596962, "step": 10500 }, { "epoch": 4.65, "eval_loss": Infinity, "eval_runtime": 755.7192, "eval_samples_per_second": 19.538, "eval_steps_per_second": 2.443, "eval_wer": 0.1767330248722599, "step": 10600 }, { "epoch": 4.7, "eval_loss": Infinity, "eval_runtime": 756.3189, "eval_samples_per_second": 19.522, "eval_steps_per_second": 2.441, "eval_wer": 0.17650547162135138, "step": 10700 }, { "epoch": 4.74, "eval_loss": Infinity, "eval_runtime": 761.0501, "eval_samples_per_second": 19.401, "eval_steps_per_second": 2.426, "eval_wer": 0.1752918542831728, "step": 10800 }, { "epoch": 4.78, "eval_loss": Infinity, "eval_runtime": 756.3701, "eval_samples_per_second": 19.521, "eval_steps_per_second": 2.441, "eval_wer": 0.17308527730466622, "step": 10900 }, { "epoch": 4.83, "learning_rate": 3.6805874254245066e-05, "loss": 0.178, "step": 11000 }, { "epoch": 4.83, "eval_loss": Infinity, "eval_runtime": 758.6147, "eval_samples_per_second": 19.463, "eval_steps_per_second": 2.433, "eval_wer": 0.17265775301508057, "step": 11000 }, { "epoch": 4.87, "eval_loss": Infinity, "eval_runtime": 759.5074, "eval_samples_per_second": 19.44, "eval_steps_per_second": 2.431, "eval_wer": 0.17243709531722992, "step": 11100 }, { "epoch": 4.91, "eval_loss": Infinity, "eval_runtime": 757.3653, "eval_samples_per_second": 19.495, "eval_steps_per_second": 2.437, "eval_wer": 0.17223022872549493, "step": 11200 }, { "epoch": 4.96, "eval_loss": Infinity, "eval_runtime": 756.4761, "eval_samples_per_second": 19.518, "eval_steps_per_second": 2.44, "eval_wer": 0.17115452244847298, "step": 11300 }, { "epoch": 5.0, "step": 11395, "total_flos": 1.0194681891264653e+20, "train_loss": 0.4200820018974194, "train_runtime": 124144.1421, "train_samples_per_second": 5.872, "train_steps_per_second": 0.092 } ], "max_steps": 11395, "num_train_epochs": 5, "total_flos": 1.0194681891264653e+20, "trial_name": null, "trial_params": null }