{ "best_metric": 0.14607747395833334, "best_model_checkpoint": "/cluster/home/torstefl/Master/saved_model/W2V/single/NB/NB-1b-19.06/checkpoint-3432", "epoch": 40.0, "eval_steps": 500, "global_step": 3520, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "grad_norm": 10.972672462463379, "learning_rate": 1.1600000000000001e-06, "loss": 0.8305, "step": 88 }, { "epoch": 1.0, "eval_rundkast_loss": 0.506217360496521, "eval_rundkast_runtime": 31.8232, "eval_rundkast_samples_per_second": 42.076, "eval_rundkast_steps_per_second": 1.32, "eval_rundkast_wer": 0.20532714765637497, "step": 88 }, { "epoch": 1.0, "eval_nb_samtale_loss": 0.7159814238548279, "eval_nb_samtale_runtime": 38.8295, "eval_nb_samtale_samples_per_second": 13.727, "eval_nb_samtale_steps_per_second": 0.438, "eval_nb_samtale_wer": 0.20125325520833334, "step": 88 }, { "epoch": 1.0, "eval_bigbrother_loss": 2.73382568359375, "eval_bigbrother_runtime": 45.0269, "eval_bigbrother_samples_per_second": 30.426, "eval_bigbrother_steps_per_second": 0.955, "eval_bigbrother_wer": 0.5745589301538709, "step": 88 }, { "epoch": 2.0, "grad_norm": 6.6329345703125, "learning_rate": 2.3333333333333336e-06, "loss": 0.6423, "step": 176 }, { "epoch": 2.0, "eval_rundkast_loss": 0.42037609219551086, "eval_rundkast_runtime": 31.233, "eval_rundkast_samples_per_second": 42.871, "eval_rundkast_steps_per_second": 1.345, "eval_rundkast_wer": 0.2020476723724204, "step": 176 }, { "epoch": 2.0, "eval_nb_samtale_loss": 0.5762496590614319, "eval_nb_samtale_runtime": 38.6529, "eval_nb_samtale_samples_per_second": 13.789, "eval_nb_samtale_steps_per_second": 0.44, "eval_nb_samtale_wer": 0.19417317708333334, "step": 176 }, { "epoch": 2.0, "eval_bigbrother_loss": 2.2738213539123535, "eval_bigbrother_runtime": 44.7689, "eval_bigbrother_samples_per_second": 30.602, "eval_bigbrother_steps_per_second": 0.96, "eval_bigbrother_wer": 0.5613469749456216, "step": 176 }, { "epoch": 3.0, "grad_norm": 4.364439964294434, "learning_rate": 3.5066666666666673e-06, "loss": 0.5857, "step": 264 }, { "epoch": 3.0, "eval_rundkast_loss": 0.41098639369010925, "eval_rundkast_runtime": 31.3258, "eval_rundkast_samples_per_second": 42.744, "eval_rundkast_steps_per_second": 1.341, "eval_rundkast_wer": 0.1977283634618461, "step": 264 }, { "epoch": 3.0, "eval_nb_samtale_loss": 0.5280192494392395, "eval_nb_samtale_runtime": 38.586, "eval_nb_samtale_samples_per_second": 13.813, "eval_nb_samtale_steps_per_second": 0.441, "eval_nb_samtale_wer": 0.18359375, "step": 264 }, { "epoch": 3.0, "eval_bigbrother_loss": 2.192491054534912, "eval_bigbrother_runtime": 44.8015, "eval_bigbrother_samples_per_second": 30.579, "eval_bigbrother_steps_per_second": 0.96, "eval_bigbrother_wer": 0.5548215580439861, "step": 264 }, { "epoch": 4.0, "grad_norm": 5.418688774108887, "learning_rate": 4.680000000000001e-06, "loss": 0.5332, "step": 352 }, { "epoch": 4.0, "eval_rundkast_loss": 0.3839390277862549, "eval_rundkast_runtime": 31.2002, "eval_rundkast_samples_per_second": 42.916, "eval_rundkast_steps_per_second": 1.346, "eval_rundkast_wer": 0.19900815869460886, "step": 352 }, { "epoch": 4.0, "eval_nb_samtale_loss": 0.48143112659454346, "eval_nb_samtale_runtime": 38.3454, "eval_nb_samtale_samples_per_second": 13.9, "eval_nb_samtale_steps_per_second": 0.443, "eval_nb_samtale_wer": 0.179443359375, "step": 352 }, { "epoch": 4.0, "eval_bigbrother_loss": 2.0169622898101807, "eval_bigbrother_runtime": 44.7675, "eval_bigbrother_samples_per_second": 30.603, "eval_bigbrother_steps_per_second": 0.961, "eval_bigbrother_wer": 0.5486183839523081, "step": 352 }, { "epoch": 5.0, "grad_norm": 6.6992034912109375, "learning_rate": 5.853333333333335e-06, "loss": 0.5117, "step": 440 }, { "epoch": 5.0, "eval_rundkast_loss": 0.38616734743118286, "eval_rundkast_runtime": 31.1274, "eval_rundkast_samples_per_second": 43.017, "eval_rundkast_steps_per_second": 1.349, "eval_rundkast_wer": 0.1986082226843705, "step": 440 }, { "epoch": 5.0, "eval_nb_samtale_loss": 0.46892496943473816, "eval_nb_samtale_runtime": 38.4436, "eval_nb_samtale_samples_per_second": 13.864, "eval_nb_samtale_steps_per_second": 0.442, "eval_nb_samtale_wer": 0.17545572916666666, "step": 440 }, { "epoch": 5.0, "eval_bigbrother_loss": 1.9676716327667236, "eval_bigbrother_runtime": 44.7467, "eval_bigbrother_samples_per_second": 30.617, "eval_bigbrother_steps_per_second": 0.961, "eval_bigbrother_wer": 0.5392733424635463, "step": 440 }, { "epoch": 6.0, "grad_norm": 4.8291120529174805, "learning_rate": 7.0266666666666674e-06, "loss": 0.4809, "step": 528 }, { "epoch": 6.0, "eval_rundkast_loss": 0.37009599804878235, "eval_rundkast_runtime": 31.2555, "eval_rundkast_samples_per_second": 42.84, "eval_rundkast_steps_per_second": 1.344, "eval_rundkast_wer": 0.19636858102703567, "step": 528 }, { "epoch": 6.0, "eval_nb_samtale_loss": 0.4429633915424347, "eval_nb_samtale_runtime": 38.3862, "eval_nb_samtale_samples_per_second": 13.885, "eval_nb_samtale_steps_per_second": 0.443, "eval_nb_samtale_wer": 0.17342122395833334, "step": 528 }, { "epoch": 6.0, "eval_bigbrother_loss": 1.9097399711608887, "eval_bigbrother_runtime": 44.7043, "eval_bigbrother_samples_per_second": 30.646, "eval_bigbrother_steps_per_second": 0.962, "eval_bigbrother_wer": 0.5354869894465479, "step": 528 }, { "epoch": 7.0, "grad_norm": 6.0818376541137695, "learning_rate": 8.2e-06, "loss": 0.4485, "step": 616 }, { "epoch": 7.0, "eval_rundkast_loss": 0.39074423909187317, "eval_rundkast_runtime": 31.2655, "eval_rundkast_samples_per_second": 42.827, "eval_rundkast_steps_per_second": 1.343, "eval_rundkast_wer": 0.19580867061270196, "step": 616 }, { "epoch": 7.0, "eval_nb_samtale_loss": 0.44968363642692566, "eval_nb_samtale_runtime": 38.4136, "eval_nb_samtale_samples_per_second": 13.875, "eval_nb_samtale_steps_per_second": 0.443, "eval_nb_samtale_wer": 0.17179361979166666, "step": 616 }, { "epoch": 7.0, "eval_bigbrother_loss": 2.002044439315796, "eval_bigbrother_runtime": 44.9245, "eval_bigbrother_samples_per_second": 30.496, "eval_bigbrother_steps_per_second": 0.957, "eval_bigbrother_wer": 0.5383871747361637, "step": 616 }, { "epoch": 8.0, "grad_norm": 5.505432605743408, "learning_rate": 9.373333333333334e-06, "loss": 0.4364, "step": 704 }, { "epoch": 8.0, "eval_rundkast_loss": 0.38471347093582153, "eval_rundkast_runtime": 31.9089, "eval_rundkast_samples_per_second": 41.963, "eval_rundkast_steps_per_second": 1.316, "eval_rundkast_wer": 0.1968485042393217, "step": 704 }, { "epoch": 8.0, "eval_nb_samtale_loss": 0.45092540979385376, "eval_nb_samtale_runtime": 38.457, "eval_nb_samtale_samples_per_second": 13.86, "eval_nb_samtale_steps_per_second": 0.442, "eval_nb_samtale_wer": 0.16552734375, "step": 704 }, { "epoch": 8.0, "eval_bigbrother_loss": 1.967365026473999, "eval_bigbrother_runtime": 45.046, "eval_bigbrother_samples_per_second": 30.413, "eval_bigbrother_steps_per_second": 0.955, "eval_bigbrother_wer": 0.5337146539917829, "step": 704 }, { "epoch": 9.0, "grad_norm": 12.103546142578125, "learning_rate": 1.0546666666666667e-05, "loss": 0.4194, "step": 792 }, { "epoch": 9.0, "eval_rundkast_loss": 0.37225037813186646, "eval_rundkast_runtime": 31.1897, "eval_rundkast_samples_per_second": 42.931, "eval_rundkast_steps_per_second": 1.347, "eval_rundkast_wer": 0.1936490161574148, "step": 792 }, { "epoch": 9.0, "eval_nb_samtale_loss": 0.42615896463394165, "eval_nb_samtale_runtime": 38.2289, "eval_nb_samtale_samples_per_second": 13.942, "eval_nb_samtale_steps_per_second": 0.445, "eval_nb_samtale_wer": 0.164306640625, "step": 792 }, { "epoch": 9.0, "eval_bigbrother_loss": 1.930216908454895, "eval_bigbrother_runtime": 44.8984, "eval_bigbrother_samples_per_second": 30.513, "eval_bigbrother_steps_per_second": 0.958, "eval_bigbrother_wer": 0.5332312897768469, "step": 792 }, { "epoch": 10.0, "grad_norm": 8.539125442504883, "learning_rate": 1.172e-05, "loss": 0.4004, "step": 880 }, { "epoch": 10.0, "eval_rundkast_loss": 0.3706592917442322, "eval_rundkast_runtime": 31.2141, "eval_rundkast_samples_per_second": 42.897, "eval_rundkast_steps_per_second": 1.346, "eval_rundkast_wer": 0.1950887857942729, "step": 880 }, { "epoch": 10.0, "eval_nb_samtale_loss": 0.4074735939502716, "eval_nb_samtale_runtime": 38.275, "eval_nb_samtale_samples_per_second": 13.926, "eval_nb_samtale_steps_per_second": 0.444, "eval_nb_samtale_wer": 0.16300455729166666, "step": 880 }, { "epoch": 10.0, "eval_bigbrother_loss": 1.9817578792572021, "eval_bigbrother_runtime": 44.6517, "eval_bigbrother_samples_per_second": 30.682, "eval_bigbrother_steps_per_second": 0.963, "eval_bigbrother_wer": 0.5371787641988238, "step": 880 }, { "epoch": 11.0, "grad_norm": 4.635890007019043, "learning_rate": 1.2893333333333336e-05, "loss": 0.3842, "step": 968 }, { "epoch": 11.0, "eval_rundkast_loss": 0.39748790860176086, "eval_rundkast_runtime": 31.2552, "eval_rundkast_samples_per_second": 42.841, "eval_rundkast_steps_per_second": 1.344, "eval_rundkast_wer": 0.19588865781474965, "step": 968 }, { "epoch": 11.0, "eval_nb_samtale_loss": 0.4311392307281494, "eval_nb_samtale_runtime": 38.4527, "eval_nb_samtale_samples_per_second": 13.861, "eval_nb_samtale_steps_per_second": 0.442, "eval_nb_samtale_wer": 0.164794921875, "step": 968 }, { "epoch": 11.0, "eval_bigbrother_loss": 1.9875516891479492, "eval_bigbrother_runtime": 44.694, "eval_bigbrother_samples_per_second": 30.653, "eval_bigbrother_steps_per_second": 0.962, "eval_bigbrother_wer": 0.5363731571739305, "step": 968 }, { "epoch": 12.0, "grad_norm": 7.757190704345703, "learning_rate": 1.4053333333333335e-05, "loss": 0.3739, "step": 1056 }, { "epoch": 12.0, "eval_rundkast_loss": 0.41941559314727783, "eval_rundkast_runtime": 31.7689, "eval_rundkast_samples_per_second": 42.148, "eval_rundkast_steps_per_second": 1.322, "eval_rundkast_wer": 0.191649336106223, "step": 1056 }, { "epoch": 12.0, "eval_nb_samtale_loss": 0.4516970217227936, "eval_nb_samtale_runtime": 38.6901, "eval_nb_samtale_samples_per_second": 13.776, "eval_nb_samtale_steps_per_second": 0.439, "eval_nb_samtale_wer": 0.15885416666666666, "step": 1056 }, { "epoch": 12.0, "eval_bigbrother_loss": 2.081986904144287, "eval_bigbrother_runtime": 44.6453, "eval_bigbrother_samples_per_second": 30.686, "eval_bigbrother_steps_per_second": 0.963, "eval_bigbrother_wer": 0.5287198904374446, "step": 1056 }, { "epoch": 13.0, "grad_norm": 12.277324676513672, "learning_rate": 1.5226666666666668e-05, "loss": 0.3641, "step": 1144 }, { "epoch": 13.0, "eval_rundkast_loss": 0.4138753414154053, "eval_rundkast_runtime": 31.1718, "eval_rundkast_samples_per_second": 42.956, "eval_rundkast_steps_per_second": 1.347, "eval_rundkast_wer": 0.19524876019836826, "step": 1144 }, { "epoch": 13.0, "eval_nb_samtale_loss": 0.42660218477249146, "eval_nb_samtale_runtime": 38.7065, "eval_nb_samtale_samples_per_second": 13.77, "eval_nb_samtale_steps_per_second": 0.439, "eval_nb_samtale_wer": 0.16324869791666666, "step": 1144 }, { "epoch": 13.0, "eval_bigbrother_loss": 2.037122964859009, "eval_bigbrother_runtime": 45.1132, "eval_bigbrother_samples_per_second": 30.368, "eval_bigbrother_steps_per_second": 0.953, "eval_bigbrother_wer": 0.5277531620075727, "step": 1144 }, { "epoch": 14.0, "grad_norm": 6.313786506652832, "learning_rate": 1.64e-05, "loss": 0.3745, "step": 1232 }, { "epoch": 14.0, "eval_rundkast_loss": 0.40043848752975464, "eval_rundkast_runtime": 31.4205, "eval_rundkast_samples_per_second": 42.616, "eval_rundkast_steps_per_second": 1.337, "eval_rundkast_wer": 0.196048632218845, "step": 1232 }, { "epoch": 14.0, "eval_nb_samtale_loss": 0.43297895789146423, "eval_nb_samtale_runtime": 38.2868, "eval_nb_samtale_samples_per_second": 13.921, "eval_nb_samtale_steps_per_second": 0.444, "eval_nb_samtale_wer": 0.15926106770833334, "step": 1232 }, { "epoch": 14.0, "eval_bigbrother_loss": 2.02278995513916, "eval_bigbrother_runtime": 44.7867, "eval_bigbrother_samples_per_second": 30.589, "eval_bigbrother_steps_per_second": 0.96, "eval_bigbrother_wer": 0.5295254974623379, "step": 1232 }, { "epoch": 15.0, "grad_norm": 8.265440940856934, "learning_rate": 1.756e-05, "loss": 0.3399, "step": 1320 }, { "epoch": 15.0, "eval_rundkast_loss": 0.4764655530452728, "eval_rundkast_runtime": 31.1836, "eval_rundkast_samples_per_second": 42.939, "eval_rundkast_steps_per_second": 1.347, "eval_rundkast_wer": 0.196528555431131, "step": 1320 }, { "epoch": 15.0, "eval_nb_samtale_loss": 0.4471026062965393, "eval_nb_samtale_runtime": 38.1832, "eval_nb_samtale_samples_per_second": 13.959, "eval_nb_samtale_steps_per_second": 0.445, "eval_nb_samtale_wer": 0.15681966145833334, "step": 1320 }, { "epoch": 15.0, "eval_bigbrother_loss": 2.3220856189727783, "eval_bigbrother_runtime": 44.7848, "eval_bigbrother_samples_per_second": 30.591, "eval_bigbrother_steps_per_second": 0.96, "eval_bigbrother_wer": 0.5332312897768469, "step": 1320 }, { "epoch": 16.0, "grad_norm": 7.783019542694092, "learning_rate": 1.8733333333333336e-05, "loss": 0.3234, "step": 1408 }, { "epoch": 16.0, "eval_rundkast_loss": 0.46145308017730713, "eval_rundkast_runtime": 31.6896, "eval_rundkast_samples_per_second": 42.254, "eval_rundkast_steps_per_second": 1.325, "eval_rundkast_wer": 0.19580867061270196, "step": 1408 }, { "epoch": 16.0, "eval_nb_samtale_loss": 0.42990735173225403, "eval_nb_samtale_runtime": 38.25, "eval_nb_samtale_samples_per_second": 13.935, "eval_nb_samtale_steps_per_second": 0.444, "eval_nb_samtale_wer": 0.156494140625, "step": 1408 }, { "epoch": 16.0, "eval_bigbrother_loss": 2.225994110107422, "eval_bigbrother_runtime": 44.8274, "eval_bigbrother_samples_per_second": 30.562, "eval_bigbrother_steps_per_second": 0.959, "eval_bigbrother_wer": 0.5260613872552968, "step": 1408 }, { "epoch": 17.0, "grad_norm": 4.970972537994385, "learning_rate": 1.9906666666666667e-05, "loss": 0.3201, "step": 1496 }, { "epoch": 17.0, "eval_rundkast_loss": 0.4546896815299988, "eval_rundkast_runtime": 31.3176, "eval_rundkast_samples_per_second": 42.756, "eval_rundkast_steps_per_second": 1.341, "eval_rundkast_wer": 0.19300911854103345, "step": 1496 }, { "epoch": 17.0, "eval_nb_samtale_loss": 0.4340006113052368, "eval_nb_samtale_runtime": 38.2709, "eval_nb_samtale_samples_per_second": 13.927, "eval_nb_samtale_steps_per_second": 0.444, "eval_nb_samtale_wer": 0.15616861979166666, "step": 1496 }, { "epoch": 17.0, "eval_bigbrother_loss": 2.141953945159912, "eval_bigbrother_runtime": 44.7194, "eval_bigbrother_samples_per_second": 30.635, "eval_bigbrother_steps_per_second": 0.962, "eval_bigbrother_wer": 0.5173608313864497, "step": 1496 }, { "epoch": 18.0, "grad_norm": 4.4445576667785645, "learning_rate": 1.91980198019802e-05, "loss": 0.3069, "step": 1584 }, { "epoch": 18.0, "eval_rundkast_loss": 0.47925588488578796, "eval_rundkast_runtime": 31.2291, "eval_rundkast_samples_per_second": 42.877, "eval_rundkast_steps_per_second": 1.345, "eval_rundkast_wer": 0.19676851703727405, "step": 1584 }, { "epoch": 18.0, "eval_nb_samtale_loss": 0.4501398503780365, "eval_nb_samtale_runtime": 38.2766, "eval_nb_samtale_samples_per_second": 13.925, "eval_nb_samtale_steps_per_second": 0.444, "eval_nb_samtale_wer": 0.158203125, "step": 1584 }, { "epoch": 18.0, "eval_bigbrother_loss": 2.33626651763916, "eval_bigbrother_runtime": 44.7536, "eval_bigbrother_samples_per_second": 30.612, "eval_bigbrother_steps_per_second": 0.961, "eval_bigbrother_wer": 0.5310561508096351, "step": 1584 }, { "epoch": 19.0, "grad_norm": 4.55182409286499, "learning_rate": 1.832673267326733e-05, "loss": 0.2912, "step": 1672 }, { "epoch": 19.0, "eval_rundkast_loss": 0.4635383188724518, "eval_rundkast_runtime": 31.6064, "eval_rundkast_samples_per_second": 42.365, "eval_rundkast_steps_per_second": 1.329, "eval_rundkast_wer": 0.20028795392737161, "step": 1672 }, { "epoch": 19.0, "eval_nb_samtale_loss": 0.4135359227657318, "eval_nb_samtale_runtime": 38.4073, "eval_nb_samtale_samples_per_second": 13.878, "eval_nb_samtale_steps_per_second": 0.443, "eval_nb_samtale_wer": 0.156494140625, "step": 1672 }, { "epoch": 19.0, "eval_bigbrother_loss": 2.3355190753936768, "eval_bigbrother_runtime": 44.9365, "eval_bigbrother_samples_per_second": 30.487, "eval_bigbrother_steps_per_second": 0.957, "eval_bigbrother_wer": 0.5369370820913558, "step": 1672 }, { "epoch": 20.0, "grad_norm": 4.11824893951416, "learning_rate": 1.7455445544554458e-05, "loss": 0.2824, "step": 1760 }, { "epoch": 20.0, "eval_rundkast_loss": 0.5276007652282715, "eval_rundkast_runtime": 31.3512, "eval_rundkast_samples_per_second": 42.71, "eval_rundkast_steps_per_second": 1.34, "eval_rundkast_wer": 0.196048632218845, "step": 1760 }, { "epoch": 20.0, "eval_nb_samtale_loss": 0.47676244378089905, "eval_nb_samtale_runtime": 38.3319, "eval_nb_samtale_samples_per_second": 13.905, "eval_nb_samtale_steps_per_second": 0.443, "eval_nb_samtale_wer": 0.15804036458333334, "step": 1760 }, { "epoch": 20.0, "eval_bigbrother_loss": 2.57776141166687, "eval_bigbrother_runtime": 44.7907, "eval_bigbrother_samples_per_second": 30.587, "eval_bigbrother_steps_per_second": 0.96, "eval_bigbrother_wer": 0.5436236203979699, "step": 1760 }, { "epoch": 21.0, "grad_norm": 4.462925434112549, "learning_rate": 1.6584158415841584e-05, "loss": 0.2661, "step": 1848 }, { "epoch": 21.0, "eval_rundkast_loss": 0.5087462067604065, "eval_rundkast_runtime": 31.2914, "eval_rundkast_samples_per_second": 42.791, "eval_rundkast_steps_per_second": 1.342, "eval_rundkast_wer": 0.19732842745160775, "step": 1848 }, { "epoch": 21.0, "eval_nb_samtale_loss": 0.44534921646118164, "eval_nb_samtale_runtime": 38.226, "eval_nb_samtale_samples_per_second": 13.943, "eval_nb_samtale_steps_per_second": 0.445, "eval_nb_samtale_wer": 0.15413411458333334, "step": 1848 }, { "epoch": 21.0, "eval_bigbrother_loss": 2.2979142665863037, "eval_bigbrother_runtime": 44.8351, "eval_bigbrother_samples_per_second": 30.556, "eval_bigbrother_steps_per_second": 0.959, "eval_bigbrother_wer": 0.5297671795698059, "step": 1848 }, { "epoch": 22.0, "grad_norm": 3.7362682819366455, "learning_rate": 1.5712871287128716e-05, "loss": 0.2543, "step": 1936 }, { "epoch": 22.0, "eval_rundkast_loss": 0.5440049171447754, "eval_rundkast_runtime": 31.2654, "eval_rundkast_samples_per_second": 42.827, "eval_rundkast_steps_per_second": 1.343, "eval_rundkast_wer": 0.19756838905775076, "step": 1936 }, { "epoch": 22.0, "eval_nb_samtale_loss": 0.486325204372406, "eval_nb_samtale_runtime": 38.3702, "eval_nb_samtale_samples_per_second": 13.891, "eval_nb_samtale_steps_per_second": 0.443, "eval_nb_samtale_wer": 0.15763346354166666, "step": 1936 }, { "epoch": 22.0, "eval_bigbrother_loss": 2.4817354679107666, "eval_bigbrother_runtime": 44.7425, "eval_bigbrother_samples_per_second": 30.62, "eval_bigbrother_steps_per_second": 0.961, "eval_bigbrother_wer": 0.5300088616772738, "step": 1936 }, { "epoch": 23.0, "grad_norm": 3.388705015182495, "learning_rate": 1.4841584158415842e-05, "loss": 0.2522, "step": 2024 }, { "epoch": 23.0, "eval_rundkast_loss": 0.5401936173439026, "eval_rundkast_runtime": 31.3567, "eval_rundkast_samples_per_second": 42.702, "eval_rundkast_steps_per_second": 1.339, "eval_rundkast_wer": 0.19380899056151016, "step": 2024 }, { "epoch": 23.0, "eval_nb_samtale_loss": 0.45578888058662415, "eval_nb_samtale_runtime": 38.2879, "eval_nb_samtale_samples_per_second": 13.921, "eval_nb_samtale_steps_per_second": 0.444, "eval_nb_samtale_wer": 0.15315755208333334, "step": 2024 }, { "epoch": 23.0, "eval_bigbrother_loss": 2.4559385776519775, "eval_bigbrother_runtime": 44.8922, "eval_bigbrother_samples_per_second": 30.518, "eval_bigbrother_steps_per_second": 0.958, "eval_bigbrother_wer": 0.5254169016353822, "step": 2024 }, { "epoch": 24.0, "grad_norm": 4.662117004394531, "learning_rate": 1.3970297029702971e-05, "loss": 0.2544, "step": 2112 }, { "epoch": 24.0, "eval_rundkast_loss": 0.5467772483825684, "eval_rundkast_runtime": 31.3965, "eval_rundkast_samples_per_second": 42.648, "eval_rundkast_steps_per_second": 1.338, "eval_rundkast_wer": 0.1951687729963206, "step": 2112 }, { "epoch": 24.0, "eval_nb_samtale_loss": 0.45863205194473267, "eval_nb_samtale_runtime": 38.2548, "eval_nb_samtale_samples_per_second": 13.933, "eval_nb_samtale_steps_per_second": 0.444, "eval_nb_samtale_wer": 0.151123046875, "step": 2112 }, { "epoch": 24.0, "eval_bigbrother_loss": 2.302259922027588, "eval_bigbrother_runtime": 44.9057, "eval_bigbrother_samples_per_second": 30.508, "eval_bigbrother_steps_per_second": 0.958, "eval_bigbrother_wer": 0.5301699830822525, "step": 2112 }, { "epoch": 25.0, "grad_norm": 2.7924931049346924, "learning_rate": 1.30990099009901e-05, "loss": 0.2445, "step": 2200 }, { "epoch": 25.0, "eval_rundkast_loss": 0.5389044880867004, "eval_rundkast_runtime": 31.3233, "eval_rundkast_samples_per_second": 42.748, "eval_rundkast_steps_per_second": 1.341, "eval_rundkast_wer": 0.19500879859222525, "step": 2200 }, { "epoch": 25.0, "eval_nb_samtale_loss": 0.4871143698692322, "eval_nb_samtale_runtime": 38.3162, "eval_nb_samtale_samples_per_second": 13.911, "eval_nb_samtale_steps_per_second": 0.444, "eval_nb_samtale_wer": 0.15299479166666666, "step": 2200 }, { "epoch": 25.0, "eval_bigbrother_loss": 2.405670166015625, "eval_bigbrother_runtime": 44.8162, "eval_bigbrother_samples_per_second": 30.569, "eval_bigbrother_steps_per_second": 0.959, "eval_bigbrother_wer": 0.5264641907677435, "step": 2200 }, { "epoch": 26.0, "grad_norm": 5.481632232666016, "learning_rate": 1.2227722772277228e-05, "loss": 0.2255, "step": 2288 }, { "epoch": 26.0, "eval_rundkast_loss": 0.5802582502365112, "eval_rundkast_runtime": 31.3722, "eval_rundkast_samples_per_second": 42.681, "eval_rundkast_steps_per_second": 1.339, "eval_rundkast_wer": 0.19820828667413215, "step": 2288 }, { "epoch": 26.0, "eval_nb_samtale_loss": 0.5078674554824829, "eval_nb_samtale_runtime": 38.1701, "eval_nb_samtale_samples_per_second": 13.964, "eval_nb_samtale_steps_per_second": 0.445, "eval_nb_samtale_wer": 0.1533203125, "step": 2288 }, { "epoch": 26.0, "eval_bigbrother_loss": 2.5950069427490234, "eval_bigbrother_runtime": 45.0629, "eval_bigbrother_samples_per_second": 30.402, "eval_bigbrother_steps_per_second": 0.954, "eval_bigbrother_wer": 0.5358897929589946, "step": 2288 }, { "epoch": 27.0, "grad_norm": 6.247470855712891, "learning_rate": 1.1356435643564357e-05, "loss": 0.2317, "step": 2376 }, { "epoch": 27.0, "eval_rundkast_loss": 0.5534220337867737, "eval_rundkast_runtime": 31.8039, "eval_rundkast_samples_per_second": 42.102, "eval_rundkast_steps_per_second": 1.321, "eval_rundkast_wer": 0.19908814589665655, "step": 2376 }, { "epoch": 27.0, "eval_nb_samtale_loss": 0.46262821555137634, "eval_nb_samtale_runtime": 38.5085, "eval_nb_samtale_samples_per_second": 13.841, "eval_nb_samtale_steps_per_second": 0.441, "eval_nb_samtale_wer": 0.15234375, "step": 2376 }, { "epoch": 27.0, "eval_bigbrother_loss": 2.396604537963867, "eval_bigbrother_runtime": 45.0988, "eval_bigbrother_samples_per_second": 30.378, "eval_bigbrother_steps_per_second": 0.953, "eval_bigbrother_wer": 0.5242084910980424, "step": 2376 }, { "epoch": 28.0, "grad_norm": 5.388619899749756, "learning_rate": 1.0485148514851486e-05, "loss": 0.2157, "step": 2464 }, { "epoch": 28.0, "eval_rundkast_loss": 0.565626859664917, "eval_rundkast_runtime": 31.3606, "eval_rundkast_samples_per_second": 42.697, "eval_rundkast_steps_per_second": 1.339, "eval_rundkast_wer": 0.1988481842905135, "step": 2464 }, { "epoch": 28.0, "eval_nb_samtale_loss": 0.4518119990825653, "eval_nb_samtale_runtime": 38.2392, "eval_nb_samtale_samples_per_second": 13.939, "eval_nb_samtale_steps_per_second": 0.445, "eval_nb_samtale_wer": 0.15185546875, "step": 2464 }, { "epoch": 28.0, "eval_bigbrother_loss": 2.401461601257324, "eval_bigbrother_runtime": 44.8671, "eval_bigbrother_samples_per_second": 30.535, "eval_bigbrother_steps_per_second": 0.958, "eval_bigbrother_wer": 0.5246918553129784, "step": 2464 }, { "epoch": 29.0, "grad_norm": 6.6439738273620605, "learning_rate": 9.613861386138615e-06, "loss": 0.22, "step": 2552 }, { "epoch": 29.0, "eval_rundkast_loss": 0.5526180267333984, "eval_rundkast_runtime": 31.4809, "eval_rundkast_samples_per_second": 42.534, "eval_rundkast_steps_per_second": 1.334, "eval_rundkast_wer": 0.19996800511918092, "step": 2552 }, { "epoch": 29.0, "eval_nb_samtale_loss": 0.4727042317390442, "eval_nb_samtale_runtime": 38.2477, "eval_nb_samtale_samples_per_second": 13.935, "eval_nb_samtale_steps_per_second": 0.444, "eval_nb_samtale_wer": 0.15364583333333334, "step": 2552 }, { "epoch": 29.0, "eval_bigbrother_loss": 2.432448387145996, "eval_bigbrother_runtime": 45.1692, "eval_bigbrother_samples_per_second": 30.33, "eval_bigbrother_steps_per_second": 0.952, "eval_bigbrother_wer": 0.5283976476274873, "step": 2552 }, { "epoch": 30.0, "grad_norm": 6.641559600830078, "learning_rate": 8.742574257425743e-06, "loss": 0.2142, "step": 2640 }, { "epoch": 30.0, "eval_rundkast_loss": 0.5641056299209595, "eval_rundkast_runtime": 31.6944, "eval_rundkast_samples_per_second": 42.247, "eval_rundkast_steps_per_second": 1.325, "eval_rundkast_wer": 0.19580867061270196, "step": 2640 }, { "epoch": 30.0, "eval_nb_samtale_loss": 0.48357564210891724, "eval_nb_samtale_runtime": 38.4852, "eval_nb_samtale_samples_per_second": 13.849, "eval_nb_samtale_steps_per_second": 0.442, "eval_nb_samtale_wer": 0.14640299479166666, "step": 2640 }, { "epoch": 30.0, "eval_bigbrother_loss": 2.3856699466705322, "eval_bigbrother_runtime": 44.9444, "eval_bigbrother_samples_per_second": 30.482, "eval_bigbrother_steps_per_second": 0.957, "eval_bigbrother_wer": 0.52090550229598, "step": 2640 }, { "epoch": 31.0, "grad_norm": 5.838632106781006, "learning_rate": 7.871287128712872e-06, "loss": 0.1948, "step": 2728 }, { "epoch": 31.0, "eval_rundkast_loss": 0.5922185778617859, "eval_rundkast_runtime": 31.5341, "eval_rundkast_samples_per_second": 42.462, "eval_rundkast_steps_per_second": 1.332, "eval_rundkast_wer": 0.19708846584546472, "step": 2728 }, { "epoch": 31.0, "eval_nb_samtale_loss": 0.5342143774032593, "eval_nb_samtale_runtime": 38.0861, "eval_nb_samtale_samples_per_second": 13.995, "eval_nb_samtale_steps_per_second": 0.446, "eval_nb_samtale_wer": 0.14860026041666666, "step": 2728 }, { "epoch": 31.0, "eval_bigbrother_loss": 2.5876622200012207, "eval_bigbrother_runtime": 44.9279, "eval_bigbrother_samples_per_second": 30.493, "eval_bigbrother_steps_per_second": 0.957, "eval_bigbrother_wer": 0.5268669942801901, "step": 2728 }, { "epoch": 32.0, "grad_norm": 7.094357967376709, "learning_rate": 7e-06, "loss": 0.1949, "step": 2816 }, { "epoch": 32.0, "eval_rundkast_loss": 0.5746641159057617, "eval_rundkast_runtime": 31.5695, "eval_rundkast_samples_per_second": 42.414, "eval_rundkast_steps_per_second": 1.33, "eval_rundkast_wer": 0.19524876019836826, "step": 2816 }, { "epoch": 32.0, "eval_nb_samtale_loss": 0.5246254801750183, "eval_nb_samtale_runtime": 38.4186, "eval_nb_samtale_samples_per_second": 13.873, "eval_nb_samtale_steps_per_second": 0.442, "eval_nb_samtale_wer": 0.15120442708333334, "step": 2816 }, { "epoch": 32.0, "eval_bigbrother_loss": 2.5409083366394043, "eval_bigbrother_runtime": 45.1035, "eval_bigbrother_samples_per_second": 30.375, "eval_bigbrother_steps_per_second": 0.953, "eval_bigbrother_wer": 0.5232417626681705, "step": 2816 }, { "epoch": 33.0, "grad_norm": 3.003549098968506, "learning_rate": 6.128712871287129e-06, "loss": 0.204, "step": 2904 }, { "epoch": 33.0, "eval_rundkast_loss": 0.5838789939880371, "eval_rundkast_runtime": 31.6764, "eval_rundkast_samples_per_second": 42.271, "eval_rundkast_steps_per_second": 1.326, "eval_rundkast_wer": 0.19460886258198687, "step": 2904 }, { "epoch": 33.0, "eval_nb_samtale_loss": 0.5083252787590027, "eval_nb_samtale_runtime": 38.236, "eval_nb_samtale_samples_per_second": 13.94, "eval_nb_samtale_steps_per_second": 0.445, "eval_nb_samtale_wer": 0.14876302083333334, "step": 2904 }, { "epoch": 33.0, "eval_bigbrother_loss": 2.4765820503234863, "eval_bigbrother_runtime": 45.0387, "eval_bigbrother_samples_per_second": 30.418, "eval_bigbrother_steps_per_second": 0.955, "eval_bigbrother_wer": 0.5217111093208733, "step": 2904 }, { "epoch": 34.0, "grad_norm": 13.520666122436523, "learning_rate": 5.257425742574258e-06, "loss": 0.1946, "step": 2992 }, { "epoch": 34.0, "eval_rundkast_loss": 0.5890854597091675, "eval_rundkast_runtime": 32.1786, "eval_rundkast_samples_per_second": 41.611, "eval_rundkast_steps_per_second": 1.305, "eval_rundkast_wer": 0.19380899056151016, "step": 2992 }, { "epoch": 34.0, "eval_nb_samtale_loss": 0.5050138235092163, "eval_nb_samtale_runtime": 38.4424, "eval_nb_samtale_samples_per_second": 13.865, "eval_nb_samtale_steps_per_second": 0.442, "eval_nb_samtale_wer": 0.14876302083333334, "step": 2992 }, { "epoch": 34.0, "eval_bigbrother_loss": 2.5397651195526123, "eval_bigbrother_runtime": 46.0852, "eval_bigbrother_samples_per_second": 29.728, "eval_bigbrother_steps_per_second": 0.933, "eval_bigbrother_wer": 0.5208249415934907, "step": 2992 }, { "epoch": 35.0, "grad_norm": 13.422295570373535, "learning_rate": 4.386138613861386e-06, "loss": 0.1953, "step": 3080 }, { "epoch": 35.0, "eval_rundkast_loss": 0.5813275575637817, "eval_rundkast_runtime": 31.8014, "eval_rundkast_samples_per_second": 42.105, "eval_rundkast_steps_per_second": 1.321, "eval_rundkast_wer": 0.19404895216765317, "step": 3080 }, { "epoch": 35.0, "eval_nb_samtale_loss": 0.5057322382926941, "eval_nb_samtale_runtime": 38.3631, "eval_nb_samtale_samples_per_second": 13.894, "eval_nb_samtale_steps_per_second": 0.443, "eval_nb_samtale_wer": 0.14925130208333334, "step": 3080 }, { "epoch": 35.0, "eval_bigbrother_loss": 2.4785802364349365, "eval_bigbrother_runtime": 45.4371, "eval_bigbrother_samples_per_second": 30.152, "eval_bigbrother_steps_per_second": 0.946, "eval_bigbrother_wer": 0.5193748489486828, "step": 3080 }, { "epoch": 36.0, "grad_norm": 5.827705383300781, "learning_rate": 3.514851485148515e-06, "loss": 0.1873, "step": 3168 }, { "epoch": 36.0, "eval_rundkast_loss": 0.5837633609771729, "eval_rundkast_runtime": 31.7208, "eval_rundkast_samples_per_second": 42.212, "eval_rundkast_steps_per_second": 1.324, "eval_rundkast_wer": 0.19444888817789155, "step": 3168 }, { "epoch": 36.0, "eval_nb_samtale_loss": 0.5117051005363464, "eval_nb_samtale_runtime": 38.4155, "eval_nb_samtale_samples_per_second": 13.875, "eval_nb_samtale_steps_per_second": 0.443, "eval_nb_samtale_wer": 0.147216796875, "step": 3168 }, { "epoch": 36.0, "eval_bigbrother_loss": 2.5473718643188477, "eval_bigbrother_runtime": 45.3311, "eval_bigbrother_samples_per_second": 30.222, "eval_bigbrother_steps_per_second": 0.949, "eval_bigbrother_wer": 0.5215499879158946, "step": 3168 }, { "epoch": 37.0, "grad_norm": 3.566361427307129, "learning_rate": 2.6435643564356437e-06, "loss": 0.1791, "step": 3256 }, { "epoch": 37.0, "eval_rundkast_loss": 0.6002511382102966, "eval_rundkast_runtime": 31.7763, "eval_rundkast_samples_per_second": 42.138, "eval_rundkast_steps_per_second": 1.322, "eval_rundkast_wer": 0.19588865781474965, "step": 3256 }, { "epoch": 37.0, "eval_nb_samtale_loss": 0.5211741328239441, "eval_nb_samtale_runtime": 38.5386, "eval_nb_samtale_samples_per_second": 13.83, "eval_nb_samtale_steps_per_second": 0.441, "eval_nb_samtale_wer": 0.14713541666666666, "step": 3256 }, { "epoch": 37.0, "eval_bigbrother_loss": 2.629565715789795, "eval_bigbrother_runtime": 45.36, "eval_bigbrother_samples_per_second": 30.203, "eval_bigbrother_steps_per_second": 0.948, "eval_bigbrother_wer": 0.5238056875855958, "step": 3256 }, { "epoch": 38.0, "grad_norm": 6.092939376831055, "learning_rate": 1.7722772277227724e-06, "loss": 0.193, "step": 3344 }, { "epoch": 38.0, "eval_rundkast_loss": 0.595504641532898, "eval_rundkast_runtime": 31.8783, "eval_rundkast_samples_per_second": 42.004, "eval_rundkast_steps_per_second": 1.318, "eval_rundkast_wer": 0.19356902895536715, "step": 3344 }, { "epoch": 38.0, "eval_nb_samtale_loss": 0.5151902437210083, "eval_nb_samtale_runtime": 38.9536, "eval_nb_samtale_samples_per_second": 13.683, "eval_nb_samtale_steps_per_second": 0.436, "eval_nb_samtale_wer": 0.14737955729166666, "step": 3344 }, { "epoch": 38.0, "eval_bigbrother_loss": 2.59112548828125, "eval_bigbrother_runtime": 45.3015, "eval_bigbrother_samples_per_second": 30.242, "eval_bigbrother_steps_per_second": 0.949, "eval_bigbrother_wer": 0.5234028840731492, "step": 3344 }, { "epoch": 39.0, "grad_norm": 4.503037452697754, "learning_rate": 9.00990099009901e-07, "loss": 0.1767, "step": 3432 }, { "epoch": 39.0, "eval_rundkast_loss": 0.5997776389122009, "eval_rundkast_runtime": 31.7079, "eval_rundkast_samples_per_second": 42.229, "eval_rundkast_steps_per_second": 1.325, "eval_rundkast_wer": 0.1945288753799392, "step": 3432 }, { "epoch": 39.0, "eval_nb_samtale_loss": 0.5143499970436096, "eval_nb_samtale_runtime": 38.5399, "eval_nb_samtale_samples_per_second": 13.83, "eval_nb_samtale_steps_per_second": 0.441, "eval_nb_samtale_wer": 0.14607747395833334, "step": 3432 }, { "epoch": 39.0, "eval_bigbrother_loss": 2.604764938354492, "eval_bigbrother_runtime": 45.3914, "eval_bigbrother_samples_per_second": 30.182, "eval_bigbrother_steps_per_second": 0.947, "eval_bigbrother_wer": 0.5224361556432772, "step": 3432 }, { "epoch": 40.0, "grad_norm": 5.29674768447876, "learning_rate": 2.9702970297029707e-08, "loss": 0.1726, "step": 3520 }, { "epoch": 40.0, "eval_rundkast_loss": 0.6034849286079407, "eval_rundkast_runtime": 31.8224, "eval_rundkast_samples_per_second": 42.077, "eval_rundkast_steps_per_second": 1.32, "eval_rundkast_wer": 0.19476883698608222, "step": 3520 }, { "epoch": 40.0, "eval_nb_samtale_loss": 0.5175977945327759, "eval_nb_samtale_runtime": 38.5824, "eval_nb_samtale_samples_per_second": 13.815, "eval_nb_samtale_steps_per_second": 0.441, "eval_nb_samtale_wer": 0.146484375, "step": 3520 }, { "epoch": 40.0, "eval_bigbrother_loss": 2.614839553833008, "eval_bigbrother_runtime": 45.4875, "eval_bigbrother_samples_per_second": 30.118, "eval_bigbrother_steps_per_second": 0.945, "eval_bigbrother_wer": 0.5227583984532345, "step": 3520 } ], "logging_steps": 500, "max_steps": 3520, "num_input_tokens_seen": 0, "num_train_epochs": 40, "save_steps": 500, "total_flos": 1.468412648283622e+20, "train_batch_size": 48, "trial_name": null, "trial_params": null }