{ "best_metric": 0.2430986748380507, "best_model_checkpoint": "/cluster/home/torstefl/Master/saved_model/W2V/Combined/BB-NB-RUND/30.05/checkpoint-65754", "epoch": 40.0, "eval_steps": 500, "global_step": 67440, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "grad_norm": 81.12491607666016, "learning_rate": 9.972247497725206e-05, "loss": 0.8557, "step": 1686 }, { "epoch": 1.0, "eval_bigbrother_loss": 1.6390442848205566, "eval_bigbrother_runtime": 54.9493, "eval_bigbrother_samples_per_second": 24.932, "eval_bigbrother_steps_per_second": 0.783, "eval_bigbrother_wer": 0.6789656005800371, "step": 1686 }, { "epoch": 1.0, "eval_BB_NB_RUND_loss": 0.960404634475708, "eval_BB_NB_RUND_runtime": 215.4543, "eval_BB_NB_RUND_samples_per_second": 15.047, "eval_BB_NB_RUND_steps_per_second": 0.473, "eval_BB_NB_RUND_wer": 0.42735800876273417, "step": 1686 }, { "epoch": 1.0, "eval_rundkast_loss": 0.3885672688484192, "eval_rundkast_runtime": 39.7428, "eval_rundkast_samples_per_second": 33.692, "eval_rundkast_steps_per_second": 1.057, "eval_rundkast_wer": 0.26931690929451285, "step": 1686 }, { "epoch": 1.0, "eval_nb_samtale_loss": 0.6525214910507202, "eval_nb_samtale_runtime": 47.5144, "eval_nb_samtale_samples_per_second": 11.218, "eval_nb_samtale_steps_per_second": 0.358, "eval_nb_samtale_wer": 0.3343098958333333, "step": 1686 }, { "epoch": 2.0, "grad_norm": 55.65499496459961, "learning_rate": 9.71656050955414e-05, "loss": 0.8819, "step": 3372 }, { "epoch": 2.0, "eval_bigbrother_loss": 1.5301967859268188, "eval_bigbrother_runtime": 55.6705, "eval_bigbrother_samples_per_second": 24.609, "eval_bigbrother_steps_per_second": 0.772, "eval_bigbrother_wer": 0.6032385402400708, "step": 3372 }, { "epoch": 2.0, "eval_BB_NB_RUND_loss": 0.8895238637924194, "eval_BB_NB_RUND_runtime": 216.0717, "eval_BB_NB_RUND_samples_per_second": 15.004, "eval_BB_NB_RUND_steps_per_second": 0.472, "eval_BB_NB_RUND_wer": 0.3907211783995914, "step": 3372 }, { "epoch": 2.0, "eval_rundkast_loss": 0.3464510142803192, "eval_rundkast_runtime": 39.915, "eval_rundkast_samples_per_second": 33.546, "eval_rundkast_steps_per_second": 1.052, "eval_rundkast_wer": 0.2510798272276436, "step": 3372 }, { "epoch": 2.0, "eval_nb_samtale_loss": 0.6075140237808228, "eval_nb_samtale_runtime": 47.9711, "eval_nb_samtale_samples_per_second": 11.111, "eval_nb_samtale_steps_per_second": 0.354, "eval_nb_samtale_wer": 0.3182779947916667, "step": 3372 }, { "epoch": 3.0, "grad_norm": 29.089189529418945, "learning_rate": 9.461025174400972e-05, "loss": 0.8064, "step": 5058 }, { "epoch": 3.0, "eval_bigbrother_loss": 1.5702797174453735, "eval_bigbrother_runtime": 55.4022, "eval_bigbrother_samples_per_second": 24.728, "eval_bigbrother_steps_per_second": 0.776, "eval_bigbrother_wer": 0.6068637718520905, "step": 5058 }, { "epoch": 3.0, "eval_BB_NB_RUND_loss": 0.8996490240097046, "eval_BB_NB_RUND_runtime": 238.1867, "eval_BB_NB_RUND_samples_per_second": 13.611, "eval_BB_NB_RUND_steps_per_second": 0.428, "eval_BB_NB_RUND_wer": 0.3820659624223853, "step": 5058 }, { "epoch": 3.0, "eval_rundkast_loss": 0.3366275429725647, "eval_rundkast_runtime": 39.8274, "eval_rundkast_samples_per_second": 33.62, "eval_rundkast_steps_per_second": 1.055, "eval_rundkast_wer": 0.23484242521196608, "step": 5058 }, { "epoch": 3.0, "eval_nb_samtale_loss": 0.59026038646698, "eval_nb_samtale_runtime": 47.7348, "eval_nb_samtale_samples_per_second": 11.166, "eval_nb_samtale_steps_per_second": 0.356, "eval_nb_samtale_wer": 0.3050944010416667, "step": 5058 }, { "epoch": 4.0, "grad_norm": 12.38161563873291, "learning_rate": 9.205338186229906e-05, "loss": 0.7614, "step": 6744 }, { "epoch": 4.0, "eval_bigbrother_loss": 1.5530073642730713, "eval_bigbrother_runtime": 55.7815, "eval_bigbrother_samples_per_second": 24.56, "eval_bigbrother_steps_per_second": 0.771, "eval_bigbrother_wer": 0.5924434061065013, "step": 6744 }, { "epoch": 4.0, "eval_BB_NB_RUND_loss": 0.891120970249176, "eval_BB_NB_RUND_runtime": 215.5766, "eval_BB_NB_RUND_samples_per_second": 15.039, "eval_BB_NB_RUND_steps_per_second": 0.473, "eval_BB_NB_RUND_wer": 0.37961992312447923, "step": 6744 }, { "epoch": 4.0, "eval_rundkast_loss": 0.3337271213531494, "eval_rundkast_runtime": 39.7645, "eval_rundkast_samples_per_second": 33.673, "eval_rundkast_steps_per_second": 1.056, "eval_rundkast_wer": 0.2345224764037754, "step": 6744 }, { "epoch": 4.0, "eval_nb_samtale_loss": 0.5904266238212585, "eval_nb_samtale_runtime": 47.79, "eval_nb_samtale_samples_per_second": 11.153, "eval_nb_samtale_steps_per_second": 0.356, "eval_nb_samtale_wer": 0.3128255208333333, "step": 6744 }, { "epoch": 5.0, "grad_norm": 9.62388801574707, "learning_rate": 8.949802851076737e-05, "loss": 0.716, "step": 8430 }, { "epoch": 5.0, "eval_bigbrother_loss": 1.3175848722457886, "eval_bigbrother_runtime": 56.2695, "eval_bigbrother_samples_per_second": 24.347, "eval_bigbrother_steps_per_second": 0.764, "eval_bigbrother_wer": 0.5748006122613389, "step": 8430 }, { "epoch": 5.0, "eval_BB_NB_RUND_loss": 0.7703477144241333, "eval_BB_NB_RUND_runtime": 213.244, "eval_BB_NB_RUND_samples_per_second": 15.203, "eval_BB_NB_RUND_steps_per_second": 0.478, "eval_BB_NB_RUND_wer": 0.3668521355804639, "step": 8430 }, { "epoch": 5.0, "eval_rundkast_loss": 0.30976158380508423, "eval_rundkast_runtime": 39.6119, "eval_rundkast_samples_per_second": 33.803, "eval_rundkast_steps_per_second": 1.06, "eval_rundkast_wer": 0.2258038713805791, "step": 8430 }, { "epoch": 5.0, "eval_nb_samtale_loss": 0.520818829536438, "eval_nb_samtale_runtime": 47.528, "eval_nb_samtale_samples_per_second": 11.214, "eval_nb_samtale_steps_per_second": 0.358, "eval_nb_samtale_wer": 0.3003743489583333, "step": 8430 }, { "epoch": 6.0, "grad_norm": 24.378128051757812, "learning_rate": 8.694267515923567e-05, "loss": 0.6852, "step": 10116 }, { "epoch": 6.0, "eval_bigbrother_loss": 1.3726727962493896, "eval_bigbrother_runtime": 56.2024, "eval_bigbrother_samples_per_second": 24.376, "eval_bigbrother_steps_per_second": 0.765, "eval_bigbrother_wer": 0.5383066140336744, "step": 10116 }, { "epoch": 6.0, "eval_BB_NB_RUND_loss": 0.798953115940094, "eval_BB_NB_RUND_runtime": 235.4413, "eval_BB_NB_RUND_samples_per_second": 13.77, "eval_BB_NB_RUND_steps_per_second": 0.433, "eval_BB_NB_RUND_wer": 0.3504556084186759, "step": 10116 }, { "epoch": 6.0, "eval_rundkast_loss": 0.30640244483947754, "eval_rundkast_runtime": 39.638, "eval_rundkast_samples_per_second": 33.781, "eval_rundkast_steps_per_second": 1.06, "eval_rundkast_wer": 0.22228443449048152, "step": 10116 }, { "epoch": 6.0, "eval_nb_samtale_loss": 0.5616967082023621, "eval_nb_samtale_runtime": 47.4044, "eval_nb_samtale_samples_per_second": 11.244, "eval_nb_samtale_steps_per_second": 0.359, "eval_nb_samtale_wer": 0.2908528645833333, "step": 10116 }, { "epoch": 7.0, "grad_norm": 17.646387100219727, "learning_rate": 8.438580527752503e-05, "loss": 0.65, "step": 11802 }, { "epoch": 7.0, "eval_bigbrother_loss": 1.296665906906128, "eval_bigbrother_runtime": 56.8276, "eval_bigbrother_samples_per_second": 24.108, "eval_bigbrother_steps_per_second": 0.757, "eval_bigbrother_wer": 0.5387899782486103, "step": 11802 }, { "epoch": 7.0, "eval_BB_NB_RUND_loss": 0.7510452270507812, "eval_BB_NB_RUND_runtime": 219.1946, "eval_BB_NB_RUND_samples_per_second": 14.791, "eval_BB_NB_RUND_steps_per_second": 0.465, "eval_BB_NB_RUND_wer": 0.3475526167244577, "step": 11802 }, { "epoch": 7.0, "eval_rundkast_loss": 0.2876454293727875, "eval_rundkast_runtime": 39.7396, "eval_rundkast_samples_per_second": 33.694, "eval_rundkast_steps_per_second": 1.057, "eval_rundkast_wer": 0.2191649336106223, "step": 11802 }, { "epoch": 7.0, "eval_nb_samtale_loss": 0.5133534073829651, "eval_nb_samtale_runtime": 47.6414, "eval_nb_samtale_samples_per_second": 11.188, "eval_nb_samtale_steps_per_second": 0.357, "eval_nb_samtale_wer": 0.2849934895833333, "step": 11802 }, { "epoch": 8.0, "grad_norm": 9.183784484863281, "learning_rate": 8.183045192599334e-05, "loss": 0.6195, "step": 13488 }, { "epoch": 8.0, "eval_bigbrother_loss": 1.3931747674942017, "eval_bigbrother_runtime": 55.455, "eval_bigbrother_samples_per_second": 24.705, "eval_bigbrother_steps_per_second": 0.775, "eval_bigbrother_wer": 0.5308950294046564, "step": 13488 }, { "epoch": 8.0, "eval_BB_NB_RUND_loss": 0.8028880953788757, "eval_BB_NB_RUND_runtime": 174.7359, "eval_BB_NB_RUND_samples_per_second": 18.554, "eval_BB_NB_RUND_steps_per_second": 0.584, "eval_BB_NB_RUND_wer": 0.34357444292126976, "step": 13488 }, { "epoch": 8.0, "eval_rundkast_loss": 0.31355729699134827, "eval_rundkast_runtime": 39.8585, "eval_rundkast_samples_per_second": 33.594, "eval_rundkast_steps_per_second": 1.054, "eval_rundkast_wer": 0.21404575267957127, "step": 13488 }, { "epoch": 8.0, "eval_nb_samtale_loss": 0.5146628618240356, "eval_nb_samtale_runtime": 47.9963, "eval_nb_samtale_samples_per_second": 11.105, "eval_nb_samtale_steps_per_second": 0.354, "eval_nb_samtale_wer": 0.2861328125, "step": 13488 }, { "epoch": 9.0, "grad_norm": 9.670160293579102, "learning_rate": 7.92735820442827e-05, "loss": 0.592, "step": 15174 }, { "epoch": 9.0, "eval_bigbrother_loss": 1.3019070625305176, "eval_bigbrother_runtime": 55.2104, "eval_bigbrother_samples_per_second": 24.814, "eval_bigbrother_steps_per_second": 0.779, "eval_bigbrother_wer": 0.5215499879158946, "step": 15174 }, { "epoch": 9.0, "eval_BB_NB_RUND_loss": 0.7444170117378235, "eval_BB_NB_RUND_runtime": 237.2263, "eval_BB_NB_RUND_samples_per_second": 13.666, "eval_BB_NB_RUND_steps_per_second": 0.43, "eval_BB_NB_RUND_wer": 0.3310485713517727, "step": 15174 }, { "epoch": 9.0, "eval_rundkast_loss": 0.2764076590538025, "eval_rundkast_runtime": 40.1719, "eval_rundkast_samples_per_second": 33.332, "eval_rundkast_steps_per_second": 1.046, "eval_rundkast_wer": 0.19956806910894256, "step": 15174 }, { "epoch": 9.0, "eval_nb_samtale_loss": 0.4871513545513153, "eval_nb_samtale_runtime": 47.9822, "eval_nb_samtale_samples_per_second": 11.108, "eval_nb_samtale_steps_per_second": 0.354, "eval_nb_samtale_wer": 0.2718098958333333, "step": 15174 }, { "epoch": 10.0, "grad_norm": 6.870215892791748, "learning_rate": 7.671671216257204e-05, "loss": 0.5668, "step": 16860 }, { "epoch": 10.0, "eval_bigbrother_loss": 1.418025255203247, "eval_bigbrother_runtime": 56.4643, "eval_bigbrother_samples_per_second": 24.263, "eval_bigbrother_steps_per_second": 0.762, "eval_bigbrother_wer": 0.5194554096511722, "step": 16860 }, { "epoch": 10.0, "eval_BB_NB_RUND_loss": 0.814452052116394, "eval_BB_NB_RUND_runtime": 187.2873, "eval_BB_NB_RUND_samples_per_second": 17.31, "eval_BB_NB_RUND_steps_per_second": 0.545, "eval_BB_NB_RUND_wer": 0.32844125473752117, "step": 16860 }, { "epoch": 10.0, "eval_rundkast_loss": 0.3035307824611664, "eval_rundkast_runtime": 39.9861, "eval_rundkast_samples_per_second": 33.487, "eval_rundkast_steps_per_second": 1.05, "eval_rundkast_wer": 0.19844824828027516, "step": 16860 }, { "epoch": 10.0, "eval_nb_samtale_loss": 0.5466247200965881, "eval_nb_samtale_runtime": 47.5084, "eval_nb_samtale_samples_per_second": 11.219, "eval_nb_samtale_steps_per_second": 0.358, "eval_nb_samtale_wer": 0.267333984375, "step": 16860 }, { "epoch": 11.0, "grad_norm": 5.365777015686035, "learning_rate": 7.41628753412193e-05, "loss": 0.5501, "step": 18546 }, { "epoch": 11.0, "eval_bigbrother_loss": 1.413320779800415, "eval_bigbrother_runtime": 56.7058, "eval_bigbrother_samples_per_second": 24.16, "eval_bigbrother_steps_per_second": 0.758, "eval_bigbrother_wer": 0.5231612019656812, "step": 18546 }, { "epoch": 11.0, "eval_BB_NB_RUND_loss": 0.8070511817932129, "eval_BB_NB_RUND_runtime": 186.3465, "eval_BB_NB_RUND_samples_per_second": 17.398, "eval_BB_NB_RUND_steps_per_second": 0.547, "eval_BB_NB_RUND_wer": 0.32887132758110904, "step": 18546 }, { "epoch": 11.0, "eval_rundkast_loss": 0.30373072624206543, "eval_rundkast_runtime": 40.0188, "eval_rundkast_samples_per_second": 33.459, "eval_rundkast_steps_per_second": 1.05, "eval_rundkast_wer": 0.19588865781474965, "step": 18546 }, { "epoch": 11.0, "eval_nb_samtale_loss": 0.5129746198654175, "eval_nb_samtale_runtime": 47.3772, "eval_nb_samtale_samples_per_second": 11.25, "eval_nb_samtale_steps_per_second": 0.359, "eval_nb_samtale_wer": 0.2676595052083333, "step": 18546 }, { "epoch": 12.0, "grad_norm": 13.1134033203125, "learning_rate": 7.160600545950865e-05, "loss": 0.5307, "step": 20232 }, { "epoch": 12.0, "eval_bigbrother_loss": 1.269589900970459, "eval_bigbrother_runtime": 54.8931, "eval_bigbrother_samples_per_second": 24.958, "eval_bigbrother_steps_per_second": 0.783, "eval_bigbrother_wer": 0.49617336663175704, "step": 20232 }, { "epoch": 12.0, "eval_BB_NB_RUND_loss": 0.7405148148536682, "eval_BB_NB_RUND_runtime": 189.7158, "eval_BB_NB_RUND_samples_per_second": 17.089, "eval_BB_NB_RUND_steps_per_second": 0.538, "eval_BB_NB_RUND_wer": 0.31540467166626346, "step": 20232 }, { "epoch": 12.0, "eval_rundkast_loss": 0.2901303768157959, "eval_rundkast_runtime": 39.9118, "eval_rundkast_samples_per_second": 33.549, "eval_rundkast_steps_per_second": 1.052, "eval_rundkast_wer": 0.19612861942089266, "step": 20232 }, { "epoch": 12.0, "eval_nb_samtale_loss": 0.5120977759361267, "eval_nb_samtale_runtime": 47.5553, "eval_nb_samtale_samples_per_second": 11.208, "eval_nb_samtale_steps_per_second": 0.357, "eval_nb_samtale_wer": 0.2537434895833333, "step": 20232 }, { "epoch": 13.0, "grad_norm": 5.697801113128662, "learning_rate": 6.9049135577798e-05, "loss": 0.5134, "step": 21918 }, { "epoch": 13.0, "eval_bigbrother_loss": 1.347646951675415, "eval_bigbrother_runtime": 55.3541, "eval_bigbrother_samples_per_second": 24.75, "eval_bigbrother_steps_per_second": 0.777, "eval_bigbrother_wer": 0.4957705631193104, "step": 21918 }, { "epoch": 13.0, "eval_BB_NB_RUND_loss": 0.7735500335693359, "eval_BB_NB_RUND_runtime": 187.3035, "eval_BB_NB_RUND_samples_per_second": 17.309, "eval_BB_NB_RUND_steps_per_second": 0.545, "eval_BB_NB_RUND_wer": 0.3093030131978604, "step": 21918 }, { "epoch": 13.0, "eval_rundkast_loss": 0.29282376170158386, "eval_rundkast_runtime": 39.9603, "eval_rundkast_samples_per_second": 33.508, "eval_rundkast_steps_per_second": 1.051, "eval_rundkast_wer": 0.18285074388097905, "step": 21918 }, { "epoch": 13.0, "eval_nb_samtale_loss": 0.5057567954063416, "eval_nb_samtale_runtime": 47.9932, "eval_nb_samtale_samples_per_second": 11.106, "eval_nb_samtale_steps_per_second": 0.354, "eval_nb_samtale_wer": 0.24934895833333334, "step": 21918 }, { "epoch": 14.0, "grad_norm": 8.790960311889648, "learning_rate": 6.64937822262663e-05, "loss": 0.4883, "step": 23604 }, { "epoch": 14.0, "eval_bigbrother_loss": 1.3468968868255615, "eval_bigbrother_runtime": 54.8463, "eval_bigbrother_samples_per_second": 24.979, "eval_bigbrother_steps_per_second": 0.784, "eval_bigbrother_wer": 0.48843953919278177, "step": 23604 }, { "epoch": 14.0, "eval_BB_NB_RUND_loss": 0.7681761384010315, "eval_BB_NB_RUND_runtime": 174.885, "eval_BB_NB_RUND_samples_per_second": 18.538, "eval_BB_NB_RUND_steps_per_second": 0.583, "eval_BB_NB_RUND_wer": 0.3044646937074967, "step": 23604 }, { "epoch": 14.0, "eval_rundkast_loss": 0.27578702569007874, "eval_rundkast_runtime": 39.9056, "eval_rundkast_samples_per_second": 33.554, "eval_rundkast_steps_per_second": 1.052, "eval_rundkast_wer": 0.17957126859702446, "step": 23604 }, { "epoch": 14.0, "eval_nb_samtale_loss": 0.5177371501922607, "eval_nb_samtale_runtime": 47.3502, "eval_nb_samtale_samples_per_second": 11.257, "eval_nb_samtale_steps_per_second": 0.359, "eval_nb_samtale_wer": 0.2451171875, "step": 23604 }, { "epoch": 15.0, "grad_norm": 10.714680671691895, "learning_rate": 6.393842887473462e-05, "loss": 0.4689, "step": 25290 }, { "epoch": 15.0, "eval_bigbrother_loss": 1.3112008571624756, "eval_bigbrother_runtime": 54.8505, "eval_bigbrother_samples_per_second": 24.977, "eval_bigbrother_steps_per_second": 0.784, "eval_bigbrother_wer": 0.49093692096995084, "step": 25290 }, { "epoch": 15.0, "eval_BB_NB_RUND_loss": 0.7539634704589844, "eval_BB_NB_RUND_runtime": 188.0576, "eval_BB_NB_RUND_samples_per_second": 17.239, "eval_BB_NB_RUND_steps_per_second": 0.542, "eval_BB_NB_RUND_wer": 0.30505604386743007, "step": 25290 }, { "epoch": 15.0, "eval_rundkast_loss": 0.28489232063293457, "eval_rundkast_runtime": 40.0722, "eval_rundkast_samples_per_second": 33.415, "eval_rundkast_steps_per_second": 1.048, "eval_rundkast_wer": 0.17997120460726285, "step": 25290 }, { "epoch": 15.0, "eval_nb_samtale_loss": 0.4998992383480072, "eval_nb_samtale_runtime": 47.6004, "eval_nb_samtale_samples_per_second": 11.197, "eval_nb_samtale_steps_per_second": 0.357, "eval_nb_samtale_wer": 0.24503580729166666, "step": 25290 }, { "epoch": 16.0, "grad_norm": 5.148988246917725, "learning_rate": 6.138459205338186e-05, "loss": 0.4555, "step": 26976 }, { "epoch": 16.0, "eval_bigbrother_loss": 1.3192588090896606, "eval_bigbrother_runtime": 54.8083, "eval_bigbrother_samples_per_second": 24.996, "eval_bigbrother_steps_per_second": 0.785, "eval_bigbrother_wer": 0.475388705389511, "step": 26976 }, { "epoch": 16.0, "eval_BB_NB_RUND_loss": 0.7727116942405701, "eval_BB_NB_RUND_runtime": 175.6567, "eval_BB_NB_RUND_samples_per_second": 18.456, "eval_BB_NB_RUND_steps_per_second": 0.581, "eval_BB_NB_RUND_wer": 0.2980404806064027, "step": 26976 }, { "epoch": 16.0, "eval_rundkast_loss": 0.30636081099510193, "eval_rundkast_runtime": 40.0387, "eval_rundkast_samples_per_second": 33.443, "eval_rundkast_steps_per_second": 1.049, "eval_rundkast_wer": 0.17501199808030715, "step": 26976 }, { "epoch": 16.0, "eval_nb_samtale_loss": 0.5385606288909912, "eval_nb_samtale_runtime": 47.4641, "eval_nb_samtale_samples_per_second": 11.23, "eval_nb_samtale_steps_per_second": 0.358, "eval_nb_samtale_wer": 0.24462890625, "step": 26976 }, { "epoch": 17.0, "grad_norm": 7.1762614250183105, "learning_rate": 5.8827722171671216e-05, "loss": 0.4414, "step": 28662 }, { "epoch": 17.0, "eval_bigbrother_loss": 1.3271602392196655, "eval_bigbrother_runtime": 55.1307, "eval_bigbrother_samples_per_second": 24.85, "eval_bigbrother_steps_per_second": 0.78, "eval_bigbrother_wer": 0.4732135664222992, "step": 28662 }, { "epoch": 17.0, "eval_BB_NB_RUND_loss": 0.7706267237663269, "eval_BB_NB_RUND_runtime": 186.2927, "eval_BB_NB_RUND_samples_per_second": 17.403, "eval_BB_NB_RUND_steps_per_second": 0.548, "eval_BB_NB_RUND_wer": 0.2966427438647421, "step": 28662 }, { "epoch": 17.0, "eval_rundkast_loss": 0.29671627283096313, "eval_rundkast_runtime": 39.937, "eval_rundkast_samples_per_second": 33.528, "eval_rundkast_steps_per_second": 1.052, "eval_rundkast_wer": 0.17677171652535595, "step": 28662 }, { "epoch": 17.0, "eval_nb_samtale_loss": 0.5305598378181458, "eval_nb_samtale_runtime": 47.5425, "eval_nb_samtale_samples_per_second": 11.211, "eval_nb_samtale_steps_per_second": 0.358, "eval_nb_samtale_wer": 0.24007161458333334, "step": 28662 }, { "epoch": 18.0, "grad_norm": 7.369349956512451, "learning_rate": 5.627085228996057e-05, "loss": 0.4215, "step": 30348 }, { "epoch": 18.0, "eval_bigbrother_loss": 1.396024465560913, "eval_bigbrother_runtime": 54.7768, "eval_bigbrother_samples_per_second": 25.011, "eval_bigbrother_steps_per_second": 0.785, "eval_bigbrother_wer": 0.47377749133972447, "step": 30348 }, { "epoch": 18.0, "eval_BB_NB_RUND_loss": 0.8181838393211365, "eval_BB_NB_RUND_runtime": 176.3618, "eval_BB_NB_RUND_samples_per_second": 18.383, "eval_BB_NB_RUND_steps_per_second": 0.578, "eval_BB_NB_RUND_wer": 0.2952450071230815, "step": 30348 }, { "epoch": 18.0, "eval_rundkast_loss": 0.3431045413017273, "eval_rundkast_runtime": 40.0058, "eval_rundkast_samples_per_second": 33.47, "eval_rundkast_steps_per_second": 1.05, "eval_rundkast_wer": 0.17389217725163975, "step": 30348 }, { "epoch": 18.0, "eval_nb_samtale_loss": 0.5264986753463745, "eval_nb_samtale_runtime": 47.5607, "eval_nb_samtale_samples_per_second": 11.207, "eval_nb_samtale_steps_per_second": 0.357, "eval_nb_samtale_wer": 0.237548828125, "step": 30348 }, { "epoch": 19.0, "grad_norm": 5.667070388793945, "learning_rate": 5.371549893842888e-05, "loss": 0.407, "step": 32034 }, { "epoch": 19.0, "eval_bigbrother_loss": 1.402126669883728, "eval_bigbrother_runtime": 55.4841, "eval_bigbrother_samples_per_second": 24.692, "eval_bigbrother_steps_per_second": 0.775, "eval_bigbrother_wer": 0.4772416015467655, "step": 32034 }, { "epoch": 19.0, "eval_BB_NB_RUND_loss": 0.8144161701202393, "eval_BB_NB_RUND_runtime": 193.9029, "eval_BB_NB_RUND_samples_per_second": 16.72, "eval_BB_NB_RUND_steps_per_second": 0.526, "eval_BB_NB_RUND_wer": 0.29502997070128756, "step": 32034 }, { "epoch": 19.0, "eval_rundkast_loss": 0.3256075978279114, "eval_rundkast_runtime": 40.5438, "eval_rundkast_samples_per_second": 33.026, "eval_rundkast_steps_per_second": 1.036, "eval_rundkast_wer": 0.17381219004959206, "step": 32034 }, { "epoch": 19.0, "eval_nb_samtale_loss": 0.5318475365638733, "eval_nb_samtale_runtime": 47.61, "eval_nb_samtale_samples_per_second": 11.195, "eval_nb_samtale_steps_per_second": 0.357, "eval_nb_samtale_wer": 0.234619140625, "step": 32034 }, { "epoch": 20.0, "grad_norm": NaN, "learning_rate": 5.116166211707614e-05, "loss": 0.394, "step": 33720 }, { "epoch": 20.0, "eval_bigbrother_loss": 1.3861628770828247, "eval_bigbrother_runtime": 55.5803, "eval_bigbrother_samples_per_second": 24.649, "eval_bigbrother_steps_per_second": 0.774, "eval_bigbrother_wer": 0.47168291307500204, "step": 33720 }, { "epoch": 20.0, "eval_BB_NB_RUND_loss": 0.8024275302886963, "eval_BB_NB_RUND_runtime": 184.6934, "eval_BB_NB_RUND_samples_per_second": 17.553, "eval_BB_NB_RUND_steps_per_second": 0.552, "eval_BB_NB_RUND_wer": 0.28771873236029355, "step": 33720 }, { "epoch": 20.0, "eval_rundkast_loss": 0.31396913528442383, "eval_rundkast_runtime": 40.1483, "eval_rundkast_samples_per_second": 33.351, "eval_rundkast_steps_per_second": 1.046, "eval_rundkast_wer": 0.16221404575267956, "step": 33720 }, { "epoch": 20.0, "eval_nb_samtale_loss": 0.5292519927024841, "eval_nb_samtale_runtime": 47.252, "eval_nb_samtale_samples_per_second": 11.28, "eval_nb_samtale_steps_per_second": 0.36, "eval_nb_samtale_wer": 0.229248046875, "step": 33720 }, { "epoch": 21.0, "grad_norm": 10.585386276245117, "learning_rate": 4.860479223536549e-05, "loss": 0.3812, "step": 35406 }, { "epoch": 21.0, "eval_bigbrother_loss": 1.368707537651062, "eval_bigbrother_runtime": 55.1721, "eval_bigbrother_samples_per_second": 24.831, "eval_bigbrother_steps_per_second": 0.779, "eval_bigbrother_wer": 0.45702086522194474, "step": 35406 }, { "epoch": 21.0, "eval_BB_NB_RUND_loss": 0.7922731041908264, "eval_BB_NB_RUND_runtime": 186.0861, "eval_BB_NB_RUND_samples_per_second": 17.422, "eval_BB_NB_RUND_steps_per_second": 0.548, "eval_BB_NB_RUND_wer": 0.2828804128699298, "step": 35406 }, { "epoch": 21.0, "eval_rundkast_loss": 0.3038511872291565, "eval_rundkast_runtime": 40.036, "eval_rundkast_samples_per_second": 33.445, "eval_rundkast_steps_per_second": 1.049, "eval_rundkast_wer": 0.16437370020796674, "step": 35406 }, { "epoch": 21.0, "eval_nb_samtale_loss": 0.5377490520477295, "eval_nb_samtale_runtime": 47.8978, "eval_nb_samtale_samples_per_second": 11.128, "eval_nb_samtale_steps_per_second": 0.355, "eval_nb_samtale_wer": 0.227294921875, "step": 35406 }, { "epoch": 22.0, "grad_norm": 5.612251281738281, "learning_rate": 4.604792235365484e-05, "loss": 0.3656, "step": 37092 }, { "epoch": 22.0, "eval_bigbrother_loss": 1.3479688167572021, "eval_bigbrother_runtime": 55.3759, "eval_bigbrother_samples_per_second": 24.74, "eval_bigbrother_steps_per_second": 0.777, "eval_bigbrother_wer": 0.46588254249577055, "step": 37092 }, { "epoch": 22.0, "eval_BB_NB_RUND_loss": 0.7788259387016296, "eval_BB_NB_RUND_runtime": 186.5504, "eval_BB_NB_RUND_samples_per_second": 17.379, "eval_BB_NB_RUND_steps_per_second": 0.547, "eval_BB_NB_RUND_wer": 0.285890922775045, "step": 37092 }, { "epoch": 22.0, "eval_rundkast_loss": 0.30141252279281616, "eval_rundkast_runtime": 40.0476, "eval_rundkast_samples_per_second": 33.435, "eval_rundkast_steps_per_second": 1.049, "eval_rundkast_wer": 0.16549352103663414, "step": 37092 }, { "epoch": 22.0, "eval_nb_samtale_loss": 0.5157301425933838, "eval_nb_samtale_runtime": 47.2633, "eval_nb_samtale_samples_per_second": 11.277, "eval_nb_samtale_steps_per_second": 0.36, "eval_nb_samtale_wer": 0.22599283854166666, "step": 37092 }, { "epoch": 23.0, "grad_norm": 21.909698486328125, "learning_rate": 4.349560206248104e-05, "loss": 0.3507, "step": 38778 }, { "epoch": 23.0, "eval_bigbrother_loss": 1.436195731163025, "eval_bigbrother_runtime": 55.1641, "eval_bigbrother_samples_per_second": 24.835, "eval_bigbrother_steps_per_second": 0.779, "eval_bigbrother_wer": 0.45677918311447674, "step": 38778 }, { "epoch": 23.0, "eval_BB_NB_RUND_loss": 0.8368074893951416, "eval_BB_NB_RUND_runtime": 174.9632, "eval_BB_NB_RUND_samples_per_second": 18.53, "eval_BB_NB_RUND_steps_per_second": 0.583, "eval_BB_NB_RUND_wer": 0.2791979141467086, "step": 38778 }, { "epoch": 23.0, "eval_rundkast_loss": 0.3419454097747803, "eval_rundkast_runtime": 40.1893, "eval_rundkast_samples_per_second": 33.317, "eval_rundkast_steps_per_second": 1.045, "eval_rundkast_wer": 0.15853463445848665, "step": 38778 }, { "epoch": 23.0, "eval_nb_samtale_loss": 0.5392637848854065, "eval_nb_samtale_runtime": 47.8657, "eval_nb_samtale_samples_per_second": 11.135, "eval_nb_samtale_steps_per_second": 0.355, "eval_nb_samtale_wer": 0.22233072916666666, "step": 38778 }, { "epoch": 24.0, "grad_norm": 17.75894546508789, "learning_rate": 4.09387321807704e-05, "loss": 0.3407, "step": 40464 }, { "epoch": 24.0, "eval_bigbrother_loss": 1.394923448562622, "eval_bigbrother_runtime": 55.3073, "eval_bigbrother_samples_per_second": 24.771, "eval_bigbrother_steps_per_second": 0.777, "eval_bigbrother_wer": 0.4556513332796262, "step": 40464 }, { "epoch": 24.0, "eval_BB_NB_RUND_loss": 0.8072466850280762, "eval_BB_NB_RUND_runtime": 184.4773, "eval_BB_NB_RUND_samples_per_second": 17.574, "eval_BB_NB_RUND_steps_per_second": 0.553, "eval_BB_NB_RUND_wer": 0.279681746095745, "step": 40464 }, { "epoch": 24.0, "eval_rundkast_loss": 0.32181429862976074, "eval_rundkast_runtime": 40.2553, "eval_rundkast_samples_per_second": 33.263, "eval_rundkast_steps_per_second": 1.043, "eval_rundkast_wer": 0.15709486482162854, "step": 40464 }, { "epoch": 24.0, "eval_nb_samtale_loss": 0.5160051584243774, "eval_nb_samtale_runtime": 48.428, "eval_nb_samtale_samples_per_second": 11.006, "eval_nb_samtale_steps_per_second": 0.351, "eval_nb_samtale_wer": 0.22639973958333334, "step": 40464 }, { "epoch": 25.0, "grad_norm": 7.524557590484619, "learning_rate": 3.838186229905975e-05, "loss": 0.3306, "step": 42150 }, { "epoch": 25.0, "eval_bigbrother_loss": 1.4151748418807983, "eval_bigbrother_runtime": 54.9262, "eval_bigbrother_samples_per_second": 24.943, "eval_bigbrother_steps_per_second": 0.783, "eval_bigbrother_wer": 0.45146217675018124, "step": 42150 }, { "epoch": 25.0, "eval_BB_NB_RUND_loss": 0.8287575840950012, "eval_BB_NB_RUND_runtime": 184.6246, "eval_BB_NB_RUND_samples_per_second": 17.56, "eval_BB_NB_RUND_steps_per_second": 0.552, "eval_BB_NB_RUND_wer": 0.2747896674999328, "step": 42150 }, { "epoch": 25.0, "eval_rundkast_loss": 0.34578415751457214, "eval_rundkast_runtime": 40.2638, "eval_rundkast_samples_per_second": 33.256, "eval_rundkast_steps_per_second": 1.043, "eval_rundkast_wer": 0.15877459606462965, "step": 42150 }, { "epoch": 25.0, "eval_nb_samtale_loss": 0.5345997214317322, "eval_nb_samtale_runtime": 47.4285, "eval_nb_samtale_samples_per_second": 11.238, "eval_nb_samtale_steps_per_second": 0.358, "eval_nb_samtale_wer": 0.214111328125, "step": 42150 }, { "epoch": 26.0, "grad_norm": 45.58380126953125, "learning_rate": 3.582650894752806e-05, "loss": 0.3192, "step": 43836 }, { "epoch": 26.0, "eval_bigbrother_loss": 1.5123320817947388, "eval_bigbrother_runtime": 54.6916, "eval_bigbrother_samples_per_second": 25.05, "eval_bigbrother_steps_per_second": 0.786, "eval_bigbrother_wer": 0.4467896560058004, "step": 43836 }, { "epoch": 26.0, "eval_BB_NB_RUND_loss": 0.8734822869300842, "eval_BB_NB_RUND_runtime": 185.5859, "eval_BB_NB_RUND_samples_per_second": 17.469, "eval_BB_NB_RUND_steps_per_second": 0.55, "eval_BB_NB_RUND_wer": 0.27237050775475097, "step": 43836 }, { "epoch": 26.0, "eval_rundkast_loss": 0.3513795733451843, "eval_rundkast_runtime": 40.0168, "eval_rundkast_samples_per_second": 33.461, "eval_rundkast_steps_per_second": 1.05, "eval_rundkast_wer": 0.1575747880339146, "step": 43836 }, { "epoch": 26.0, "eval_nb_samtale_loss": 0.5426519513130188, "eval_nb_samtale_runtime": 47.2324, "eval_nb_samtale_samples_per_second": 11.285, "eval_nb_samtale_steps_per_second": 0.36, "eval_nb_samtale_wer": 0.212890625, "step": 43836 }, { "epoch": 27.0, "grad_norm": 51.679561614990234, "learning_rate": 3.326963906581741e-05, "loss": 0.3092, "step": 45522 }, { "epoch": 27.0, "eval_bigbrother_loss": 1.4591954946517944, "eval_bigbrother_runtime": 54.7449, "eval_bigbrother_samples_per_second": 25.025, "eval_bigbrother_steps_per_second": 0.785, "eval_bigbrother_wer": 0.44324498509627, "step": 45522 }, { "epoch": 27.0, "eval_BB_NB_RUND_loss": 0.8474361896514893, "eval_BB_NB_RUND_runtime": 185.4261, "eval_BB_NB_RUND_samples_per_second": 17.484, "eval_BB_NB_RUND_steps_per_second": 0.55, "eval_BB_NB_RUND_wer": 0.2704351799586055, "step": 45522 }, { "epoch": 27.0, "eval_rundkast_loss": 0.34611085057258606, "eval_rundkast_runtime": 39.9599, "eval_rundkast_samples_per_second": 33.509, "eval_rundkast_steps_per_second": 1.051, "eval_rundkast_wer": 0.15381538953767399, "step": 45522 }, { "epoch": 27.0, "eval_nb_samtale_loss": 0.5338240265846252, "eval_nb_samtale_runtime": 47.1834, "eval_nb_samtale_samples_per_second": 11.296, "eval_nb_samtale_steps_per_second": 0.36, "eval_nb_samtale_wer": 0.21500651041666666, "step": 45522 }, { "epoch": 28.0, "grad_norm": 6.035738468170166, "learning_rate": 3.071276918410677e-05, "loss": 0.2935, "step": 47208 }, { "epoch": 28.0, "eval_bigbrother_loss": 1.4708665609359741, "eval_bigbrother_runtime": 55.0307, "eval_bigbrother_samples_per_second": 24.895, "eval_bigbrother_steps_per_second": 0.781, "eval_bigbrother_wer": 0.4352694755498268, "step": 47208 }, { "epoch": 28.0, "eval_BB_NB_RUND_loss": 0.8631957173347473, "eval_BB_NB_RUND_runtime": 250.4068, "eval_BB_NB_RUND_samples_per_second": 12.947, "eval_BB_NB_RUND_steps_per_second": 0.407, "eval_BB_NB_RUND_wer": 0.26624196973362363, "step": 47208 }, { "epoch": 28.0, "eval_rundkast_loss": 0.35267603397369385, "eval_rundkast_runtime": 40.1826, "eval_rundkast_samples_per_second": 33.323, "eval_rundkast_steps_per_second": 1.045, "eval_rundkast_wer": 0.1529355303151496, "step": 47208 }, { "epoch": 28.0, "eval_nb_samtale_loss": 0.583747923374176, "eval_nb_samtale_runtime": 47.2983, "eval_nb_samtale_samples_per_second": 11.269, "eval_nb_samtale_steps_per_second": 0.359, "eval_nb_samtale_wer": 0.21053059895833334, "step": 47208 }, { "epoch": 29.0, "grad_norm": 6.352161407470703, "learning_rate": 2.8155899302396122e-05, "loss": 0.2854, "step": 48894 }, { "epoch": 29.0, "eval_bigbrother_loss": 1.5383168458938599, "eval_bigbrother_runtime": 54.9702, "eval_bigbrother_samples_per_second": 24.923, "eval_bigbrother_steps_per_second": 0.782, "eval_bigbrother_wer": 0.4352694755498268, "step": 48894 }, { "epoch": 29.0, "eval_BB_NB_RUND_loss": 0.8866830468177795, "eval_BB_NB_RUND_runtime": 184.2665, "eval_BB_NB_RUND_samples_per_second": 17.594, "eval_BB_NB_RUND_steps_per_second": 0.554, "eval_BB_NB_RUND_wer": 0.2632583393812327, "step": 48894 }, { "epoch": 29.0, "eval_rundkast_loss": 0.3528152108192444, "eval_rundkast_runtime": 40.0458, "eval_rundkast_samples_per_second": 33.437, "eval_rundkast_steps_per_second": 1.049, "eval_rundkast_wer": 0.1476563749800032, "step": 48894 }, { "epoch": 29.0, "eval_nb_samtale_loss": 0.5526814460754395, "eval_nb_samtale_runtime": 47.2216, "eval_nb_samtale_samples_per_second": 11.287, "eval_nb_samtale_steps_per_second": 0.36, "eval_nb_samtale_wer": 0.20662434895833334, "step": 48894 }, { "epoch": 30.0, "grad_norm": 16.592275619506836, "learning_rate": 2.5600545950864424e-05, "loss": 0.2743, "step": 50580 }, { "epoch": 30.0, "eval_bigbrother_loss": 1.491037130355835, "eval_bigbrother_runtime": 55.562, "eval_bigbrother_samples_per_second": 24.657, "eval_bigbrother_steps_per_second": 0.774, "eval_bigbrother_wer": 0.4344638685249335, "step": 50580 }, { "epoch": 30.0, "eval_BB_NB_RUND_loss": 0.8672559261322021, "eval_BB_NB_RUND_runtime": 206.7209, "eval_BB_NB_RUND_samples_per_second": 15.683, "eval_BB_NB_RUND_steps_per_second": 0.493, "eval_BB_NB_RUND_wer": 0.2624519527995054, "step": 50580 }, { "epoch": 30.0, "eval_rundkast_loss": 0.352713406085968, "eval_rundkast_runtime": 40.2922, "eval_rundkast_samples_per_second": 33.232, "eval_rundkast_steps_per_second": 1.042, "eval_rundkast_wer": 0.1478963365861462, "step": 50580 }, { "epoch": 30.0, "eval_nb_samtale_loss": 0.5577544569969177, "eval_nb_samtale_runtime": 47.5456, "eval_nb_samtale_samples_per_second": 11.21, "eval_nb_samtale_steps_per_second": 0.358, "eval_nb_samtale_wer": 0.20467122395833334, "step": 50580 }, { "epoch": 31.0, "grad_norm": 45.161354064941406, "learning_rate": 2.3045192599332726e-05, "loss": 0.2642, "step": 52266 }, { "epoch": 31.0, "eval_bigbrother_loss": 1.5767817497253418, "eval_bigbrother_runtime": 55.8334, "eval_bigbrother_samples_per_second": 24.537, "eval_bigbrother_steps_per_second": 0.77, "eval_bigbrother_wer": 0.43317489728510433, "step": 52266 }, { "epoch": 31.0, "eval_BB_NB_RUND_loss": 0.9109604358673096, "eval_BB_NB_RUND_runtime": 200.853, "eval_BB_NB_RUND_samples_per_second": 16.141, "eval_BB_NB_RUND_steps_per_second": 0.508, "eval_BB_NB_RUND_wer": 0.2612692524796387, "step": 52266 }, { "epoch": 31.0, "eval_rundkast_loss": 0.3539213240146637, "eval_rundkast_runtime": 40.1832, "eval_rundkast_samples_per_second": 33.322, "eval_rundkast_steps_per_second": 1.045, "eval_rundkast_wer": 0.14285714285714285, "step": 52266 }, { "epoch": 31.0, "eval_nb_samtale_loss": 0.5987378358840942, "eval_nb_samtale_runtime": 47.6989, "eval_nb_samtale_samples_per_second": 11.174, "eval_nb_samtale_steps_per_second": 0.356, "eval_nb_samtale_wer": 0.20768229166666666, "step": 52266 }, { "epoch": 32.0, "grad_norm": 11.585915565490723, "learning_rate": 2.0489839247801032e-05, "loss": 0.2547, "step": 53952 }, { "epoch": 32.0, "eval_bigbrother_loss": 1.529497742652893, "eval_bigbrother_runtime": 55.5603, "eval_bigbrother_samples_per_second": 24.658, "eval_bigbrother_steps_per_second": 0.774, "eval_bigbrother_wer": 0.42954966567308467, "step": 53952 }, { "epoch": 32.0, "eval_BB_NB_RUND_loss": 0.8869587779045105, "eval_BB_NB_RUND_runtime": 185.554, "eval_BB_NB_RUND_samples_per_second": 17.472, "eval_BB_NB_RUND_steps_per_second": 0.55, "eval_BB_NB_RUND_wer": 0.25793618794183265, "step": 53952 }, { "epoch": 32.0, "eval_rundkast_loss": 0.3568912148475647, "eval_rundkast_runtime": 40.0636, "eval_rundkast_samples_per_second": 33.422, "eval_rundkast_steps_per_second": 1.048, "eval_rundkast_wer": 0.14397696368581028, "step": 53952 }, { "epoch": 32.0, "eval_nb_samtale_loss": 0.566994309425354, "eval_nb_samtale_runtime": 47.5483, "eval_nb_samtale_samples_per_second": 11.21, "eval_nb_samtale_steps_per_second": 0.358, "eval_nb_samtale_wer": 0.20003255208333334, "step": 53952 }, { "epoch": 33.0, "grad_norm": 6.523238182067871, "learning_rate": 1.7932969366090385e-05, "loss": 0.2471, "step": 55638 }, { "epoch": 33.0, "eval_bigbrother_loss": 1.589526891708374, "eval_bigbrother_runtime": 54.9785, "eval_bigbrother_samples_per_second": 24.919, "eval_bigbrother_steps_per_second": 0.782, "eval_bigbrother_wer": 0.41980182067187627, "step": 55638 }, { "epoch": 33.0, "eval_BB_NB_RUND_loss": 0.9184404611587524, "eval_BB_NB_RUND_runtime": 176.6606, "eval_BB_NB_RUND_samples_per_second": 18.352, "eval_BB_NB_RUND_steps_per_second": 0.577, "eval_BB_NB_RUND_wer": 0.25258715694970835, "step": 55638 }, { "epoch": 33.0, "eval_rundkast_loss": 0.3644249141216278, "eval_rundkast_runtime": 40.0915, "eval_rundkast_samples_per_second": 33.399, "eval_rundkast_steps_per_second": 1.048, "eval_rundkast_wer": 0.14117741161414174, "step": 55638 }, { "epoch": 33.0, "eval_nb_samtale_loss": 0.5854535102844238, "eval_nb_samtale_runtime": 47.6556, "eval_nb_samtale_samples_per_second": 11.184, "eval_nb_samtale_steps_per_second": 0.357, "eval_nb_samtale_wer": 0.19669596354166666, "step": 55638 }, { "epoch": 34.0, "grad_norm": 6.739225387573242, "learning_rate": 1.5376099484379742e-05, "loss": 0.2391, "step": 57324 }, { "epoch": 34.0, "eval_bigbrother_loss": 1.5508168935775757, "eval_bigbrother_runtime": 55.2494, "eval_bigbrother_samples_per_second": 24.797, "eval_bigbrother_steps_per_second": 0.778, "eval_bigbrother_wer": 0.4182711673245791, "step": 57324 }, { "epoch": 34.0, "eval_BB_NB_RUND_loss": 0.9037603139877319, "eval_BB_NB_RUND_runtime": 189.0492, "eval_BB_NB_RUND_samples_per_second": 17.149, "eval_BB_NB_RUND_steps_per_second": 0.54, "eval_BB_NB_RUND_wer": 0.2511356611025993, "step": 57324 }, { "epoch": 34.0, "eval_rundkast_loss": 0.37484127283096313, "eval_rundkast_runtime": 40.5007, "eval_rundkast_samples_per_second": 33.061, "eval_rundkast_steps_per_second": 1.037, "eval_rundkast_wer": 0.1410174372100464, "step": 57324 }, { "epoch": 34.0, "eval_nb_samtale_loss": 0.5698674917221069, "eval_nb_samtale_runtime": 47.7367, "eval_nb_samtale_samples_per_second": 11.165, "eval_nb_samtale_steps_per_second": 0.356, "eval_nb_samtale_wer": 0.19417317708333334, "step": 57324 }, { "epoch": 35.0, "grad_norm": 8.39053726196289, "learning_rate": 1.2819229602669094e-05, "loss": 0.2279, "step": 59010 }, { "epoch": 35.0, "eval_bigbrother_loss": 1.5247896909713745, "eval_bigbrother_runtime": 55.883, "eval_bigbrother_samples_per_second": 24.516, "eval_bigbrother_steps_per_second": 0.769, "eval_bigbrother_wer": 0.41843228872955773, "step": 59010 }, { "epoch": 35.0, "eval_BB_NB_RUND_loss": 0.8858203291893005, "eval_BB_NB_RUND_runtime": 186.0172, "eval_BB_NB_RUND_samples_per_second": 17.428, "eval_BB_NB_RUND_steps_per_second": 0.548, "eval_BB_NB_RUND_wer": 0.24989920167728408, "step": 59010 }, { "epoch": 35.0, "eval_rundkast_loss": 0.3675382137298584, "eval_rundkast_runtime": 39.7117, "eval_rundkast_samples_per_second": 33.718, "eval_rundkast_steps_per_second": 1.058, "eval_rundkast_wer": 0.13845784674452088, "step": 59010 }, { "epoch": 35.0, "eval_nb_samtale_loss": 0.5457141995429993, "eval_nb_samtale_runtime": 47.1407, "eval_nb_samtale_samples_per_second": 11.307, "eval_nb_samtale_steps_per_second": 0.361, "eval_nb_samtale_wer": 0.19327799479166666, "step": 59010 }, { "epoch": 36.0, "grad_norm": 32.44700622558594, "learning_rate": 1.0263876251137398e-05, "loss": 0.2202, "step": 60696 }, { "epoch": 36.0, "eval_bigbrother_loss": 1.6295210123062134, "eval_bigbrother_runtime": 55.7536, "eval_bigbrother_samples_per_second": 24.572, "eval_bigbrother_steps_per_second": 0.771, "eval_bigbrother_wer": 0.4164988318698139, "step": 60696 }, { "epoch": 36.0, "eval_BB_NB_RUND_loss": 0.9496392607688904, "eval_BB_NB_RUND_runtime": 187.239, "eval_BB_NB_RUND_samples_per_second": 17.315, "eval_BB_NB_RUND_steps_per_second": 0.545, "eval_BB_NB_RUND_wer": 0.24809827164475984, "step": 60696 }, { "epoch": 36.0, "eval_rundkast_loss": 0.41033124923706055, "eval_rundkast_runtime": 39.7349, "eval_rundkast_samples_per_second": 33.698, "eval_rundkast_steps_per_second": 1.057, "eval_rundkast_wer": 0.1346184610462326, "step": 60696 }, { "epoch": 36.0, "eval_nb_samtale_loss": 0.5565491318702698, "eval_nb_samtale_runtime": 47.2102, "eval_nb_samtale_samples_per_second": 11.29, "eval_nb_samtale_steps_per_second": 0.36, "eval_nb_samtale_wer": 0.193115234375, "step": 60696 }, { "epoch": 37.0, "grad_norm": 6.115579128265381, "learning_rate": 7.710039429784654e-06, "loss": 0.2134, "step": 62382 }, { "epoch": 37.0, "eval_bigbrother_loss": 1.6113148927688599, "eval_bigbrother_runtime": 55.3118, "eval_bigbrother_samples_per_second": 24.769, "eval_bigbrother_steps_per_second": 0.777, "eval_bigbrother_wer": 0.42068798839925886, "step": 62382 }, { "epoch": 37.0, "eval_BB_NB_RUND_loss": 0.9415259957313538, "eval_BB_NB_RUND_runtime": 186.5349, "eval_BB_NB_RUND_samples_per_second": 17.38, "eval_BB_NB_RUND_steps_per_second": 0.547, "eval_BB_NB_RUND_wer": 0.24963040615004167, "step": 62382 }, { "epoch": 37.0, "eval_rundkast_loss": 0.40727370977401733, "eval_rundkast_runtime": 40.0362, "eval_rundkast_samples_per_second": 33.445, "eval_rundkast_steps_per_second": 1.049, "eval_rundkast_wer": 0.1369380899056151, "step": 62382 }, { "epoch": 37.0, "eval_nb_samtale_loss": 0.5639351606369019, "eval_nb_samtale_runtime": 46.907, "eval_nb_samtale_samples_per_second": 11.363, "eval_nb_samtale_steps_per_second": 0.362, "eval_nb_samtale_wer": 0.19140625, "step": 62382 }, { "epoch": 38.0, "grad_norm": 10.58083438873291, "learning_rate": 5.153169548074007e-06, "loss": 0.2094, "step": 64068 }, { "epoch": 38.0, "eval_bigbrother_loss": 1.6277378797531128, "eval_bigbrother_runtime": 54.6605, "eval_bigbrother_samples_per_second": 25.064, "eval_bigbrother_steps_per_second": 0.787, "eval_bigbrother_wer": 0.41037621848062517, "step": 64068 }, { "epoch": 38.0, "eval_BB_NB_RUND_loss": 0.9503330588340759, "eval_BB_NB_RUND_runtime": 187.301, "eval_BB_NB_RUND_samples_per_second": 17.309, "eval_BB_NB_RUND_steps_per_second": 0.545, "eval_BB_NB_RUND_wer": 0.24508776173964467, "step": 64068 }, { "epoch": 38.0, "eval_rundkast_loss": 0.4076659679412842, "eval_rundkast_runtime": 40.0836, "eval_rundkast_samples_per_second": 33.405, "eval_rundkast_steps_per_second": 1.048, "eval_rundkast_wer": 0.1334986402175652, "step": 64068 }, { "epoch": 38.0, "eval_nb_samtale_loss": 0.5725387334823608, "eval_nb_samtale_runtime": 48.2674, "eval_nb_samtale_samples_per_second": 11.043, "eval_nb_samtale_steps_per_second": 0.352, "eval_nb_samtale_wer": 0.19156901041666666, "step": 64068 }, { "epoch": 39.0, "grad_norm": 9.250320434570312, "learning_rate": 2.5978161965423114e-06, "loss": 0.203, "step": 65754 }, { "epoch": 39.0, "eval_bigbrother_loss": 1.6648077964782715, "eval_bigbrother_runtime": 55.4612, "eval_bigbrother_samples_per_second": 24.702, "eval_bigbrother_steps_per_second": 0.775, "eval_bigbrother_wer": 0.40812051881092404, "step": 65754 }, { "epoch": 39.0, "eval_BB_NB_RUND_loss": 0.9731335639953613, "eval_BB_NB_RUND_runtime": 187.078, "eval_BB_NB_RUND_samples_per_second": 17.33, "eval_BB_NB_RUND_steps_per_second": 0.545, "eval_BB_NB_RUND_wer": 0.2430986748380507, "step": 65754 }, { "epoch": 39.0, "eval_rundkast_loss": 0.41892868280410767, "eval_rundkast_runtime": 39.6687, "eval_rundkast_samples_per_second": 33.755, "eval_rundkast_steps_per_second": 1.059, "eval_rundkast_wer": 0.13181890897456408, "step": 65754 }, { "epoch": 39.0, "eval_nb_samtale_loss": 0.5878060460090637, "eval_nb_samtale_runtime": 46.9935, "eval_nb_samtale_samples_per_second": 11.342, "eval_nb_samtale_steps_per_second": 0.362, "eval_nb_samtale_wer": 0.189697265625, "step": 65754 }, { "epoch": 40.0, "grad_norm": 5.386321067810059, "learning_rate": 4.094631483166515e-08, "loss": 0.1995, "step": 67440 }, { "epoch": 40.0, "eval_bigbrother_loss": 1.6618098020553589, "eval_bigbrother_runtime": 55.1914, "eval_bigbrother_samples_per_second": 24.823, "eval_bigbrother_steps_per_second": 0.779, "eval_bigbrother_wer": 0.4102956577781358, "step": 67440 }, { "epoch": 40.0, "eval_BB_NB_RUND_loss": 0.9701318740844727, "eval_BB_NB_RUND_runtime": 185.1129, "eval_BB_NB_RUND_samples_per_second": 17.514, "eval_BB_NB_RUND_steps_per_second": 0.551, "eval_BB_NB_RUND_wer": 0.24457705023788404, "step": 67440 }, { "epoch": 40.0, "eval_rundkast_loss": 0.4156753122806549, "eval_rundkast_runtime": 39.6972, "eval_rundkast_samples_per_second": 33.73, "eval_rundkast_steps_per_second": 1.058, "eval_rundkast_wer": 0.13397856342985123, "step": 67440 }, { "epoch": 40.0, "eval_nb_samtale_loss": 0.5852100849151611, "eval_nb_samtale_runtime": 47.3346, "eval_nb_samtale_samples_per_second": 11.26, "eval_nb_samtale_steps_per_second": 0.359, "eval_nb_samtale_wer": 0.18896484375, "step": 67440 } ], "logging_steps": 500, "max_steps": 67440, "num_input_tokens_seen": 0, "num_train_epochs": 40, "save_steps": 500, "total_flos": 1.1424949557265292e+21, "train_batch_size": 48, "trial_name": null, "trial_params": null }