{ "best_metric": 0.3309297263622284, "best_model_checkpoint": "nrshoudi/hubert_arabic_mdd/checkpoint-11459", "epoch": 20.0, "eval_steps": 500, "global_step": 32740, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "learning_rate": 5e-05, "loss": 5.6351, "step": 1637 }, { "epoch": 1.0, "eval_loss": 0.7704485058784485, "eval_per": 0.3110336379911429, "eval_runtime": 117.9251, "eval_samples_per_second": 6.894, "eval_steps_per_second": 3.451, "eval_wer": 0.3277028603424945, "step": 1637 }, { "epoch": 2.0, "learning_rate": 0.0001, "loss": 0.3646, "step": 3274 }, { "epoch": 2.0, "eval_loss": 0.433285653591156, "eval_per": 0.05403750117780081, "eval_runtime": 117.5906, "eval_samples_per_second": 6.914, "eval_steps_per_second": 3.461, "eval_wer": 0.06728570761980308, "step": 3274 }, { "epoch": 3.0, "learning_rate": 9.444444444444444e-05, "loss": 0.1587, "step": 4911 }, { "epoch": 3.0, "eval_loss": 0.3875606060028076, "eval_per": 0.05804202393291247, "eval_runtime": 117.765, "eval_samples_per_second": 6.904, "eval_steps_per_second": 3.456, "eval_wer": 0.07101861788997246, "step": 4911 }, { "epoch": 4.0, "learning_rate": 8.888888888888889e-05, "loss": 0.1105, "step": 6548 }, { "epoch": 4.0, "eval_loss": 0.3607988655567169, "eval_per": 0.05578064637708471, "eval_runtime": 117.9127, "eval_samples_per_second": 6.895, "eval_steps_per_second": 3.452, "eval_wer": 0.06695907797116327, "step": 6548 }, { "epoch": 5.0, "learning_rate": 8.333333333333334e-05, "loss": 0.0878, "step": 8185 }, { "epoch": 5.0, "eval_loss": 0.3808358907699585, "eval_per": 0.05618109865259587, "eval_runtime": 117.5542, "eval_samples_per_second": 6.916, "eval_steps_per_second": 3.462, "eval_wer": 0.06775232140357426, "step": 8185 }, { "epoch": 6.0, "learning_rate": 7.777777777777778e-05, "loss": 0.0738, "step": 9822 }, { "epoch": 6.0, "eval_loss": 0.3576147258281708, "eval_per": 0.05177612362197305, "eval_runtime": 118.5636, "eval_samples_per_second": 6.857, "eval_steps_per_second": 3.433, "eval_wer": 0.06392608837665065, "step": 9822 }, { "epoch": 7.0, "learning_rate": 7.222222222222222e-05, "loss": 0.0594, "step": 11459 }, { "epoch": 7.0, "eval_loss": 0.3309297263622284, "eval_per": 0.050810326957504946, "eval_runtime": 117.7279, "eval_samples_per_second": 6.906, "eval_steps_per_second": 3.457, "eval_wer": 0.06173300359292613, "step": 11459 }, { "epoch": 8.0, "learning_rate": 6.666666666666667e-05, "loss": 0.056, "step": 13096 }, { "epoch": 8.0, "eval_loss": 0.3569846451282501, "eval_per": 0.046711580137567134, "eval_runtime": 118.1175, "eval_samples_per_second": 6.883, "eval_steps_per_second": 3.446, "eval_wer": 0.058700013998413514, "step": 13096 }, { "epoch": 9.0, "learning_rate": 6.111111111111112e-05, "loss": 0.0478, "step": 14733 }, { "epoch": 9.0, "eval_loss": 0.34502002596855164, "eval_per": 0.04727692452652407, "eval_runtime": 117.9103, "eval_samples_per_second": 6.895, "eval_steps_per_second": 3.452, "eval_wer": 0.05832672297139657, "step": 14733 }, { "epoch": 10.0, "learning_rate": 5.555555555555556e-05, "loss": 0.0388, "step": 16370 }, { "epoch": 10.0, "eval_loss": 0.3993436396121979, "eval_per": 0.04803071704513333, "eval_runtime": 117.7116, "eval_samples_per_second": 6.907, "eval_steps_per_second": 3.458, "eval_wer": 0.05907330502543045, "step": 16370 }, { "epoch": 11.0, "learning_rate": 5e-05, "loss": 0.0378, "step": 18007 }, { "epoch": 11.0, "eval_loss": 0.4171537160873413, "eval_per": 0.0437435220955432, "eval_runtime": 118.1365, "eval_samples_per_second": 6.882, "eval_steps_per_second": 3.445, "eval_wer": 0.05501376510662125, "step": 18007 }, { "epoch": 12.0, "learning_rate": 4.4444444444444447e-05, "loss": 0.0319, "step": 19644 }, { "epoch": 12.0, "eval_loss": 0.3625492751598358, "eval_per": 0.04131725242626967, "eval_runtime": 118.0928, "eval_samples_per_second": 6.884, "eval_steps_per_second": 3.446, "eval_wer": 0.051794129998600155, "step": 19644 }, { "epoch": 13.0, "learning_rate": 3.888888888888889e-05, "loss": 0.0309, "step": 21281 }, { "epoch": 13.0, "eval_loss": 0.3794006109237671, "eval_per": 0.03919721096768115, "eval_runtime": 118.3172, "eval_samples_per_second": 6.871, "eval_steps_per_second": 3.44, "eval_wer": 0.05053427278241799, "step": 21281 }, { "epoch": 14.0, "learning_rate": 3.3333333333333335e-05, "loss": 0.0257, "step": 22918 }, { "epoch": 14.0, "eval_loss": 0.3896752893924713, "eval_per": 0.04263638933383586, "eval_runtime": 118.7663, "eval_samples_per_second": 6.845, "eval_steps_per_second": 3.427, "eval_wer": 0.05342727824179926, "step": 22918 }, { "epoch": 15.0, "learning_rate": 2.777777777777778e-05, "loss": 0.0202, "step": 24555 }, { "epoch": 15.0, "eval_loss": 0.40769127011299133, "eval_per": 0.04042212381042118, "eval_runtime": 118.2316, "eval_samples_per_second": 6.876, "eval_steps_per_second": 3.442, "eval_wer": 0.05123419345807475, "step": 24555 }, { "epoch": 16.0, "learning_rate": 2.2222222222222223e-05, "loss": 0.0197, "step": 26192 }, { "epoch": 16.0, "eval_loss": 0.38464316725730896, "eval_per": 0.041128804296617354, "eval_runtime": 118.9714, "eval_samples_per_second": 6.834, "eval_steps_per_second": 3.421, "eval_wer": 0.05076757967430358, "step": 26192 }, { "epoch": 17.0, "learning_rate": 1.6666666666666667e-05, "loss": 0.016, "step": 27829 }, { "epoch": 17.0, "eval_loss": 0.3807629942893982, "eval_per": 0.03910298690285499, "eval_runtime": 118.4593, "eval_samples_per_second": 6.863, "eval_steps_per_second": 3.436, "eval_wer": 0.04913443143110448, "step": 27829 }, { "epoch": 18.0, "learning_rate": 1.1111111111111112e-05, "loss": 0.0157, "step": 29466 }, { "epoch": 18.0, "eval_loss": 0.4060150980949402, "eval_per": 0.03726561763874493, "eval_runtime": 118.2175, "eval_samples_per_second": 6.877, "eval_steps_per_second": 3.443, "eval_wer": 0.047127992160888435, "step": 29466 }, { "epoch": 19.0, "learning_rate": 5.555555555555556e-06, "loss": 0.0131, "step": 31103 }, { "epoch": 19.0, "eval_loss": 0.3925394117832184, "eval_per": 0.03611137284462452, "eval_runtime": 118.443, "eval_samples_per_second": 6.864, "eval_steps_per_second": 3.436, "eval_wer": 0.04652139424198591, "step": 31103 }, { "epoch": 20.0, "learning_rate": 0.0, "loss": 0.0115, "step": 32740 }, { "epoch": 20.0, "eval_loss": 0.39911746978759766, "eval_per": 0.036252708941863755, "eval_runtime": 118.88, "eval_samples_per_second": 6.839, "eval_steps_per_second": 3.424, "eval_wer": 0.04656805562036303, "step": 32740 }, { "epoch": 20.0, "step": 32740, "total_flos": 1.0473975577487264e+19, "train_loss": 0.3427419745201153, "train_runtime": 19585.0411, "train_samples_per_second": 3.342, "train_steps_per_second": 1.672 } ], "logging_steps": 500, "max_steps": 32740, "num_train_epochs": 20, "save_steps": 500, "total_flos": 1.0473975577487264e+19, "trial_name": null, "trial_params": null }