{ "best_metric": 0.5284518003463745, "best_model_checkpoint": "nrshoudi/hubert_arabic_mdd/checkpoint-6548", "epoch": 10.0, "eval_steps": 500, "global_step": 16370, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "learning_rate": 0.0001, "loss": 6.3943, "step": 1637 }, { "epoch": 1.0, "eval_loss": 1.2721797227859497, "eval_per": 0.4456091585791011, "eval_runtime": 117.745, "eval_samples_per_second": 6.905, "eval_steps_per_second": 3.457, "eval_wer": 0.4692734823386683, "step": 1637 }, { "epoch": 2.0, "learning_rate": 8.888888888888889e-05, "loss": 0.7962, "step": 3274 }, { "epoch": 2.0, "eval_loss": 0.5990138053894043, "eval_per": 0.11846320550268538, "eval_runtime": 118.7347, "eval_samples_per_second": 6.847, "eval_steps_per_second": 3.428, "eval_wer": 0.13774438896925015, "step": 3274 }, { "epoch": 3.0, "learning_rate": 7.777777777777778e-05, "loss": 0.4245, "step": 4911 }, { "epoch": 3.0, "eval_loss": 0.6075053811073303, "eval_per": 0.06744087439932159, "eval_runtime": 118.3123, "eval_samples_per_second": 6.872, "eval_steps_per_second": 3.44, "eval_wer": 0.08991647613270495, "step": 4911 }, { "epoch": 4.0, "learning_rate": 6.666666666666667e-05, "loss": 0.2898, "step": 6548 }, { "epoch": 4.0, "eval_loss": 0.5284518003463745, "eval_per": 0.07384811080750024, "eval_runtime": 121.2465, "eval_samples_per_second": 6.705, "eval_steps_per_second": 3.357, "eval_wer": 0.09789557183519201, "step": 6548 }, { "epoch": 5.0, "learning_rate": 5.555555555555556e-05, "loss": 0.2262, "step": 8185 }, { "epoch": 5.0, "eval_loss": 0.5600156784057617, "eval_per": 0.07577970413643645, "eval_runtime": 119.4374, "eval_samples_per_second": 6.807, "eval_steps_per_second": 3.408, "eval_wer": 0.09770892632168354, "step": 8185 }, { "epoch": 6.0, "learning_rate": 4.4444444444444447e-05, "loss": 0.1803, "step": 9822 }, { "epoch": 6.0, "eval_loss": 0.5504231452941895, "eval_per": 0.060279845472533684, "eval_runtime": 119.1759, "eval_samples_per_second": 6.822, "eval_steps_per_second": 3.415, "eval_wer": 0.08077084597078998, "step": 9822 }, { "epoch": 7.0, "learning_rate": 3.3333333333333335e-05, "loss": 0.1488, "step": 11459 }, { "epoch": 7.0, "eval_loss": 0.5854084491729736, "eval_per": 0.06998492414962781, "eval_runtime": 119.0832, "eval_samples_per_second": 6.827, "eval_steps_per_second": 3.418, "eval_wer": 0.08982315337595073, "step": 11459 }, { "epoch": 8.0, "learning_rate": 2.2222222222222223e-05, "loss": 0.1267, "step": 13096 }, { "epoch": 8.0, "eval_loss": 0.5438163876533508, "eval_per": 0.07222274568924904, "eval_runtime": 119.6311, "eval_samples_per_second": 6.796, "eval_steps_per_second": 3.402, "eval_wer": 0.09140964024077271, "step": 13096 }, { "epoch": 9.0, "learning_rate": 1.1111111111111112e-05, "loss": 0.1156, "step": 14733 }, { "epoch": 9.0, "eval_loss": 0.5394747257232666, "eval_per": 0.06713464618863657, "eval_runtime": 119.6655, "eval_samples_per_second": 6.794, "eval_steps_per_second": 3.401, "eval_wer": 0.08660351826792964, "step": 14733 }, { "epoch": 10.0, "learning_rate": 0.0, "loss": 0.0993, "step": 16370 }, { "epoch": 10.0, "eval_loss": 0.5404430627822876, "eval_per": 0.06713464618863657, "eval_runtime": 120.5761, "eval_samples_per_second": 6.743, "eval_steps_per_second": 3.375, "eval_wer": 0.08590359759227288, "step": 16370 }, { "epoch": 10.0, "step": 16370, "total_flos": 5.23722142955399e+18, "train_loss": 0.8801708410189657, "train_runtime": 9837.0244, "train_samples_per_second": 3.327, "train_steps_per_second": 1.664 } ], "logging_steps": 500, "max_steps": 16370, "num_train_epochs": 10, "save_steps": 500, "total_flos": 5.23722142955399e+18, "trial_name": null, "trial_params": null }