{ "best_metric": 0.3490070093457944, "best_model_checkpoint": "/content/drive/MyDrive/wav2vec2-large-xlsr-persian-asr-shemo_partial/checkpoint-1900", "epoch": 12.5, "eval_steps": 100, "global_step": 2000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.62, "learning_rate": 2.0000000000000003e-06, "loss": 2.3226, "step": 100 }, { "epoch": 0.62, "eval_loss": 1.4547958374023438, "eval_runtime": 34.1762, "eval_samples_per_second": 8.31, "eval_steps_per_second": 1.053, "eval_wer": 0.48510514018691586, "step": 100 }, { "epoch": 1.25, "learning_rate": 4.000000000000001e-06, "loss": 1.7166, "step": 200 }, { "epoch": 1.25, "eval_loss": 1.2459642887115479, "eval_runtime": 33.6203, "eval_samples_per_second": 8.447, "eval_steps_per_second": 1.071, "eval_wer": 0.4278621495327103, "step": 200 }, { "epoch": 1.88, "learning_rate": 6e-06, "loss": 1.4987, "step": 300 }, { "epoch": 1.88, "eval_loss": 1.0671327114105225, "eval_runtime": 34.2581, "eval_samples_per_second": 8.29, "eval_steps_per_second": 1.051, "eval_wer": 0.41939252336448596, "step": 300 }, { "epoch": 2.5, "learning_rate": 7.980000000000002e-06, "loss": 1.3771, "step": 400 }, { "epoch": 2.5, "eval_loss": 0.9783589243888855, "eval_runtime": 33.3818, "eval_samples_per_second": 8.508, "eval_steps_per_second": 1.078, "eval_wer": 0.4053738317757009, "step": 400 }, { "epoch": 3.12, "learning_rate": 9.980000000000001e-06, "loss": 1.3217, "step": 500 }, { "epoch": 3.12, "eval_loss": 0.9450137615203857, "eval_runtime": 33.8716, "eval_samples_per_second": 8.385, "eval_steps_per_second": 1.063, "eval_wer": 0.3904789719626168, "step": 500 }, { "epoch": 3.75, "learning_rate": 9.340000000000002e-06, "loss": 1.3272, "step": 600 }, { "epoch": 3.75, "eval_loss": 0.8850811719894409, "eval_runtime": 33.8154, "eval_samples_per_second": 8.399, "eval_steps_per_second": 1.065, "eval_wer": 0.384053738317757, "step": 600 }, { "epoch": 4.38, "learning_rate": 8.673333333333334e-06, "loss": 1.3025, "step": 700 }, { "epoch": 4.38, "eval_loss": 0.8747560977935791, "eval_runtime": 33.4341, "eval_samples_per_second": 8.494, "eval_steps_per_second": 1.077, "eval_wer": 0.37792056074766356, "step": 700 }, { "epoch": 5.0, "learning_rate": 8.006666666666667e-06, "loss": 1.2719, "step": 800 }, { "epoch": 5.0, "eval_loss": 0.8673518300056458, "eval_runtime": 33.8685, "eval_samples_per_second": 8.385, "eval_steps_per_second": 1.063, "eval_wer": 0.3723714953271028, "step": 800 }, { "epoch": 5.62, "learning_rate": 7.340000000000001e-06, "loss": 1.2563, "step": 900 }, { "epoch": 5.62, "eval_loss": 0.846738338470459, "eval_runtime": 33.4615, "eval_samples_per_second": 8.487, "eval_steps_per_second": 1.076, "eval_wer": 0.3691588785046729, "step": 900 }, { "epoch": 6.25, "learning_rate": 6.6733333333333335e-06, "loss": 1.2451, "step": 1000 }, { "epoch": 6.25, "eval_loss": 0.8440045714378357, "eval_runtime": 33.5683, "eval_samples_per_second": 8.46, "eval_steps_per_second": 1.072, "eval_wer": 0.3644859813084112, "step": 1000 }, { "epoch": 6.88, "learning_rate": 6.006666666666667e-06, "loss": 1.2585, "step": 1100 }, { "epoch": 6.88, "eval_loss": 0.8292242884635925, "eval_runtime": 33.7508, "eval_samples_per_second": 8.415, "eval_steps_per_second": 1.067, "eval_wer": 0.36098130841121495, "step": 1100 }, { "epoch": 7.5, "learning_rate": 5.3400000000000005e-06, "loss": 1.2633, "step": 1200 }, { "epoch": 7.5, "eval_loss": 0.8137357234954834, "eval_runtime": 33.9332, "eval_samples_per_second": 8.369, "eval_steps_per_second": 1.061, "eval_wer": 0.36010514018691586, "step": 1200 }, { "epoch": 8.12, "learning_rate": 4.673333333333333e-06, "loss": 1.1923, "step": 1300 }, { "epoch": 8.12, "eval_loss": 0.8262812495231628, "eval_runtime": 33.9528, "eval_samples_per_second": 8.365, "eval_steps_per_second": 1.06, "eval_wer": 0.3574766355140187, "step": 1300 }, { "epoch": 8.75, "learning_rate": 4.006666666666667e-06, "loss": 1.2349, "step": 1400 }, { "epoch": 8.75, "eval_loss": 0.8184483647346497, "eval_runtime": 33.8393, "eval_samples_per_second": 8.393, "eval_steps_per_second": 1.064, "eval_wer": 0.35514018691588783, "step": 1400 }, { "epoch": 9.38, "learning_rate": 3.3400000000000006e-06, "loss": 1.2511, "step": 1500 }, { "epoch": 9.38, "eval_loss": 0.8078120350837708, "eval_runtime": 34.5077, "eval_samples_per_second": 8.23, "eval_steps_per_second": 1.043, "eval_wer": 0.3516355140186916, "step": 1500 }, { "epoch": 10.0, "learning_rate": 2.6733333333333333e-06, "loss": 1.1779, "step": 1600 }, { "epoch": 10.0, "eval_loss": 0.8102284669876099, "eval_runtime": 33.4526, "eval_samples_per_second": 8.49, "eval_steps_per_second": 1.076, "eval_wer": 0.35046728971962615, "step": 1600 }, { "epoch": 10.62, "learning_rate": 2.006666666666667e-06, "loss": 1.2161, "step": 1700 }, { "epoch": 10.62, "eval_loss": 0.8123233318328857, "eval_runtime": 33.6692, "eval_samples_per_second": 8.435, "eval_steps_per_second": 1.069, "eval_wer": 0.34988317757009346, "step": 1700 }, { "epoch": 11.25, "learning_rate": 1.34e-06, "loss": 1.1967, "step": 1800 }, { "epoch": 11.25, "eval_loss": 0.8086321353912354, "eval_runtime": 33.5258, "eval_samples_per_second": 8.471, "eval_steps_per_second": 1.074, "eval_wer": 0.3501752336448598, "step": 1800 }, { "epoch": 11.88, "learning_rate": 6.733333333333334e-07, "loss": 1.2454, "step": 1900 }, { "epoch": 11.88, "eval_loss": 0.806648850440979, "eval_runtime": 33.3738, "eval_samples_per_second": 8.51, "eval_steps_per_second": 1.079, "eval_wer": 0.3490070093457944, "step": 1900 }, { "epoch": 12.5, "learning_rate": 6.666666666666667e-09, "loss": 1.1928, "step": 2000 }, { "epoch": 12.5, "eval_loss": 0.8069162368774414, "eval_runtime": 33.1842, "eval_samples_per_second": 8.558, "eval_steps_per_second": 1.085, "eval_wer": 0.3490070093457944, "step": 2000 }, { "epoch": 12.5, "step": 2000, "total_flos": 9.605345431463184e+18, "train_loss": 1.3434337348937988, "train_runtime": 8414.919, "train_samples_per_second": 3.803, "train_steps_per_second": 0.238 } ], "logging_steps": 100, "max_steps": 2000, "num_train_epochs": 13, "save_steps": 100, "total_flos": 9.605345431463184e+18, "trial_name": null, "trial_params": null }