{ "best_metric": 0.33164310455322266, "best_model_checkpoint": "wav2vec2-xls-r-1b-ja/checkpoint-15000", "epoch": 99.99527559055119, "global_step": 15800, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 9.49, "learning_rate": 3.7425e-05, "loss": 3.484, "step": 1500 }, { "epoch": 9.49, "eval_cer": 0.4098974987299405, "eval_loss": 1.1849042177200317, "eval_runtime": 268.3084, "eval_samples_per_second": 16.66, "eval_steps_per_second": 2.083, "eval_wer": 0.7542696367448612, "step": 1500 }, { "epoch": 18.98, "learning_rate": 4.638768115942029e-05, "loss": 1.3582, "step": 3000 }, { "epoch": 18.98, "eval_cer": 0.1590532827301796, "eval_loss": 0.4320400655269623, "eval_runtime": 269.0628, "eval_samples_per_second": 16.613, "eval_steps_per_second": 2.078, "eval_wer": 0.34893639898926543, "step": 3000 }, { "epoch": 28.48, "learning_rate": 4.095289855072464e-05, "loss": 1.1716, "step": 4500 }, { "epoch": 28.48, "eval_cer": 0.1453904312225443, "eval_loss": 0.38348379731178284, "eval_runtime": 270.1414, "eval_samples_per_second": 16.547, "eval_steps_per_second": 2.069, "eval_wer": 0.31746742889912366, "step": 4500 }, { "epoch": 37.97, "learning_rate": 3.552173913043478e-05, "loss": 1.0951, "step": 6000 }, { "epoch": 37.97, "eval_cer": 0.14047754236021875, "eval_loss": 0.3732404410839081, "eval_runtime": 272.8075, "eval_samples_per_second": 16.385, "eval_steps_per_second": 2.049, "eval_wer": 0.3032741348721349, "step": 6000 }, { "epoch": 47.47, "learning_rate": 3.0090579710144927e-05, "loss": 1.04, "step": 7500 }, { "epoch": 47.47, "eval_cer": 0.13603681678271523, "eval_loss": 0.34847018122673035, "eval_runtime": 268.2852, "eval_samples_per_second": 16.661, "eval_steps_per_second": 2.084, "eval_wer": 0.28983351552839554, "step": 7500 }, { "epoch": 56.96, "learning_rate": 2.4655797101449275e-05, "loss": 0.9768, "step": 9000 }, { "epoch": 56.96, "eval_cer": 0.13088485790275828, "eval_loss": 0.33858078718185425, "eval_runtime": 269.384, "eval_samples_per_second": 16.593, "eval_steps_per_second": 2.075, "eval_wer": 0.278722603537571, "step": 9000 }, { "epoch": 66.45, "learning_rate": 1.922463768115942e-05, "loss": 0.9129, "step": 10500 }, { "epoch": 66.45, "eval_cer": 0.1271553656277082, "eval_loss": 0.336273193359375, "eval_runtime": 267.776, "eval_samples_per_second": 16.693, "eval_steps_per_second": 2.088, "eval_wer": 0.27108833175032704, "step": 10500 }, { "epoch": 75.94, "learning_rate": 1.3793478260869565e-05, "loss": 0.8614, "step": 12000 }, { "epoch": 75.94, "eval_cer": 0.12596001553955113, "eval_loss": 0.33856987953186035, "eval_runtime": 268.1172, "eval_samples_per_second": 16.672, "eval_steps_per_second": 2.085, "eval_wer": 0.26755792906937154, "step": 12000 }, { "epoch": 85.44, "learning_rate": 8.358695652173914e-06, "loss": 0.8092, "step": 13500 }, { "epoch": 85.44, "eval_cer": 0.12399964139497355, "eval_loss": 0.3356078565120697, "eval_runtime": 269.2379, "eval_samples_per_second": 16.602, "eval_steps_per_second": 2.076, "eval_wer": 0.26103474848121, "step": 13500 }, { "epoch": 94.93, "learning_rate": 2.9275362318840578e-06, "loss": 0.7658, "step": 15000 }, { "epoch": 94.93, "eval_cer": 0.12175835997967904, "eval_loss": 0.33164310455322266, "eval_runtime": 268.5018, "eval_samples_per_second": 16.648, "eval_steps_per_second": 2.082, "eval_wer": 0.2563574129495887, "step": 15000 }, { "epoch": 100.0, "step": 15800, "total_flos": 4.622164701241047e+20, "train_loss": 1.2220959588545788, "train_runtime": 95146.6811, "train_samples_per_second": 10.674, "train_steps_per_second": 0.166 } ], "max_steps": 15800, "num_train_epochs": 100, "total_flos": 4.622164701241047e+20, "trial_name": null, "trial_params": null }