{ "best_metric": 0.3383650779724121, "best_model_checkpoint": "/scratch/skscla001/speech/results/xls-r-300m-bemgen-combined-hp-tuning-test-model/checkpoint-500", "epoch": 22.228163992869874, "eval_steps": 100, "global_step": 800, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 2.7985739750445635, "eval_loss": 2.9111883640289307, "eval_runtime": 39.716, "eval_samples_per_second": 13.622, "eval_steps_per_second": 3.424, "eval_wer": 1.0, "step": 100 }, { "epoch": 5.570409982174688, "eval_loss": 1.6968202590942383, "eval_runtime": 39.8919, "eval_samples_per_second": 13.562, "eval_steps_per_second": 3.409, "eval_wer": 0.9970951343500363, "step": 200 }, { "epoch": 8.342245989304812, "eval_loss": 0.3893207609653473, "eval_runtime": 40.2019, "eval_samples_per_second": 13.457, "eval_steps_per_second": 3.383, "eval_wer": 0.615831517792302, "step": 300 }, { "epoch": 11.114081996434937, "eval_loss": 0.34530752897262573, "eval_runtime": 40.0609, "eval_samples_per_second": 13.504, "eval_steps_per_second": 3.395, "eval_wer": 0.5106753812636166, "step": 400 }, { "epoch": 13.9126559714795, "grad_norm": 7.798405170440674, "learning_rate": 0.0005819322340474784, "loss": 31.2339, "step": 500 }, { "epoch": 13.9126559714795, "eval_loss": 0.3383650779724121, "eval_runtime": 39.984, "eval_samples_per_second": 13.53, "eval_steps_per_second": 3.401, "eval_wer": 0.49092229484386346, "step": 500 }, { "epoch": 16.684491978609625, "eval_loss": 0.3592090606689453, "eval_runtime": 39.9246, "eval_samples_per_second": 13.551, "eval_steps_per_second": 3.406, "eval_wer": 0.46187363834422657, "step": 600 }, { "epoch": 19.45632798573975, "eval_loss": 0.367597371339798, "eval_runtime": 39.9675, "eval_samples_per_second": 13.536, "eval_steps_per_second": 3.403, "eval_wer": 0.4335511982570806, "step": 700 }, { "epoch": 22.228163992869874, "eval_loss": 0.3925014138221741, "eval_runtime": 39.8278, "eval_samples_per_second": 13.583, "eval_steps_per_second": 3.415, "eval_wer": 0.42280319535221494, "step": 800 }, { "epoch": 22.228163992869874, "step": 800, "total_flos": 3.4912812658192863e+19, "train_loss": 20.112410697937012, "train_runtime": 9256.0708, "train_samples_per_second": 14.527, "train_steps_per_second": 0.113 } ], "logging_steps": 500, "max_steps": 1050, "num_input_tokens_seen": 0, "num_train_epochs": 30, "save_steps": 400, "stateful_callbacks": { "EarlyStoppingCallback": { "args": { "early_stopping_patience": 3, "early_stopping_threshold": 0.0 }, "attributes": { "early_stopping_patience_counter": 3 } }, "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 3.4912812658192863e+19, "train_batch_size": 8, "trial_name": null, "trial_params": null }