{ "best_metric": 0.854691743850708, "best_model_checkpoint": "nrshoudi/hubert-large-ls960-ft-V2-50/checkpoint-11452", "epoch": 20.0, "eval_steps": 500, "global_step": 16360, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "learning_rate": 5e-05, "loss": 12.8849, "step": 818 }, { "epoch": 1.0, "eval_loss": 4.592483043670654, "eval_per": 0.9649250918684632, "eval_runtime": 118.1886, "eval_samples_per_second": 6.879, "eval_steps_per_second": 3.444, "eval_wer": 0.9551117540012132, "step": 818 }, { "epoch": 2.0, "learning_rate": 0.0001, "loss": 2.7511, "step": 1636 }, { "epoch": 2.0, "eval_loss": 1.7072813510894775, "eval_per": 0.4559738057099783, "eval_runtime": 117.681, "eval_samples_per_second": 6.909, "eval_steps_per_second": 3.459, "eval_wer": 0.4692734823386683, "step": 1636 }, { "epoch": 3.0, "learning_rate": 9.444444444444444e-05, "loss": 1.1653, "step": 2454 }, { "epoch": 3.0, "eval_loss": 1.1204495429992676, "eval_per": 0.1317016866107604, "eval_runtime": 118.0673, "eval_samples_per_second": 6.886, "eval_steps_per_second": 3.447, "eval_wer": 0.15342261210396155, "step": 2454 }, { "epoch": 4.0, "learning_rate": 8.888888888888889e-05, "loss": 0.7529, "step": 3272 }, { "epoch": 4.0, "eval_loss": 1.033559799194336, "eval_per": 0.08411853387355131, "eval_runtime": 118.2209, "eval_samples_per_second": 6.877, "eval_steps_per_second": 3.443, "eval_wer": 0.10554803788903924, "step": 3272 }, { "epoch": 5.0, "learning_rate": 8.333333333333334e-05, "loss": 0.6309, "step": 4090 }, { "epoch": 5.0, "eval_loss": 1.0015147924423218, "eval_per": 0.08166870818807123, "eval_runtime": 118.3158, "eval_samples_per_second": 6.871, "eval_steps_per_second": 3.44, "eval_wer": 0.10228174140264103, "step": 4090 }, { "epoch": 6.0, "learning_rate": 7.777777777777778e-05, "loss": 0.5354, "step": 4908 }, { "epoch": 6.0, "eval_loss": 1.0387498140335083, "eval_per": 0.07768774144916611, "eval_runtime": 118.2614, "eval_samples_per_second": 6.875, "eval_steps_per_second": 3.442, "eval_wer": 0.09924875180812841, "step": 4908 }, { "epoch": 7.0, "learning_rate": 7.222222222222222e-05, "loss": 0.4907, "step": 5726 }, { "epoch": 7.0, "eval_loss": 0.9956713318824768, "eval_per": 0.08925374540657684, "eval_runtime": 117.9222, "eval_samples_per_second": 6.894, "eval_steps_per_second": 3.451, "eval_wer": 0.10872101161868322, "step": 5726 }, { "epoch": 8.0, "learning_rate": 6.666666666666667e-05, "loss": 0.4326, "step": 6544 }, { "epoch": 8.0, "eval_loss": 0.8882040977478027, "eval_per": 0.08440120606802977, "eval_runtime": 118.2986, "eval_samples_per_second": 6.872, "eval_steps_per_second": 3.44, "eval_wer": 0.10914096402407727, "step": 6544 }, { "epoch": 9.0, "learning_rate": 6.111111111111112e-05, "loss": 0.4148, "step": 7362 }, { "epoch": 9.0, "eval_loss": 0.9541579484939575, "eval_per": 0.06376613587110148, "eval_runtime": 118.3333, "eval_samples_per_second": 6.87, "eval_steps_per_second": 3.439, "eval_wer": 0.08301059213289161, "step": 7362 }, { "epoch": 10.0, "learning_rate": 5.555555555555556e-05, "loss": 0.3779, "step": 8180 }, { "epoch": 10.0, "eval_loss": 0.9479207396507263, "eval_per": 0.05010364647130877, "eval_runtime": 118.3528, "eval_samples_per_second": 6.869, "eval_steps_per_second": 3.439, "eval_wer": 0.06901217861975643, "step": 8180 }, { "epoch": 11.0, "learning_rate": 5e-05, "loss": 0.3502, "step": 8998 }, { "epoch": 11.0, "eval_loss": 0.9840469360351562, "eval_per": 0.04906718175822105, "eval_runtime": 118.5969, "eval_samples_per_second": 6.855, "eval_steps_per_second": 3.432, "eval_wer": 0.06887219448462507, "step": 8998 }, { "epoch": 12.0, "learning_rate": 4.4444444444444447e-05, "loss": 0.3294, "step": 9816 }, { "epoch": 12.0, "eval_loss": 1.087670922279358, "eval_per": 0.04906718175822105, "eval_runtime": 118.227, "eval_samples_per_second": 6.877, "eval_steps_per_second": 3.443, "eval_wer": 0.06943213102515049, "step": 9816 }, { "epoch": 13.0, "learning_rate": 3.888888888888889e-05, "loss": 0.3239, "step": 10634 }, { "epoch": 13.0, "eval_loss": 0.8955483436584473, "eval_per": 0.05335437670781117, "eval_runtime": 118.657, "eval_samples_per_second": 6.852, "eval_steps_per_second": 3.43, "eval_wer": 0.07311837991694274, "step": 10634 }, { "epoch": 14.0, "learning_rate": 3.3333333333333335e-05, "loss": 0.3069, "step": 11452 }, { "epoch": 14.0, "eval_loss": 0.854691743850708, "eval_per": 0.05804202393291247, "eval_runtime": 119.0248, "eval_samples_per_second": 6.831, "eval_steps_per_second": 3.419, "eval_wer": 0.077597872241146, "step": 11452 }, { "epoch": 15.0, "learning_rate": 2.777777777777778e-05, "loss": 0.2689, "step": 12270 }, { "epoch": 15.0, "eval_loss": 0.968323290348053, "eval_per": 0.05245924809196269, "eval_runtime": 118.5754, "eval_samples_per_second": 6.856, "eval_steps_per_second": 3.432, "eval_wer": 0.07199850683589193, "step": 12270 }, { "epoch": 16.0, "learning_rate": 2.2222222222222223e-05, "loss": 0.2486, "step": 13088 }, { "epoch": 16.0, "eval_loss": 0.9282185435295105, "eval_per": 0.05189390370300575, "eval_runtime": 118.5748, "eval_samples_per_second": 6.856, "eval_steps_per_second": 3.432, "eval_wer": 0.07041201997106994, "step": 13088 }, { "epoch": 17.0, "learning_rate": 1.6666666666666667e-05, "loss": 0.2291, "step": 13906 }, { "epoch": 17.0, "eval_loss": 0.900354266166687, "eval_per": 0.048101385093752946, "eval_runtime": 118.0532, "eval_samples_per_second": 6.887, "eval_steps_per_second": 3.448, "eval_wer": 0.06714572348467174, "step": 13906 }, { "epoch": 18.0, "learning_rate": 1.1111111111111112e-05, "loss": 0.2294, "step": 14724 }, { "epoch": 18.0, "eval_loss": 0.9242432117462158, "eval_per": 0.05472062564779045, "eval_runtime": 118.8448, "eval_samples_per_second": 6.841, "eval_steps_per_second": 3.425, "eval_wer": 0.07470486678176473, "step": 14724 }, { "epoch": 19.0, "learning_rate": 5.555555555555556e-06, "loss": 0.2151, "step": 15542 }, { "epoch": 19.0, "eval_loss": 0.9400033354759216, "eval_per": 0.05540375011778008, "eval_runtime": 118.591, "eval_samples_per_second": 6.855, "eval_steps_per_second": 3.432, "eval_wer": 0.07470486678176473, "step": 15542 }, { "epoch": 20.0, "learning_rate": 0.0, "loss": 0.2109, "step": 16360 }, { "epoch": 20.0, "eval_loss": 0.9222491979598999, "eval_per": 0.05396683312918119, "eval_runtime": 119.3623, "eval_samples_per_second": 6.811, "eval_steps_per_second": 3.41, "eval_wer": 0.07321170267369698, "step": 16360 }, { "epoch": 20.0, "step": 16360, "total_flos": 5.249198170404504e+18, "train_loss": 1.15744112849527, "train_runtime": 11016.1558, "train_samples_per_second": 2.97, "train_steps_per_second": 1.485 } ], "logging_steps": 500, "max_steps": 16360, "num_train_epochs": 20, "save_steps": 500, "total_flos": 5.249198170404504e+18, "trial_name": null, "trial_params": null }