{ "best_metric": 103.08219178082192, "best_model_checkpoint": "./whisper-small-amet/checkpoint-2000", "epoch": 2000.0, "global_step": 2000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 25.0, "learning_rate": 4.2000000000000006e-07, "loss": 2.9938, "step": 25 }, { "epoch": 50.0, "learning_rate": 9.200000000000001e-07, "loss": 2.2746, "step": 50 }, { "epoch": 75.0, "learning_rate": 1.4000000000000001e-06, "loss": 1.7055, "step": 75 }, { "epoch": 100.0, "learning_rate": 1.9000000000000002e-06, "loss": 0.9013, "step": 100 }, { "epoch": 100.0, "eval_loss": 2.7089741230010986, "eval_runtime": 28.1806, "eval_samples_per_second": 0.71, "eval_steps_per_second": 0.035, "eval_wer": 171.57534246575344, "step": 100 }, { "epoch": 125.0, "learning_rate": 2.4000000000000003e-06, "loss": 0.1244, "step": 125 }, { "epoch": 150.0, "learning_rate": 2.9e-06, "loss": 0.0031, "step": 150 }, { "epoch": 175.0, "learning_rate": 3.4000000000000005e-06, "loss": 0.0004, "step": 175 }, { "epoch": 200.0, "learning_rate": 3.900000000000001e-06, "loss": 0.0002, "step": 200 }, { "epoch": 200.0, "eval_loss": 3.7302818298339844, "eval_runtime": 28.2207, "eval_samples_per_second": 0.709, "eval_steps_per_second": 0.035, "eval_wer": 298.63013698630135, "step": 200 }, { "epoch": 225.0, "learning_rate": 4.4e-06, "loss": 0.0002, "step": 225 }, { "epoch": 250.0, "learning_rate": 4.9000000000000005e-06, "loss": 0.0001, "step": 250 }, { "epoch": 275.0, "learning_rate": 5.400000000000001e-06, "loss": 0.0001, "step": 275 }, { "epoch": 300.0, "learning_rate": 5.9e-06, "loss": 0.0001, "step": 300 }, { "epoch": 300.0, "eval_loss": 3.8286595344543457, "eval_runtime": 28.3319, "eval_samples_per_second": 0.706, "eval_steps_per_second": 0.035, "eval_wer": 239.3835616438356, "step": 300 }, { "epoch": 325.0, "learning_rate": 6.4000000000000006e-06, "loss": 0.0001, "step": 325 }, { "epoch": 350.0, "learning_rate": 6.9e-06, "loss": 0.0001, "step": 350 }, { "epoch": 375.0, "learning_rate": 7.4e-06, "loss": 0.0001, "step": 375 }, { "epoch": 400.0, "learning_rate": 7.9e-06, "loss": 0.0001, "step": 400 }, { "epoch": 400.0, "eval_loss": 3.8876891136169434, "eval_runtime": 28.3964, "eval_samples_per_second": 0.704, "eval_steps_per_second": 0.035, "eval_wer": 234.93150684931504, "step": 400 }, { "epoch": 425.0, "learning_rate": 8.400000000000001e-06, "loss": 0.0001, "step": 425 }, { "epoch": 450.0, "learning_rate": 8.900000000000001e-06, "loss": 0.0001, "step": 450 }, { "epoch": 475.0, "learning_rate": 9.4e-06, "loss": 0.0001, "step": 475 }, { "epoch": 500.0, "learning_rate": 9.9e-06, "loss": 0.0001, "step": 500 }, { "epoch": 500.0, "eval_loss": 4.056136608123779, "eval_runtime": 28.2255, "eval_samples_per_second": 0.709, "eval_steps_per_second": 0.035, "eval_wer": 316.4383561643836, "step": 500 }, { "epoch": 525.0, "learning_rate": 9.866666666666668e-06, "loss": 0.0001, "step": 525 }, { "epoch": 550.0, "learning_rate": 9.7e-06, "loss": 0.0001, "step": 550 }, { "epoch": 575.0, "learning_rate": 9.533333333333334e-06, "loss": 0.0001, "step": 575 }, { "epoch": 600.0, "learning_rate": 9.366666666666668e-06, "loss": 0.0001, "step": 600 }, { "epoch": 600.0, "eval_loss": 4.270617485046387, "eval_runtime": 28.1771, "eval_samples_per_second": 0.71, "eval_steps_per_second": 0.035, "eval_wer": 189.04109589041096, "step": 600 }, { "epoch": 625.0, "learning_rate": 9.200000000000002e-06, "loss": 0.0001, "step": 625 }, { "epoch": 650.0, "learning_rate": 9.033333333333334e-06, "loss": 0.0, "step": 650 }, { "epoch": 675.0, "learning_rate": 8.866666666666668e-06, "loss": 0.0, "step": 675 }, { "epoch": 700.0, "learning_rate": 8.700000000000001e-06, "loss": 0.0, "step": 700 }, { "epoch": 700.0, "eval_loss": 4.452445030212402, "eval_runtime": 28.3415, "eval_samples_per_second": 0.706, "eval_steps_per_second": 0.035, "eval_wer": 229.45205479452056, "step": 700 }, { "epoch": 725.0, "learning_rate": 8.533333333333335e-06, "loss": 0.0, "step": 725 }, { "epoch": 750.0, "learning_rate": 8.366666666666667e-06, "loss": 0.0, "step": 750 }, { "epoch": 775.0, "learning_rate": 8.2e-06, "loss": 0.0, "step": 775 }, { "epoch": 800.0, "learning_rate": 8.033333333333335e-06, "loss": 0.0, "step": 800 }, { "epoch": 800.0, "eval_loss": 4.625022888183594, "eval_runtime": 28.3479, "eval_samples_per_second": 0.706, "eval_steps_per_second": 0.035, "eval_wer": 308.5616438356164, "step": 800 }, { "epoch": 825.0, "learning_rate": 7.866666666666667e-06, "loss": 0.0, "step": 825 }, { "epoch": 850.0, "learning_rate": 7.7e-06, "loss": 0.0, "step": 850 }, { "epoch": 875.0, "learning_rate": 7.533333333333334e-06, "loss": 0.0, "step": 875 }, { "epoch": 900.0, "learning_rate": 7.3666666666666676e-06, "loss": 0.0, "step": 900 }, { "epoch": 900.0, "eval_loss": 4.784408092498779, "eval_runtime": 28.2633, "eval_samples_per_second": 0.708, "eval_steps_per_second": 0.035, "eval_wer": 429.4520547945205, "step": 900 }, { "epoch": 925.0, "learning_rate": 7.2000000000000005e-06, "loss": 0.0, "step": 925 }, { "epoch": 950.0, "learning_rate": 7.033333333333334e-06, "loss": 0.0, "step": 950 }, { "epoch": 975.0, "learning_rate": 6.886666666666667e-06, "loss": 0.0753, "step": 975 }, { "epoch": 1000.0, "learning_rate": 6.720000000000001e-06, "loss": 0.0405, "step": 1000 }, { "epoch": 1000.0, "eval_loss": 4.618178367614746, "eval_runtime": 28.5252, "eval_samples_per_second": 0.701, "eval_steps_per_second": 0.035, "eval_wer": 206.84931506849313, "step": 1000 }, { "epoch": 1025.0, "learning_rate": 6.553333333333334e-06, "loss": 0.0057, "step": 1025 }, { "epoch": 1050.0, "learning_rate": 6.386666666666668e-06, "loss": 0.0001, "step": 1050 }, { "epoch": 1075.0, "learning_rate": 6.220000000000001e-06, "loss": 0.0001, "step": 1075 }, { "epoch": 1100.0, "learning_rate": 6.0533333333333335e-06, "loss": 0.0002, "step": 1100 }, { "epoch": 1100.0, "eval_loss": 5.542290687561035, "eval_runtime": 28.5497, "eval_samples_per_second": 0.701, "eval_steps_per_second": 0.035, "eval_wer": 159.93150684931507, "step": 1100 }, { "epoch": 1125.0, "learning_rate": 5.886666666666667e-06, "loss": 0.0002, "step": 1125 }, { "epoch": 1150.0, "learning_rate": 5.72e-06, "loss": 0.0002, "step": 1150 }, { "epoch": 1175.0, "learning_rate": 5.553333333333334e-06, "loss": 0.0002, "step": 1175 }, { "epoch": 1200.0, "learning_rate": 5.386666666666667e-06, "loss": 0.0002, "step": 1200 }, { "epoch": 1200.0, "eval_loss": 6.0516815185546875, "eval_runtime": 28.4295, "eval_samples_per_second": 0.703, "eval_steps_per_second": 0.035, "eval_wer": 151.7123287671233, "step": 1200 }, { "epoch": 1225.0, "learning_rate": 5.220000000000001e-06, "loss": 0.0002, "step": 1225 }, { "epoch": 1250.0, "learning_rate": 5.053333333333334e-06, "loss": 0.0002, "step": 1250 }, { "epoch": 1275.0, "learning_rate": 4.886666666666668e-06, "loss": 0.0002, "step": 1275 }, { "epoch": 1300.0, "learning_rate": 4.7200000000000005e-06, "loss": 0.0002, "step": 1300 }, { "epoch": 1300.0, "eval_loss": 6.349332332611084, "eval_runtime": 28.5448, "eval_samples_per_second": 0.701, "eval_steps_per_second": 0.035, "eval_wer": 154.7945205479452, "step": 1300 }, { "epoch": 1325.0, "learning_rate": 4.5533333333333335e-06, "loss": 0.0002, "step": 1325 }, { "epoch": 1350.0, "learning_rate": 4.3866666666666665e-06, "loss": 0.0002, "step": 1350 }, { "epoch": 1375.0, "learning_rate": 4.22e-06, "loss": 0.0002, "step": 1375 }, { "epoch": 1400.0, "learning_rate": 4.053333333333333e-06, "loss": 0.0002, "step": 1400 }, { "epoch": 1400.0, "eval_loss": 6.543065547943115, "eval_runtime": 28.5232, "eval_samples_per_second": 0.701, "eval_steps_per_second": 0.035, "eval_wer": 138.6986301369863, "step": 1400 }, { "epoch": 1425.0, "learning_rate": 3.886666666666667e-06, "loss": 0.0002, "step": 1425 }, { "epoch": 1450.0, "learning_rate": 3.7200000000000004e-06, "loss": 0.0002, "step": 1450 }, { "epoch": 1475.0, "learning_rate": 3.5533333333333338e-06, "loss": 0.0002, "step": 1475 }, { "epoch": 1500.0, "learning_rate": 3.386666666666667e-06, "loss": 0.0002, "step": 1500 }, { "epoch": 1500.0, "eval_loss": 6.669939994812012, "eval_runtime": 28.5345, "eval_samples_per_second": 0.701, "eval_steps_per_second": 0.035, "eval_wer": 158.56164383561645, "step": 1500 }, { "epoch": 1525.0, "learning_rate": 3.2200000000000005e-06, "loss": 0.0002, "step": 1525 }, { "epoch": 1550.0, "learning_rate": 3.053333333333334e-06, "loss": 0.0001, "step": 1550 }, { "epoch": 1575.0, "learning_rate": 2.8866666666666673e-06, "loss": 0.0001, "step": 1575 }, { "epoch": 1600.0, "learning_rate": 2.7200000000000002e-06, "loss": 0.0001, "step": 1600 }, { "epoch": 1600.0, "eval_loss": 6.759077548980713, "eval_runtime": 28.534, "eval_samples_per_second": 0.701, "eval_steps_per_second": 0.035, "eval_wer": 160.27397260273972, "step": 1600 }, { "epoch": 1625.0, "learning_rate": 2.5533333333333336e-06, "loss": 0.0001, "step": 1625 }, { "epoch": 1650.0, "learning_rate": 2.386666666666667e-06, "loss": 0.0001, "step": 1650 }, { "epoch": 1675.0, "learning_rate": 2.2200000000000003e-06, "loss": 0.0001, "step": 1675 }, { "epoch": 1700.0, "learning_rate": 2.0533333333333337e-06, "loss": 0.0001, "step": 1700 }, { "epoch": 1700.0, "eval_loss": 6.82085657119751, "eval_runtime": 28.5933, "eval_samples_per_second": 0.699, "eval_steps_per_second": 0.035, "eval_wer": 103.08219178082192, "step": 1700 }, { "epoch": 1725.0, "learning_rate": 1.8866666666666669e-06, "loss": 0.0001, "step": 1725 }, { "epoch": 1750.0, "learning_rate": 1.72e-06, "loss": 0.0001, "step": 1750 }, { "epoch": 1775.0, "learning_rate": 1.5533333333333334e-06, "loss": 0.0001, "step": 1775 }, { "epoch": 1800.0, "learning_rate": 1.3866666666666668e-06, "loss": 0.0001, "step": 1800 }, { "epoch": 1800.0, "eval_loss": 6.856205940246582, "eval_runtime": 28.571, "eval_samples_per_second": 0.7, "eval_steps_per_second": 0.035, "eval_wer": 103.08219178082192, "step": 1800 }, { "epoch": 1825.0, "learning_rate": 1.2200000000000002e-06, "loss": 0.0001, "step": 1825 }, { "epoch": 1850.0, "learning_rate": 1.0533333333333333e-06, "loss": 0.0001, "step": 1850 }, { "epoch": 1875.0, "learning_rate": 8.866666666666668e-07, "loss": 0.0001, "step": 1875 }, { "epoch": 1900.0, "learning_rate": 7.2e-07, "loss": 0.0001, "step": 1900 }, { "epoch": 1900.0, "eval_loss": 6.875776767730713, "eval_runtime": 28.4345, "eval_samples_per_second": 0.703, "eval_steps_per_second": 0.035, "eval_wer": 103.08219178082192, "step": 1900 }, { "epoch": 1925.0, "learning_rate": 5.533333333333334e-07, "loss": 0.0001, "step": 1925 }, { "epoch": 1950.0, "learning_rate": 3.8666666666666674e-07, "loss": 0.0001, "step": 1950 }, { "epoch": 1975.0, "learning_rate": 2.2e-07, "loss": 0.0001, "step": 1975 }, { "epoch": 2000.0, "learning_rate": 5.3333333333333334e-08, "loss": 0.0001, "step": 2000 }, { "epoch": 2000.0, "eval_loss": 6.883942604064941, "eval_runtime": 28.4855, "eval_samples_per_second": 0.702, "eval_steps_per_second": 0.035, "eval_wer": 103.08219178082192, "step": 2000 }, { "epoch": 2000.0, "step": 2000, "total_flos": 5.7717080064e+17, "train_loss": 0.10164999849759625, "train_runtime": 954.9086, "train_samples_per_second": 134.044, "train_steps_per_second": 2.094 } ], "max_steps": 2000, "num_train_epochs": 2000, "total_flos": 5.7717080064e+17, "trial_name": null, "trial_params": null }