whisper_large_CGN / trainer_state.json
Jakob Poncelet
First model version
4a3d9de
{
"best_metric": 9.615871912312803,
"best_model_checkpoint": "/esat/audioslave/jponcele/whisper/finetuning_event/CGN/large/checkpoint-15000",
"epoch": 18.033533333333335,
"global_step": 15000,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.01,
"learning_rate": 1.94e-06,
"loss": 0.7504,
"step": 100
},
{
"epoch": 0.01,
"learning_rate": 3.920000000000001e-06,
"loss": 0.3565,
"step": 200
},
{
"epoch": 0.02,
"learning_rate": 5.92e-06,
"loss": 0.2271,
"step": 300
},
{
"epoch": 0.03,
"learning_rate": 7.92e-06,
"loss": 0.2206,
"step": 400
},
{
"epoch": 0.03,
"learning_rate": 9.920000000000002e-06,
"loss": 0.2448,
"step": 500
},
{
"epoch": 0.04,
"learning_rate": 9.933793103448277e-06,
"loss": 0.1832,
"step": 600
},
{
"epoch": 0.05,
"learning_rate": 9.865517241379312e-06,
"loss": 0.1504,
"step": 700
},
{
"epoch": 0.05,
"learning_rate": 9.796551724137931e-06,
"loss": 0.4013,
"step": 800
},
{
"epoch": 1.01,
"learning_rate": 9.727586206896552e-06,
"loss": 0.1325,
"step": 900
},
{
"epoch": 1.01,
"learning_rate": 9.658620689655173e-06,
"loss": 0.1078,
"step": 1000
},
{
"epoch": 1.01,
"eval_loss": 0.2717978060245514,
"eval_runtime": 90930.871,
"eval_samples_per_second": 0.568,
"eval_steps_per_second": 0.035,
"eval_wer": 14.3057057034114,
"step": 1000
},
{
"epoch": 1.02,
"learning_rate": 9.589655172413795e-06,
"loss": 0.1774,
"step": 1100
},
{
"epoch": 1.03,
"learning_rate": 9.520689655172414e-06,
"loss": 0.2996,
"step": 1200
},
{
"epoch": 1.03,
"learning_rate": 9.452413793103449e-06,
"loss": 0.1175,
"step": 1300
},
{
"epoch": 1.04,
"learning_rate": 9.38344827586207e-06,
"loss": 0.1589,
"step": 1400
},
{
"epoch": 1.05,
"learning_rate": 9.314482758620691e-06,
"loss": 0.2052,
"step": 1500
},
{
"epoch": 1.05,
"learning_rate": 9.24551724137931e-06,
"loss": 0.2372,
"step": 1600
},
{
"epoch": 2.01,
"learning_rate": 9.176551724137932e-06,
"loss": 0.1863,
"step": 1700
},
{
"epoch": 2.01,
"learning_rate": 9.107586206896553e-06,
"loss": 0.1293,
"step": 1800
},
{
"epoch": 2.02,
"learning_rate": 9.038620689655173e-06,
"loss": 0.1582,
"step": 1900
},
{
"epoch": 2.03,
"learning_rate": 8.969655172413794e-06,
"loss": 0.0762,
"step": 2000
},
{
"epoch": 2.03,
"eval_loss": 0.25997287034988403,
"eval_runtime": 86242.9732,
"eval_samples_per_second": 0.598,
"eval_steps_per_second": 0.037,
"eval_wer": 12.468659951078328,
"step": 2000
},
{
"epoch": 2.03,
"learning_rate": 8.900689655172415e-06,
"loss": 0.0869,
"step": 2100
},
{
"epoch": 2.04,
"learning_rate": 8.831724137931034e-06,
"loss": 0.067,
"step": 2200
},
{
"epoch": 2.05,
"learning_rate": 8.762758620689657e-06,
"loss": 0.2022,
"step": 2300
},
{
"epoch": 2.05,
"learning_rate": 8.693793103448277e-06,
"loss": 0.1808,
"step": 2400
},
{
"epoch": 3.01,
"learning_rate": 8.624827586206898e-06,
"loss": 0.1677,
"step": 2500
},
{
"epoch": 3.01,
"learning_rate": 8.555862068965517e-06,
"loss": 0.1633,
"step": 2600
},
{
"epoch": 3.02,
"learning_rate": 8.486896551724139e-06,
"loss": 0.1031,
"step": 2700
},
{
"epoch": 3.03,
"learning_rate": 8.41793103448276e-06,
"loss": 0.1452,
"step": 2800
},
{
"epoch": 3.03,
"learning_rate": 8.34896551724138e-06,
"loss": 0.0673,
"step": 2900
},
{
"epoch": 3.04,
"learning_rate": 8.28e-06,
"loss": 0.1941,
"step": 3000
},
{
"epoch": 3.04,
"eval_loss": 0.23860542476177216,
"eval_runtime": 87491.9677,
"eval_samples_per_second": 0.59,
"eval_steps_per_second": 0.037,
"eval_wer": 12.355587473912474,
"step": 3000
},
{
"epoch": 3.05,
"learning_rate": 8.211034482758622e-06,
"loss": 0.1519,
"step": 3100
},
{
"epoch": 3.05,
"learning_rate": 8.142068965517243e-06,
"loss": 0.1579,
"step": 3200
},
{
"epoch": 4.01,
"learning_rate": 8.073793103448276e-06,
"loss": 0.1228,
"step": 3300
},
{
"epoch": 4.01,
"learning_rate": 8.004827586206897e-06,
"loss": 0.2056,
"step": 3400
},
{
"epoch": 4.02,
"learning_rate": 7.935862068965518e-06,
"loss": 0.1543,
"step": 3500
},
{
"epoch": 4.03,
"learning_rate": 7.866896551724138e-06,
"loss": 0.0864,
"step": 3600
},
{
"epoch": 4.03,
"learning_rate": 7.797931034482759e-06,
"loss": 0.1363,
"step": 3700
},
{
"epoch": 4.04,
"learning_rate": 7.72896551724138e-06,
"loss": 0.0343,
"step": 3800
},
{
"epoch": 4.05,
"learning_rate": 7.660000000000001e-06,
"loss": 0.1021,
"step": 3900
},
{
"epoch": 4.05,
"learning_rate": 7.5910344827586215e-06,
"loss": 0.11,
"step": 4000
},
{
"epoch": 4.05,
"eval_loss": 0.24147863686084747,
"eval_runtime": 86034.4263,
"eval_samples_per_second": 0.6,
"eval_steps_per_second": 0.037,
"eval_wer": 11.524479299969311,
"step": 4000
},
{
"epoch": 5.0,
"learning_rate": 7.522068965517242e-06,
"loss": 0.0596,
"step": 4100
},
{
"epoch": 5.01,
"learning_rate": 7.453103448275862e-06,
"loss": 0.0889,
"step": 4200
},
{
"epoch": 5.02,
"learning_rate": 7.384137931034483e-06,
"loss": 0.0699,
"step": 4300
},
{
"epoch": 5.03,
"learning_rate": 7.315172413793104e-06,
"loss": 0.1914,
"step": 4400
},
{
"epoch": 5.03,
"learning_rate": 7.246206896551725e-06,
"loss": 0.1299,
"step": 4500
},
{
"epoch": 5.04,
"learning_rate": 7.177241379310346e-06,
"loss": 0.1244,
"step": 4600
},
{
"epoch": 5.04,
"learning_rate": 7.108275862068966e-06,
"loss": 0.079,
"step": 4700
},
{
"epoch": 5.05,
"learning_rate": 7.039310344827587e-06,
"loss": 0.0565,
"step": 4800
},
{
"epoch": 6.0,
"learning_rate": 6.970344827586207e-06,
"loss": 0.0424,
"step": 4900
},
{
"epoch": 6.01,
"learning_rate": 6.901379310344828e-06,
"loss": 0.0578,
"step": 5000
},
{
"epoch": 6.01,
"eval_loss": 0.23887480795383453,
"eval_runtime": 85622.6213,
"eval_samples_per_second": 0.603,
"eval_steps_per_second": 0.038,
"eval_wer": 11.166289121740093,
"step": 5000
},
{
"epoch": 6.02,
"learning_rate": 6.8324137931034485e-06,
"loss": 0.0527,
"step": 5100
},
{
"epoch": 6.02,
"learning_rate": 6.763448275862069e-06,
"loss": 0.0582,
"step": 5200
},
{
"epoch": 6.03,
"learning_rate": 6.694482758620691e-06,
"loss": 0.024,
"step": 5300
},
{
"epoch": 6.04,
"learning_rate": 6.625517241379311e-06,
"loss": 0.0562,
"step": 5400
},
{
"epoch": 6.04,
"learning_rate": 6.5565517241379315e-06,
"loss": 0.0607,
"step": 5500
},
{
"epoch": 6.05,
"learning_rate": 6.487586206896552e-06,
"loss": 0.0512,
"step": 5600
},
{
"epoch": 7.0,
"learning_rate": 6.418620689655173e-06,
"loss": 0.0434,
"step": 5700
},
{
"epoch": 7.01,
"learning_rate": 6.349655172413793e-06,
"loss": 0.0901,
"step": 5800
},
{
"epoch": 7.02,
"learning_rate": 6.280689655172414e-06,
"loss": 0.0687,
"step": 5900
},
{
"epoch": 7.02,
"learning_rate": 6.211724137931035e-06,
"loss": 0.0198,
"step": 6000
},
{
"epoch": 7.02,
"eval_loss": 0.2530022859573364,
"eval_runtime": 85352.5107,
"eval_samples_per_second": 0.605,
"eval_steps_per_second": 0.038,
"eval_wer": 10.562726574706145,
"step": 6000
},
{
"epoch": 7.03,
"learning_rate": 6.142758620689656e-06,
"loss": 0.0909,
"step": 6100
},
{
"epoch": 7.04,
"learning_rate": 6.073793103448276e-06,
"loss": 0.0906,
"step": 6200
},
{
"epoch": 7.04,
"learning_rate": 6.0048275862068975e-06,
"loss": 0.0599,
"step": 6300
},
{
"epoch": 7.05,
"learning_rate": 5.935862068965518e-06,
"loss": 0.0607,
"step": 6400
},
{
"epoch": 8.0,
"learning_rate": 5.866896551724138e-06,
"loss": 0.0932,
"step": 6500
},
{
"epoch": 8.01,
"learning_rate": 5.7979310344827585e-06,
"loss": 0.0902,
"step": 6600
},
{
"epoch": 8.02,
"learning_rate": 5.72896551724138e-06,
"loss": 0.0183,
"step": 6700
},
{
"epoch": 8.02,
"learning_rate": 5.66e-06,
"loss": 0.0264,
"step": 6800
},
{
"epoch": 8.03,
"learning_rate": 5.591034482758621e-06,
"loss": 0.0254,
"step": 6900
},
{
"epoch": 8.04,
"learning_rate": 5.522068965517242e-06,
"loss": 0.0924,
"step": 7000
},
{
"epoch": 8.04,
"eval_loss": 0.22727389633655548,
"eval_runtime": 85997.3481,
"eval_samples_per_second": 0.6,
"eval_steps_per_second": 0.038,
"eval_wer": 10.726350598532859,
"step": 7000
},
{
"epoch": 8.04,
"learning_rate": 5.453103448275863e-06,
"loss": 0.092,
"step": 7100
},
{
"epoch": 8.05,
"learning_rate": 5.384137931034483e-06,
"loss": 0.0653,
"step": 7200
},
{
"epoch": 9.0,
"learning_rate": 5.315172413793104e-06,
"loss": 0.0986,
"step": 7300
},
{
"epoch": 9.01,
"learning_rate": 5.2462068965517245e-06,
"loss": 0.1079,
"step": 7400
},
{
"epoch": 9.02,
"learning_rate": 5.177241379310345e-06,
"loss": 0.0404,
"step": 7500
},
{
"epoch": 9.02,
"learning_rate": 5.108275862068965e-06,
"loss": 0.0623,
"step": 7600
},
{
"epoch": 9.03,
"learning_rate": 5.039310344827587e-06,
"loss": 0.0219,
"step": 7700
},
{
"epoch": 9.04,
"learning_rate": 4.970344827586207e-06,
"loss": 0.0433,
"step": 7800
},
{
"epoch": 9.04,
"learning_rate": 4.901379310344828e-06,
"loss": 0.0555,
"step": 7900
},
{
"epoch": 9.05,
"learning_rate": 4.832413793103449e-06,
"loss": 0.0242,
"step": 8000
},
{
"epoch": 9.05,
"eval_loss": 0.2432514876127243,
"eval_runtime": 85600.137,
"eval_samples_per_second": 0.603,
"eval_steps_per_second": 0.038,
"eval_wer": 10.438448716920252,
"step": 8000
},
{
"epoch": 10.0,
"learning_rate": 4.763448275862069e-06,
"loss": 0.0146,
"step": 8100
},
{
"epoch": 10.01,
"learning_rate": 4.69448275862069e-06,
"loss": 0.0162,
"step": 8200
},
{
"epoch": 10.02,
"learning_rate": 4.625517241379311e-06,
"loss": 0.0422,
"step": 8300
},
{
"epoch": 10.02,
"learning_rate": 4.556551724137931e-06,
"loss": 0.0466,
"step": 8400
},
{
"epoch": 10.03,
"learning_rate": 4.487586206896552e-06,
"loss": 0.0264,
"step": 8500
},
{
"epoch": 10.04,
"learning_rate": 4.418620689655173e-06,
"loss": 0.0444,
"step": 8600
},
{
"epoch": 10.04,
"learning_rate": 4.349655172413794e-06,
"loss": 0.0785,
"step": 8700
},
{
"epoch": 10.05,
"learning_rate": 4.280689655172414e-06,
"loss": 0.0803,
"step": 8800
},
{
"epoch": 11.0,
"learning_rate": 4.2117241379310345e-06,
"loss": 0.0507,
"step": 8900
},
{
"epoch": 11.01,
"learning_rate": 4.142758620689656e-06,
"loss": 0.0468,
"step": 9000
},
{
"epoch": 11.01,
"eval_loss": 0.22253021597862244,
"eval_runtime": 85229.8997,
"eval_samples_per_second": 0.606,
"eval_steps_per_second": 0.038,
"eval_wer": 10.177159614280239,
"step": 9000
},
{
"epoch": 11.02,
"learning_rate": 4.073793103448276e-06,
"loss": 0.0714,
"step": 9100
},
{
"epoch": 11.02,
"learning_rate": 4.004827586206897e-06,
"loss": 0.0877,
"step": 9200
},
{
"epoch": 11.03,
"learning_rate": 3.9358620689655175e-06,
"loss": 0.0888,
"step": 9300
},
{
"epoch": 11.04,
"learning_rate": 3.867586206896552e-06,
"loss": 0.1097,
"step": 9400
},
{
"epoch": 11.04,
"learning_rate": 3.7986206896551727e-06,
"loss": 0.0995,
"step": 9500
},
{
"epoch": 11.05,
"learning_rate": 3.7296551724137935e-06,
"loss": 0.0074,
"step": 9600
},
{
"epoch": 12.0,
"learning_rate": 3.660689655172414e-06,
"loss": 0.0372,
"step": 9700
},
{
"epoch": 12.01,
"learning_rate": 3.5917241379310345e-06,
"loss": 0.028,
"step": 9800
},
{
"epoch": 12.02,
"learning_rate": 3.5227586206896553e-06,
"loss": 0.0528,
"step": 9900
},
{
"epoch": 12.02,
"learning_rate": 3.4537931034482765e-06,
"loss": 0.007,
"step": 10000
},
{
"epoch": 12.02,
"eval_loss": 0.2621050179004669,
"eval_runtime": 85409.6685,
"eval_samples_per_second": 0.604,
"eval_steps_per_second": 0.038,
"eval_wer": 9.971133411516329,
"step": 10000
},
{
"epoch": 12.03,
"learning_rate": 3.3848275862068968e-06,
"loss": 0.0174,
"step": 10100
},
{
"epoch": 12.04,
"learning_rate": 3.3158620689655175e-06,
"loss": 0.0164,
"step": 10200
},
{
"epoch": 12.04,
"learning_rate": 3.246896551724138e-06,
"loss": 0.0204,
"step": 10300
},
{
"epoch": 12.05,
"learning_rate": 3.177931034482759e-06,
"loss": 0.0057,
"step": 10400
},
{
"epoch": 13.0,
"learning_rate": 3.10896551724138e-06,
"loss": 0.0125,
"step": 10500
},
{
"epoch": 13.01,
"learning_rate": 3.04e-06,
"loss": 0.0346,
"step": 10600
},
{
"epoch": 13.02,
"learning_rate": 2.9717241379310345e-06,
"loss": 0.158,
"step": 10700
},
{
"epoch": 13.02,
"learning_rate": 2.9027586206896553e-06,
"loss": 0.1268,
"step": 10800
},
{
"epoch": 13.03,
"learning_rate": 2.8337931034482765e-06,
"loss": 0.0766,
"step": 10900
},
{
"epoch": 13.04,
"learning_rate": 2.764827586206897e-06,
"loss": 0.0103,
"step": 11000
},
{
"epoch": 13.04,
"eval_loss": 0.21942287683486938,
"eval_runtime": 85416.0012,
"eval_samples_per_second": 0.604,
"eval_steps_per_second": 0.038,
"eval_wer": 9.92351054388116,
"step": 11000
},
{
"epoch": 13.04,
"learning_rate": 2.6958620689655175e-06,
"loss": 0.0304,
"step": 11100
},
{
"epoch": 13.05,
"learning_rate": 2.626896551724138e-06,
"loss": 0.0132,
"step": 11200
},
{
"epoch": 14.0,
"learning_rate": 2.557931034482759e-06,
"loss": 0.0392,
"step": 11300
},
{
"epoch": 14.01,
"learning_rate": 2.4889655172413794e-06,
"loss": 0.0214,
"step": 11400
},
{
"epoch": 14.01,
"learning_rate": 2.42e-06,
"loss": 0.0431,
"step": 11500
},
{
"epoch": 14.02,
"learning_rate": 2.351034482758621e-06,
"loss": 0.0172,
"step": 11600
},
{
"epoch": 14.03,
"learning_rate": 2.2820689655172416e-06,
"loss": 0.0175,
"step": 11700
},
{
"epoch": 14.03,
"learning_rate": 2.2131034482758624e-06,
"loss": 0.0523,
"step": 11800
},
{
"epoch": 14.04,
"learning_rate": 2.1441379310344827e-06,
"loss": 0.089,
"step": 11900
},
{
"epoch": 14.05,
"learning_rate": 2.0758620689655175e-06,
"loss": 0.0571,
"step": 12000
},
{
"epoch": 14.05,
"eval_loss": 0.20878072082996368,
"eval_runtime": 128210.6226,
"eval_samples_per_second": 0.403,
"eval_steps_per_second": 0.025,
"eval_wer": 9.858697603703888,
"step": 12000
},
{
"epoch": 15.0,
"learning_rate": 2.0068965517241383e-06,
"loss": 0.0295,
"step": 12100
},
{
"epoch": 15.01,
"learning_rate": 1.9379310344827586e-06,
"loss": 0.0668,
"step": 12200
},
{
"epoch": 15.01,
"learning_rate": 1.8689655172413796e-06,
"loss": 0.0138,
"step": 12300
},
{
"epoch": 15.02,
"learning_rate": 1.8000000000000001e-06,
"loss": 0.0124,
"step": 12400
},
{
"epoch": 15.03,
"learning_rate": 1.7310344827586209e-06,
"loss": 0.0115,
"step": 12500
},
{
"epoch": 15.03,
"learning_rate": 1.6620689655172414e-06,
"loss": 0.0164,
"step": 12600
},
{
"epoch": 15.04,
"learning_rate": 1.5931034482758622e-06,
"loss": 0.0362,
"step": 12700
},
{
"epoch": 15.05,
"learning_rate": 1.524137931034483e-06,
"loss": 0.0362,
"step": 12800
},
{
"epoch": 16.0,
"learning_rate": 1.4551724137931037e-06,
"loss": 0.0596,
"step": 12900
},
{
"epoch": 16.01,
"learning_rate": 1.3862068965517242e-06,
"loss": 0.04,
"step": 13000
},
{
"epoch": 16.01,
"eval_loss": 0.21550078690052032,
"eval_runtime": 84922.7672,
"eval_samples_per_second": 0.608,
"eval_steps_per_second": 0.038,
"eval_wer": 9.765361876493786,
"step": 13000
},
{
"epoch": 16.01,
"learning_rate": 1.317241379310345e-06,
"loss": 0.0153,
"step": 13100
},
{
"epoch": 16.02,
"learning_rate": 1.2482758620689655e-06,
"loss": 0.015,
"step": 13200
},
{
"epoch": 16.03,
"learning_rate": 1.1793103448275863e-06,
"loss": 0.0159,
"step": 13300
},
{
"epoch": 16.03,
"learning_rate": 1.110344827586207e-06,
"loss": 0.0147,
"step": 13400
},
{
"epoch": 16.04,
"learning_rate": 1.0413793103448275e-06,
"loss": 0.0095,
"step": 13500
},
{
"epoch": 16.05,
"learning_rate": 9.724137931034483e-07,
"loss": 0.0058,
"step": 13600
},
{
"epoch": 17.0,
"learning_rate": 9.034482758620689e-07,
"loss": 0.0056,
"step": 13700
},
{
"epoch": 17.01,
"learning_rate": 8.344827586206897e-07,
"loss": 0.0159,
"step": 13800
},
{
"epoch": 17.01,
"learning_rate": 7.655172413793103e-07,
"loss": 0.0248,
"step": 13900
},
{
"epoch": 17.02,
"learning_rate": 6.965517241379311e-07,
"loss": 0.0191,
"step": 14000
},
{
"epoch": 17.02,
"eval_loss": 0.2494414746761322,
"eval_runtime": 84999.0835,
"eval_samples_per_second": 0.607,
"eval_steps_per_second": 0.038,
"eval_wer": 9.745243124925986,
"step": 14000
},
{
"epoch": 17.03,
"learning_rate": 6.275862068965517e-07,
"loss": 0.0314,
"step": 14100
},
{
"epoch": 17.03,
"learning_rate": 5.586206896551725e-07,
"loss": 0.0353,
"step": 14200
},
{
"epoch": 17.04,
"learning_rate": 4.896551724137931e-07,
"loss": 0.0035,
"step": 14300
},
{
"epoch": 17.05,
"learning_rate": 4.2068965517241383e-07,
"loss": 0.0112,
"step": 14400
},
{
"epoch": 18.0,
"learning_rate": 3.5172413793103453e-07,
"loss": 0.0039,
"step": 14500
},
{
"epoch": 18.01,
"learning_rate": 2.827586206896552e-07,
"loss": 0.0076,
"step": 14600
},
{
"epoch": 18.01,
"learning_rate": 2.1379310344827587e-07,
"loss": 0.0078,
"step": 14700
},
{
"epoch": 18.02,
"learning_rate": 1.4482758620689657e-07,
"loss": 0.0141,
"step": 14800
},
{
"epoch": 18.03,
"learning_rate": 7.586206896551724e-08,
"loss": 0.0125,
"step": 14900
},
{
"epoch": 18.03,
"learning_rate": 6.896551724137931e-09,
"loss": 0.0149,
"step": 15000
},
{
"epoch": 18.03,
"eval_loss": 0.23932012915611267,
"eval_runtime": 85191.5609,
"eval_samples_per_second": 0.606,
"eval_steps_per_second": 0.038,
"eval_wer": 9.615871912312803,
"step": 15000
},
{
"epoch": 18.03,
"step": 15000,
"total_flos": 2.0390255069036544e+21,
"train_loss": 0.006579866043726603,
"train_runtime": 476827.8094,
"train_samples_per_second": 2.013,
"train_steps_per_second": 0.031
}
],
"max_steps": 15000,
"num_train_epochs": 9223372036854775807,
"total_flos": 2.0390255069036544e+21,
"trial_name": null,
"trial_params": null
}