|
{ |
|
"best_metric": 10.718358038768528, |
|
"best_model_checkpoint": "../whisper-NST-cons2e5/checkpoint-6000", |
|
"epoch": 1.0, |
|
"global_step": 10000, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.03, |
|
"learning_rate": 9.88e-06, |
|
"loss": 1.2287, |
|
"step": 250 |
|
}, |
|
{ |
|
"epoch": 0.05, |
|
"learning_rate": 1.9880000000000003e-05, |
|
"loss": 0.2979, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 0.07, |
|
"learning_rate": 2e-05, |
|
"loss": 0.2728, |
|
"step": 750 |
|
}, |
|
{ |
|
"epoch": 0.1, |
|
"learning_rate": 2e-05, |
|
"loss": 0.2517, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 0.1, |
|
"eval_loss": 0.4131389260292053, |
|
"eval_runtime": 51.3583, |
|
"eval_samples_per_second": 1.947, |
|
"eval_steps_per_second": 0.136, |
|
"eval_wer": 18.47206385404789, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 0.12, |
|
"learning_rate": 2e-05, |
|
"loss": 0.2254, |
|
"step": 1250 |
|
}, |
|
{ |
|
"epoch": 0.15, |
|
"learning_rate": 2e-05, |
|
"loss": 0.2115, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 0.17, |
|
"learning_rate": 2e-05, |
|
"loss": 0.2018, |
|
"step": 1750 |
|
}, |
|
{ |
|
"epoch": 0.2, |
|
"learning_rate": 2e-05, |
|
"loss": 0.1931, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 0.2, |
|
"eval_loss": 0.3531236946582794, |
|
"eval_runtime": 74.7257, |
|
"eval_samples_per_second": 1.338, |
|
"eval_steps_per_second": 0.094, |
|
"eval_wer": 19.04218928164196, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 0.23, |
|
"learning_rate": 2e-05, |
|
"loss": 0.1786, |
|
"step": 2250 |
|
}, |
|
{ |
|
"epoch": 0.25, |
|
"learning_rate": 2e-05, |
|
"loss": 0.1746, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 0.28, |
|
"learning_rate": 2e-05, |
|
"loss": 0.1726, |
|
"step": 2750 |
|
}, |
|
{ |
|
"epoch": 0.3, |
|
"learning_rate": 2e-05, |
|
"loss": 0.1598, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 0.3, |
|
"eval_loss": 0.3605496883392334, |
|
"eval_runtime": 59.9526, |
|
"eval_samples_per_second": 1.668, |
|
"eval_steps_per_second": 0.117, |
|
"eval_wer": 16.875712656784494, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 0.33, |
|
"learning_rate": 2e-05, |
|
"loss": 0.1636, |
|
"step": 3250 |
|
}, |
|
{ |
|
"epoch": 0.35, |
|
"learning_rate": 2e-05, |
|
"loss": 0.158, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 0.38, |
|
"learning_rate": 2e-05, |
|
"loss": 0.1494, |
|
"step": 3750 |
|
}, |
|
{ |
|
"epoch": 0.4, |
|
"learning_rate": 2e-05, |
|
"loss": 0.1541, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 0.4, |
|
"eval_loss": 0.33670979738235474, |
|
"eval_runtime": 50.4438, |
|
"eval_samples_per_second": 1.982, |
|
"eval_steps_per_second": 0.139, |
|
"eval_wer": 14.481185860889395, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 0.42, |
|
"learning_rate": 2e-05, |
|
"loss": 0.1498, |
|
"step": 4250 |
|
}, |
|
{ |
|
"epoch": 0.45, |
|
"learning_rate": 2e-05, |
|
"loss": 0.1486, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 0.47, |
|
"learning_rate": 2e-05, |
|
"loss": 0.1471, |
|
"step": 4750 |
|
}, |
|
{ |
|
"epoch": 0.5, |
|
"learning_rate": 2e-05, |
|
"loss": 0.1443, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 0.5, |
|
"eval_loss": 0.3274496793746948, |
|
"eval_runtime": 55.4869, |
|
"eval_samples_per_second": 1.802, |
|
"eval_steps_per_second": 0.126, |
|
"eval_wer": 13.340935005701255, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 0.53, |
|
"learning_rate": 2e-05, |
|
"loss": 0.1337, |
|
"step": 5250 |
|
}, |
|
{ |
|
"epoch": 0.55, |
|
"learning_rate": 2e-05, |
|
"loss": 0.1358, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 0.57, |
|
"learning_rate": 2e-05, |
|
"loss": 0.1232, |
|
"step": 5750 |
|
}, |
|
{ |
|
"epoch": 0.6, |
|
"learning_rate": 2e-05, |
|
"loss": 0.1301, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 0.6, |
|
"eval_loss": 0.34810879826545715, |
|
"eval_runtime": 52.0858, |
|
"eval_samples_per_second": 1.92, |
|
"eval_steps_per_second": 0.134, |
|
"eval_wer": 10.718358038768528, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 0.62, |
|
"learning_rate": 2e-05, |
|
"loss": 0.1308, |
|
"step": 6250 |
|
}, |
|
{ |
|
"epoch": 0.65, |
|
"learning_rate": 2e-05, |
|
"loss": 0.121, |
|
"step": 6500 |
|
}, |
|
{ |
|
"epoch": 0.68, |
|
"learning_rate": 2e-05, |
|
"loss": 0.1343, |
|
"step": 6750 |
|
}, |
|
{ |
|
"epoch": 0.7, |
|
"learning_rate": 2e-05, |
|
"loss": 0.1266, |
|
"step": 7000 |
|
}, |
|
{ |
|
"epoch": 0.7, |
|
"eval_loss": 0.3451653718948364, |
|
"eval_runtime": 52.2228, |
|
"eval_samples_per_second": 1.915, |
|
"eval_steps_per_second": 0.134, |
|
"eval_wer": 12.998859749144811, |
|
"step": 7000 |
|
}, |
|
{ |
|
"epoch": 0.72, |
|
"learning_rate": 2e-05, |
|
"loss": 0.1223, |
|
"step": 7250 |
|
}, |
|
{ |
|
"epoch": 0.75, |
|
"learning_rate": 2e-05, |
|
"loss": 0.1264, |
|
"step": 7500 |
|
}, |
|
{ |
|
"epoch": 0.78, |
|
"learning_rate": 2e-05, |
|
"loss": 0.119, |
|
"step": 7750 |
|
}, |
|
{ |
|
"epoch": 0.8, |
|
"learning_rate": 2e-05, |
|
"loss": 0.1216, |
|
"step": 8000 |
|
}, |
|
{ |
|
"epoch": 0.8, |
|
"eval_loss": 0.32154810428619385, |
|
"eval_runtime": 82.8333, |
|
"eval_samples_per_second": 1.207, |
|
"eval_steps_per_second": 0.085, |
|
"eval_wer": 10.832383124287343, |
|
"step": 8000 |
|
}, |
|
{ |
|
"epoch": 0.82, |
|
"learning_rate": 2e-05, |
|
"loss": 0.1242, |
|
"step": 8250 |
|
}, |
|
{ |
|
"epoch": 0.85, |
|
"learning_rate": 2e-05, |
|
"loss": 0.1217, |
|
"step": 8500 |
|
}, |
|
{ |
|
"epoch": 0.88, |
|
"learning_rate": 2e-05, |
|
"loss": 0.1245, |
|
"step": 8750 |
|
}, |
|
{ |
|
"epoch": 0.9, |
|
"learning_rate": 2e-05, |
|
"loss": 0.1121, |
|
"step": 9000 |
|
}, |
|
{ |
|
"epoch": 0.9, |
|
"eval_loss": 0.31604325771331787, |
|
"eval_runtime": 50.7948, |
|
"eval_samples_per_second": 1.969, |
|
"eval_steps_per_second": 0.138, |
|
"eval_wer": 11.516533637400228, |
|
"step": 9000 |
|
}, |
|
{ |
|
"epoch": 0.93, |
|
"learning_rate": 2e-05, |
|
"loss": 0.1161, |
|
"step": 9250 |
|
}, |
|
{ |
|
"epoch": 0.95, |
|
"learning_rate": 2e-05, |
|
"loss": 0.112, |
|
"step": 9500 |
|
}, |
|
{ |
|
"epoch": 0.97, |
|
"learning_rate": 2e-05, |
|
"loss": 0.1167, |
|
"step": 9750 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"learning_rate": 2e-05, |
|
"loss": 0.1171, |
|
"step": 10000 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_loss": 0.3520647883415222, |
|
"eval_runtime": 84.9296, |
|
"eval_samples_per_second": 1.177, |
|
"eval_steps_per_second": 0.082, |
|
"eval_wer": 11.85860889395667, |
|
"step": 10000 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"step": 10000, |
|
"total_flos": 4.61736640512e+19, |
|
"train_loss": 0.18131806907653808, |
|
"train_runtime": 89475.4174, |
|
"train_samples_per_second": 3.576, |
|
"train_steps_per_second": 0.112 |
|
} |
|
], |
|
"max_steps": 10000, |
|
"num_train_epochs": 9223372036854775807, |
|
"total_flos": 4.61736640512e+19, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|