|
{
|
|
"best_metric": 0.3861003861003861,
|
|
"best_model_checkpoint": "D:\\development\\whisper-finetune\\output_tiny\\checkpoint-1000",
|
|
"epoch": 1000.0,
|
|
"eval_steps": 1000,
|
|
"global_step": 15000,
|
|
"is_hyper_param_search": false,
|
|
"is_local_process_zero": true,
|
|
"is_world_process_zero": true,
|
|
"log_history": [
|
|
{
|
|
"epoch": 33.33,
|
|
"learning_rate": 9.88e-06,
|
|
"loss": 0.8261,
|
|
"step": 500
|
|
},
|
|
{
|
|
"epoch": 66.67,
|
|
"learning_rate": 9.659310344827587e-06,
|
|
"loss": 0.0028,
|
|
"step": 1000
|
|
},
|
|
{
|
|
"epoch": 66.67,
|
|
"eval_loss": 0.002442890079692006,
|
|
"eval_runtime": 21.9145,
|
|
"eval_samples_per_second": 5.339,
|
|
"eval_steps_per_second": 0.684,
|
|
"eval_wer": 0.3861003861003861,
|
|
"step": 1000
|
|
},
|
|
{
|
|
"epoch": 100.0,
|
|
"learning_rate": 9.314482758620691e-06,
|
|
"loss": 0.0016,
|
|
"step": 1500
|
|
},
|
|
{
|
|
"epoch": 133.33,
|
|
"learning_rate": 8.969655172413794e-06,
|
|
"loss": 0.0014,
|
|
"step": 2000
|
|
},
|
|
{
|
|
"epoch": 133.33,
|
|
"eval_loss": 0.0016565920086577535,
|
|
"eval_runtime": 21.8481,
|
|
"eval_samples_per_second": 5.355,
|
|
"eval_steps_per_second": 0.687,
|
|
"eval_wer": 0.3861003861003861,
|
|
"step": 2000
|
|
},
|
|
{
|
|
"epoch": 166.67,
|
|
"learning_rate": 8.624827586206898e-06,
|
|
"loss": 0.0014,
|
|
"step": 2500
|
|
},
|
|
{
|
|
"epoch": 200.0,
|
|
"learning_rate": 8.28e-06,
|
|
"loss": 0.0012,
|
|
"step": 3000
|
|
},
|
|
{
|
|
"epoch": 200.0,
|
|
"eval_loss": 0.0012075488921254873,
|
|
"eval_runtime": 21.8068,
|
|
"eval_samples_per_second": 5.365,
|
|
"eval_steps_per_second": 0.688,
|
|
"eval_wer": 0.3861003861003861,
|
|
"step": 3000
|
|
},
|
|
{
|
|
"epoch": 233.33,
|
|
"learning_rate": 7.935172413793105e-06,
|
|
"loss": 0.0012,
|
|
"step": 3500
|
|
},
|
|
{
|
|
"epoch": 266.67,
|
|
"learning_rate": 7.590344827586208e-06,
|
|
"loss": 0.0011,
|
|
"step": 4000
|
|
},
|
|
{
|
|
"epoch": 266.67,
|
|
"eval_loss": 0.0011881846003234386,
|
|
"eval_runtime": 22.3448,
|
|
"eval_samples_per_second": 5.236,
|
|
"eval_steps_per_second": 0.671,
|
|
"eval_wer": 0.3861003861003861,
|
|
"step": 4000
|
|
},
|
|
{
|
|
"epoch": 300.0,
|
|
"learning_rate": 7.2468965517241385e-06,
|
|
"loss": 0.0013,
|
|
"step": 4500
|
|
},
|
|
{
|
|
"epoch": 333.33,
|
|
"learning_rate": 6.902068965517243e-06,
|
|
"loss": 0.0011,
|
|
"step": 5000
|
|
},
|
|
{
|
|
"epoch": 333.33,
|
|
"eval_loss": 0.0012107096845284104,
|
|
"eval_runtime": 21.9233,
|
|
"eval_samples_per_second": 5.337,
|
|
"eval_steps_per_second": 0.684,
|
|
"eval_wer": 0.3861003861003861,
|
|
"step": 5000
|
|
},
|
|
{
|
|
"epoch": 366.67,
|
|
"learning_rate": 6.557241379310345e-06,
|
|
"loss": 0.0011,
|
|
"step": 5500
|
|
},
|
|
{
|
|
"epoch": 400.0,
|
|
"learning_rate": 6.2124137931034485e-06,
|
|
"loss": 0.0011,
|
|
"step": 6000
|
|
},
|
|
{
|
|
"epoch": 400.0,
|
|
"eval_loss": 0.0011809396091848612,
|
|
"eval_runtime": 21.8718,
|
|
"eval_samples_per_second": 5.349,
|
|
"eval_steps_per_second": 0.686,
|
|
"eval_wer": 0.3861003861003861,
|
|
"step": 6000
|
|
},
|
|
{
|
|
"epoch": 433.33,
|
|
"learning_rate": 5.868275862068966e-06,
|
|
"loss": 0.0011,
|
|
"step": 6500
|
|
},
|
|
{
|
|
"epoch": 466.67,
|
|
"learning_rate": 5.523448275862069e-06,
|
|
"loss": 0.001,
|
|
"step": 7000
|
|
},
|
|
{
|
|
"epoch": 466.67,
|
|
"eval_loss": 0.0011794030433520675,
|
|
"eval_runtime": 21.8283,
|
|
"eval_samples_per_second": 5.36,
|
|
"eval_steps_per_second": 0.687,
|
|
"eval_wer": 0.3861003861003861,
|
|
"step": 7000
|
|
},
|
|
{
|
|
"epoch": 500.0,
|
|
"learning_rate": 5.178620689655173e-06,
|
|
"loss": 0.001,
|
|
"step": 7500
|
|
},
|
|
{
|
|
"epoch": 533.33,
|
|
"learning_rate": 4.833793103448276e-06,
|
|
"loss": 0.001,
|
|
"step": 8000
|
|
},
|
|
{
|
|
"epoch": 533.33,
|
|
"eval_loss": 0.0011808406561613083,
|
|
"eval_runtime": 21.7413,
|
|
"eval_samples_per_second": 5.381,
|
|
"eval_steps_per_second": 0.69,
|
|
"eval_wer": 0.3861003861003861,
|
|
"step": 8000
|
|
},
|
|
{
|
|
"epoch": 566.67,
|
|
"learning_rate": 4.489655172413793e-06,
|
|
"loss": 0.001,
|
|
"step": 8500
|
|
},
|
|
{
|
|
"epoch": 600.0,
|
|
"learning_rate": 4.144827586206897e-06,
|
|
"loss": 0.001,
|
|
"step": 9000
|
|
},
|
|
{
|
|
"epoch": 600.0,
|
|
"eval_loss": 0.00120567309204489,
|
|
"eval_runtime": 21.8405,
|
|
"eval_samples_per_second": 5.357,
|
|
"eval_steps_per_second": 0.687,
|
|
"eval_wer": 0.3861003861003861,
|
|
"step": 9000
|
|
},
|
|
{
|
|
"epoch": 633.33,
|
|
"learning_rate": 3.8000000000000005e-06,
|
|
"loss": 0.001,
|
|
"step": 9500
|
|
},
|
|
{
|
|
"epoch": 666.67,
|
|
"learning_rate": 3.455172413793104e-06,
|
|
"loss": 0.001,
|
|
"step": 10000
|
|
},
|
|
{
|
|
"epoch": 666.67,
|
|
"eval_loss": 0.0011991177452728152,
|
|
"eval_runtime": 21.7109,
|
|
"eval_samples_per_second": 5.389,
|
|
"eval_steps_per_second": 0.691,
|
|
"eval_wer": 0.3861003861003861,
|
|
"step": 10000
|
|
},
|
|
{
|
|
"epoch": 700.0,
|
|
"learning_rate": 3.111034482758621e-06,
|
|
"loss": 0.001,
|
|
"step": 10500
|
|
},
|
|
{
|
|
"epoch": 733.33,
|
|
"learning_rate": 2.766206896551724e-06,
|
|
"loss": 0.001,
|
|
"step": 11000
|
|
},
|
|
{
|
|
"epoch": 733.33,
|
|
"eval_loss": 0.0011818531202152371,
|
|
"eval_runtime": 21.7427,
|
|
"eval_samples_per_second": 5.381,
|
|
"eval_steps_per_second": 0.69,
|
|
"eval_wer": 0.3861003861003861,
|
|
"step": 11000
|
|
},
|
|
{
|
|
"epoch": 766.67,
|
|
"learning_rate": 2.4220689655172416e-06,
|
|
"loss": 0.0009,
|
|
"step": 11500
|
|
},
|
|
{
|
|
"epoch": 800.0,
|
|
"learning_rate": 2.077931034482759e-06,
|
|
"loss": 0.001,
|
|
"step": 12000
|
|
},
|
|
{
|
|
"epoch": 800.0,
|
|
"eval_loss": 0.0011808592826128006,
|
|
"eval_runtime": 21.9404,
|
|
"eval_samples_per_second": 5.333,
|
|
"eval_steps_per_second": 0.684,
|
|
"eval_wer": 0.3861003861003861,
|
|
"step": 12000
|
|
},
|
|
{
|
|
"epoch": 833.33,
|
|
"learning_rate": 1.733103448275862e-06,
|
|
"loss": 0.0009,
|
|
"step": 12500
|
|
},
|
|
{
|
|
"epoch": 866.67,
|
|
"learning_rate": 1.3882758620689656e-06,
|
|
"loss": 0.0009,
|
|
"step": 13000
|
|
},
|
|
{
|
|
"epoch": 866.67,
|
|
"eval_loss": 0.0012090284144505858,
|
|
"eval_runtime": 21.6103,
|
|
"eval_samples_per_second": 5.414,
|
|
"eval_steps_per_second": 0.694,
|
|
"eval_wer": 0.3861003861003861,
|
|
"step": 13000
|
|
},
|
|
{
|
|
"epoch": 900.0,
|
|
"learning_rate": 1.043448275862069e-06,
|
|
"loss": 0.0009,
|
|
"step": 13500
|
|
},
|
|
{
|
|
"epoch": 933.33,
|
|
"learning_rate": 6.993103448275862e-07,
|
|
"loss": 0.0009,
|
|
"step": 14000
|
|
},
|
|
{
|
|
"epoch": 933.33,
|
|
"eval_loss": 0.0012141974875703454,
|
|
"eval_runtime": 21.6816,
|
|
"eval_samples_per_second": 5.396,
|
|
"eval_steps_per_second": 0.692,
|
|
"eval_wer": 0.3861003861003861,
|
|
"step": 14000
|
|
},
|
|
{
|
|
"epoch": 966.67,
|
|
"learning_rate": 3.558620689655173e-07,
|
|
"loss": 0.0009,
|
|
"step": 14500
|
|
},
|
|
{
|
|
"epoch": 1000.0,
|
|
"learning_rate": 1.1034482758620692e-08,
|
|
"loss": 0.0009,
|
|
"step": 15000
|
|
},
|
|
{
|
|
"epoch": 1000.0,
|
|
"eval_loss": 0.0012086295755580068,
|
|
"eval_runtime": 22.0752,
|
|
"eval_samples_per_second": 5.3,
|
|
"eval_steps_per_second": 0.679,
|
|
"eval_wer": 0.3861003861003861,
|
|
"step": 15000
|
|
}
|
|
],
|
|
"logging_steps": 500,
|
|
"max_steps": 15000,
|
|
"num_input_tokens_seen": 0,
|
|
"num_train_epochs": 1000,
|
|
"save_steps": 1000,
|
|
"total_flos": 2.88040955904e+18,
|
|
"train_batch_size": 8,
|
|
"trial_name": null,
|
|
"trial_params": null
|
|
}
|
|
|