codefactory4791's picture
Training in progress, step 8000
14ef323
raw
history blame
No virus
8.11 kB
{
"best_metric": 27.7224217287947,
"best_model_checkpoint": "codefactory4791/whisper-small-medicalv2/checkpoint-4500",
"epoch": 20.408163265306122,
"global_step": 8000,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.64,
"learning_rate": 4.92e-06,
"loss": 1.5644,
"step": 250
},
{
"epoch": 1.28,
"learning_rate": 9.920000000000002e-06,
"loss": 0.5293,
"step": 500
},
{
"epoch": 1.28,
"eval_loss": 0.48172396421432495,
"eval_runtime": 325.9765,
"eval_samples_per_second": 4.23,
"eval_steps_per_second": 0.135,
"eval_wer": 46.628900915482276,
"step": 500
},
{
"epoch": 1.91,
"learning_rate": 9.742105263157897e-06,
"loss": 0.5005,
"step": 750
},
{
"epoch": 2.55,
"learning_rate": 9.478947368421053e-06,
"loss": 0.4125,
"step": 1000
},
{
"epoch": 2.55,
"eval_loss": 0.5011524558067322,
"eval_runtime": 303.4033,
"eval_samples_per_second": 4.545,
"eval_steps_per_second": 0.145,
"eval_wer": 32.163269435031104,
"step": 1000
},
{
"epoch": 3.19,
"learning_rate": 9.215789473684211e-06,
"loss": 0.3928,
"step": 1250
},
{
"epoch": 3.83,
"learning_rate": 8.95263157894737e-06,
"loss": 0.3263,
"step": 1500
},
{
"epoch": 3.83,
"eval_loss": 0.5298507809638977,
"eval_runtime": 296.4623,
"eval_samples_per_second": 4.652,
"eval_steps_per_second": 0.148,
"eval_wer": 29.558444185928884,
"step": 1500
},
{
"epoch": 4.46,
"learning_rate": 8.689473684210526e-06,
"loss": 0.2629,
"step": 1750
},
{
"epoch": 5.1,
"learning_rate": 8.426315789473684e-06,
"loss": 0.2399,
"step": 2000
},
{
"epoch": 5.1,
"eval_loss": 0.5742943286895752,
"eval_runtime": 290.0311,
"eval_samples_per_second": 4.755,
"eval_steps_per_second": 0.152,
"eval_wer": 28.157402255829243,
"step": 2000
},
{
"epoch": 5.74,
"learning_rate": 8.163157894736842e-06,
"loss": 0.1817,
"step": 2250
},
{
"epoch": 6.38,
"learning_rate": 7.9e-06,
"loss": 0.1563,
"step": 2500
},
{
"epoch": 6.38,
"eval_loss": 0.6200889348983765,
"eval_runtime": 297.5485,
"eval_samples_per_second": 4.635,
"eval_steps_per_second": 0.148,
"eval_wer": 39.52253300288301,
"step": 2500
},
{
"epoch": 7.02,
"learning_rate": 7.636842105263159e-06,
"loss": 0.1411,
"step": 2750
},
{
"epoch": 7.65,
"learning_rate": 7.373684210526316e-06,
"loss": 0.095,
"step": 3000
},
{
"epoch": 7.65,
"eval_loss": 0.6449038982391357,
"eval_runtime": 288.5774,
"eval_samples_per_second": 4.779,
"eval_steps_per_second": 0.152,
"eval_wer": 28.481108694552624,
"step": 3000
},
{
"epoch": 8.29,
"learning_rate": 7.110526315789474e-06,
"loss": 0.0869,
"step": 3250
},
{
"epoch": 8.93,
"learning_rate": 6.8473684210526325e-06,
"loss": 0.0767,
"step": 3500
},
{
"epoch": 8.93,
"eval_loss": 0.671624481678009,
"eval_runtime": 290.9537,
"eval_samples_per_second": 4.74,
"eval_steps_per_second": 0.151,
"eval_wer": 29.841687319811843,
"step": 3500
},
{
"epoch": 9.57,
"learning_rate": 6.58421052631579e-06,
"loss": 0.0598,
"step": 3750
},
{
"epoch": 10.2,
"learning_rate": 6.321052631578948e-06,
"loss": 0.0537,
"step": 4000
},
{
"epoch": 10.2,
"eval_loss": 0.71231609582901,
"eval_runtime": 295.3003,
"eval_samples_per_second": 4.67,
"eval_steps_per_second": 0.149,
"eval_wer": 28.354660866926306,
"step": 4000
},
{
"epoch": 10.84,
"learning_rate": 6.057894736842106e-06,
"loss": 0.0486,
"step": 4250
},
{
"epoch": 11.48,
"learning_rate": 5.794736842105264e-06,
"loss": 0.0406,
"step": 4500
},
{
"epoch": 11.48,
"eval_loss": 0.72938472032547,
"eval_runtime": 288.8463,
"eval_samples_per_second": 4.774,
"eval_steps_per_second": 0.152,
"eval_wer": 27.7224217287947,
"step": 4500
},
{
"epoch": 12.12,
"learning_rate": 5.531578947368421e-06,
"loss": 0.0376,
"step": 4750
},
{
"epoch": 12.76,
"learning_rate": 5.268421052631579e-06,
"loss": 0.0314,
"step": 5000
},
{
"epoch": 12.76,
"eval_loss": 0.7565638422966003,
"eval_runtime": 294.0019,
"eval_samples_per_second": 4.69,
"eval_steps_per_second": 0.15,
"eval_wer": 27.950027818522077,
"step": 5000
},
{
"epoch": 13.39,
"learning_rate": 5.005263157894737e-06,
"loss": 0.0278,
"step": 5250
},
{
"epoch": 14.03,
"learning_rate": 4.7421052631578954e-06,
"loss": 0.026,
"step": 5500
},
{
"epoch": 14.03,
"eval_loss": 0.7726335525512695,
"eval_runtime": 292.0072,
"eval_samples_per_second": 4.722,
"eval_steps_per_second": 0.151,
"eval_wer": 28.106823124778717,
"step": 5500
},
{
"epoch": 14.67,
"learning_rate": 4.478947368421054e-06,
"loss": 0.0222,
"step": 5750
},
{
"epoch": 15.31,
"learning_rate": 4.215789473684211e-06,
"loss": 0.0212,
"step": 6000
},
{
"epoch": 15.31,
"eval_loss": 0.757480263710022,
"eval_runtime": 302.5701,
"eval_samples_per_second": 4.558,
"eval_steps_per_second": 0.145,
"eval_wer": 31.252845076121595,
"step": 6000
},
{
"epoch": 15.94,
"learning_rate": 3.952631578947368e-06,
"loss": 0.0191,
"step": 6250
},
{
"epoch": 16.58,
"learning_rate": 3.6894736842105265e-06,
"loss": 0.016,
"step": 6500
},
{
"epoch": 16.58,
"eval_loss": 0.7838702201843262,
"eval_runtime": 293.8696,
"eval_samples_per_second": 4.693,
"eval_steps_per_second": 0.15,
"eval_wer": 28.34960295382125,
"step": 6500
},
{
"epoch": 17.22,
"learning_rate": 3.4263157894736842e-06,
"loss": 0.0154,
"step": 6750
},
{
"epoch": 17.86,
"learning_rate": 3.1631578947368424e-06,
"loss": 0.0132,
"step": 7000
},
{
"epoch": 17.86,
"eval_loss": 0.7901157140731812,
"eval_runtime": 300.427,
"eval_samples_per_second": 4.59,
"eval_steps_per_second": 0.146,
"eval_wer": 28.98184209195286,
"step": 7000
},
{
"epoch": 18.49,
"learning_rate": 2.9e-06,
"loss": 0.0114,
"step": 7250
},
{
"epoch": 19.13,
"learning_rate": 2.6368421052631584e-06,
"loss": 0.0112,
"step": 7500
},
{
"epoch": 19.13,
"eval_loss": 0.8057935833930969,
"eval_runtime": 299.4809,
"eval_samples_per_second": 4.605,
"eval_steps_per_second": 0.147,
"eval_wer": 29.027363309898334,
"step": 7500
},
{
"epoch": 19.77,
"learning_rate": 2.373684210526316e-06,
"loss": 0.0089,
"step": 7750
},
{
"epoch": 20.41,
"learning_rate": 2.110526315789474e-06,
"loss": 0.0078,
"step": 8000
},
{
"epoch": 20.41,
"eval_loss": 0.8125391006469727,
"eval_runtime": 297.7542,
"eval_samples_per_second": 4.631,
"eval_steps_per_second": 0.148,
"eval_wer": 29.593849577664255,
"step": 8000
}
],
"max_steps": 10000,
"num_train_epochs": 26,
"total_flos": 1.47495998103552e+20,
"trial_name": null,
"trial_params": null
}