B1_1000_1e-4_hp-mehrdad / trainer_state.json
lnxdx's picture
End of training
9bea35d
raw
history blame
No virus
4.28 kB
{
"best_metric": 0.2908878504672897,
"best_model_checkpoint": "/content/drive/MyDrive/wav2vec2-large-xlsr-persian-asr-shemo_sm74/checkpoint-900",
"epoch": 6.25,
"eval_steps": 100,
"global_step": 1000,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.62,
"learning_rate": 1.9800000000000004e-05,
"loss": 0.7626,
"step": 100
},
{
"epoch": 0.62,
"eval_loss": 0.6772463321685791,
"eval_runtime": 36.0706,
"eval_samples_per_second": 7.873,
"eval_steps_per_second": 0.998,
"eval_wer": 0.321553738317757,
"step": 100
},
{
"epoch": 1.25,
"learning_rate": 3.9800000000000005e-05,
"loss": 0.7702,
"step": 200
},
{
"epoch": 1.25,
"eval_loss": 0.6705306768417358,
"eval_runtime": 35.9659,
"eval_samples_per_second": 7.896,
"eval_steps_per_second": 1.001,
"eval_wer": 0.3177570093457944,
"step": 200
},
{
"epoch": 1.88,
"learning_rate": 5.9800000000000003e-05,
"loss": 0.7605,
"step": 300
},
{
"epoch": 1.88,
"eval_loss": 0.6425135731697083,
"eval_runtime": 36.0164,
"eval_samples_per_second": 7.885,
"eval_steps_per_second": 1.0,
"eval_wer": 0.317464953271028,
"step": 300
},
{
"epoch": 2.5,
"learning_rate": 7.98e-05,
"loss": 0.6617,
"step": 400
},
{
"epoch": 2.5,
"eval_loss": 0.7112990617752075,
"eval_runtime": 35.9864,
"eval_samples_per_second": 7.892,
"eval_steps_per_second": 1.0,
"eval_wer": 0.3028621495327103,
"step": 400
},
{
"epoch": 3.12,
"learning_rate": 9.98e-05,
"loss": 0.661,
"step": 500
},
{
"epoch": 3.12,
"eval_loss": 0.7172772288322449,
"eval_runtime": 35.6659,
"eval_samples_per_second": 7.963,
"eval_steps_per_second": 1.009,
"eval_wer": 0.3019859813084112,
"step": 500
},
{
"epoch": 3.75,
"learning_rate": 8.020000000000001e-05,
"loss": 0.6037,
"step": 600
},
{
"epoch": 3.75,
"eval_loss": 0.683303713798523,
"eval_runtime": 36.0387,
"eval_samples_per_second": 7.88,
"eval_steps_per_second": 0.999,
"eval_wer": 0.347838785046729,
"step": 600
},
{
"epoch": 4.38,
"learning_rate": 6.02e-05,
"loss": 0.5343,
"step": 700
},
{
"epoch": 4.38,
"eval_loss": 0.8271604180335999,
"eval_runtime": 35.168,
"eval_samples_per_second": 8.076,
"eval_steps_per_second": 1.024,
"eval_wer": 0.29585280373831774,
"step": 700
},
{
"epoch": 5.0,
"learning_rate": 4.02e-05,
"loss": 0.5096,
"step": 800
},
{
"epoch": 5.0,
"eval_loss": 0.8571420311927795,
"eval_runtime": 35.4406,
"eval_samples_per_second": 8.013,
"eval_steps_per_second": 1.016,
"eval_wer": 0.2973130841121495,
"step": 800
},
{
"epoch": 5.62,
"learning_rate": 2.0200000000000003e-05,
"loss": 0.4471,
"step": 900
},
{
"epoch": 5.62,
"eval_loss": 0.9498320817947388,
"eval_runtime": 37.0202,
"eval_samples_per_second": 7.671,
"eval_steps_per_second": 0.972,
"eval_wer": 0.2908878504672897,
"step": 900
},
{
"epoch": 6.25,
"learning_rate": 2.0000000000000002e-07,
"loss": 0.4393,
"step": 1000
},
{
"epoch": 6.25,
"eval_loss": 0.9137212038040161,
"eval_runtime": 36.1327,
"eval_samples_per_second": 7.86,
"eval_steps_per_second": 0.996,
"eval_wer": 0.2932242990654206,
"step": 1000
},
{
"epoch": 6.25,
"step": 1000,
"total_flos": 4.798362622332561e+18,
"train_loss": 0.6149942665100098,
"train_runtime": 5145.8365,
"train_samples_per_second": 3.109,
"train_steps_per_second": 0.194
}
],
"logging_steps": 100,
"max_steps": 1000,
"num_train_epochs": 7,
"save_steps": 100,
"total_flos": 4.798362622332561e+18,
"trial_name": null,
"trial_params": null
}