whisper-large-v2-he-1 / trainer_state.json
Shiry's picture
End of training
2afbf55
{
"best_metric": 27.250397341424648,
"best_model_checkpoint": "./checkpoint-50",
"epoch": 99.01,
"global_step": 200,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 12.01,
"learning_rate": 9.210526315789473e-07,
"loss": 0.752,
"step": 25
},
{
"epoch": 24.01,
"learning_rate": 7.947368421052631e-07,
"loss": 0.425,
"step": 50
},
{
"epoch": 24.01,
"eval_loss": 0.4105507731437683,
"eval_runtime": 786.9933,
"eval_samples_per_second": 1.006,
"eval_steps_per_second": 0.032,
"eval_wer": 27.250397341424648,
"step": 50
},
{
"epoch": 37.01,
"learning_rate": 6.63157894736842e-07,
"loss": 0.2879,
"step": 75
},
{
"epoch": 49.01,
"learning_rate": 5.31578947368421e-07,
"loss": 0.1906,
"step": 100
},
{
"epoch": 49.01,
"eval_loss": 0.44195765256881714,
"eval_runtime": 813.6355,
"eval_samples_per_second": 0.973,
"eval_steps_per_second": 0.031,
"eval_wer": 29.013148388961135,
"step": 100
},
{
"epoch": 62.01,
"learning_rate": 4e-07,
"loss": 0.1347,
"step": 125
},
{
"epoch": 74.01,
"learning_rate": 2.684210526315789e-07,
"loss": 0.0982,
"step": 150
},
{
"epoch": 74.01,
"eval_loss": 0.4795360267162323,
"eval_runtime": 848.8397,
"eval_samples_per_second": 0.933,
"eval_steps_per_second": 0.029,
"eval_wer": 30.306314116457163,
"step": 150
},
{
"epoch": 87.0,
"learning_rate": 1.368421052631579e-07,
"loss": 0.0829,
"step": 175
},
{
"epoch": 99.01,
"learning_rate": 5.263157894736842e-09,
"loss": 0.0717,
"step": 200
},
{
"epoch": 99.01,
"eval_loss": 0.4944527745246887,
"eval_runtime": 875.6338,
"eval_samples_per_second": 0.904,
"eval_steps_per_second": 0.029,
"eval_wer": 30.891489669122958,
"step": 200
},
{
"epoch": 99.01,
"step": 200,
"total_flos": 1.387640884064256e+20,
"train_loss": 0.25535590410232545,
"train_runtime": 48457.1181,
"train_samples_per_second": 2.113,
"train_steps_per_second": 0.004
}
],
"max_steps": 200,
"num_train_epochs": 9223372036854775807,
"total_flos": 1.387640884064256e+20,
"trial_name": null,
"trial_params": null
}