guvitncpl195manojtharu143 / trainer_state.json
tharumanoj143's picture
Upload 8 files
2cdc596 verified
raw
history blame
2.28 kB
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 20.337552742616033,
"global_step": 2400,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 3.39,
"learning_rate": 0.00023999999999999998,
"loss": 6.3317,
"step": 400
},
{
"epoch": 3.39,
"eval_loss": 3.161163806915283,
"eval_runtime": 205.0119,
"eval_samples_per_second": 8.687,
"eval_wer": 1.0,
"step": 400
},
{
"epoch": 6.78,
"learning_rate": 0.0002703947368421052,
"loss": 1.6739,
"step": 800
},
{
"epoch": 6.78,
"eval_loss": 0.6274727582931519,
"eval_runtime": 205.8605,
"eval_samples_per_second": 8.651,
"eval_wer": 1.008992553042012,
"step": 800
},
{
"epoch": 10.17,
"learning_rate": 0.00023092105263157893,
"loss": 0.3726,
"step": 1200
},
{
"epoch": 10.17,
"eval_loss": 0.6007506847381592,
"eval_runtime": 208.514,
"eval_samples_per_second": 8.541,
"eval_wer": 0.9197695658282984,
"step": 1200
},
{
"epoch": 13.56,
"learning_rate": 0.00019144736842105262,
"loss": 0.2323,
"step": 1600
},
{
"epoch": 13.56,
"eval_loss": 0.62809157371521,
"eval_runtime": 207.5386,
"eval_samples_per_second": 8.582,
"eval_wer": 0.9513840101166222,
"step": 1600
},
{
"epoch": 16.95,
"learning_rate": 0.00015197368421052628,
"loss": 0.1598,
"step": 2000
},
{
"epoch": 16.95,
"eval_loss": 0.679410994052887,
"eval_runtime": 213.3742,
"eval_samples_per_second": 8.347,
"eval_wer": 0.8642686525221301,
"step": 2000
},
{
"epoch": 20.34,
"learning_rate": 0.0001125,
"loss": 0.1258,
"step": 2400
},
{
"epoch": 20.34,
"eval_loss": 0.7365503311157227,
"eval_runtime": 210.0426,
"eval_samples_per_second": 8.479,
"eval_wer": 0.8294225094843333,
"step": 2400
}
],
"max_steps": 3540,
"num_train_epochs": 30,
"total_flos": 1.022364819420586e+19,
"trial_name": null,
"trial_params": null
}