mfact-mad-x / trainer_state.json
Yifu Qiu
mfact-mad-x-v1
49ce16d
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 9.999908653156034,
"global_step": 95780,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"learning_rate": 9.048181989924434e-05,
"loss": 3.734,
"step": 9578
},
{
"epoch": 2.0,
"learning_rate": 8.043939546599497e-05,
"loss": 3.5549,
"step": 19156
},
{
"epoch": 3.0,
"learning_rate": 7.03969710327456e-05,
"loss": 3.5027,
"step": 28734
},
{
"epoch": 4.0,
"learning_rate": 6.0354546599496234e-05,
"loss": 3.4695,
"step": 38312
},
{
"epoch": 5.0,
"learning_rate": 5.0312122166246854e-05,
"loss": 3.4447,
"step": 47890
},
{
"epoch": 6.0,
"learning_rate": 4.026969773299749e-05,
"loss": 3.4219,
"step": 57468
},
{
"epoch": 7.0,
"learning_rate": 3.0227273299748105e-05,
"loss": 3.3985,
"step": 67046
},
{
"epoch": 8.0,
"learning_rate": 2.0184848866498742e-05,
"loss": 3.3824,
"step": 76624
},
{
"epoch": 9.0,
"learning_rate": 1.0142424433249365e-05,
"loss": 3.3701,
"step": 86202
},
{
"epoch": 10.0,
"learning_rate": 9.999999999999998e-08,
"loss": 3.3609,
"step": 95780
},
{
"epoch": 10.0,
"step": 95780,
"total_flos": 5.86608789194907e+18,
"train_loss": 3.463967107237941,
"train_runtime": 128255.8433,
"train_samples_per_second": 23.899,
"train_steps_per_second": 0.747
}
],
"max_steps": 95780,
"num_train_epochs": 10,
"total_flos": 5.86608789194907e+18,
"trial_name": null,
"trial_params": null
}