covid-policy-roberta-21 / trainer_state.json
MoritzLaurer
from local
e911c39
{
"best_metric": 0.7558827552193487,
"best_model_checkpoint": "./results/coronanet_classi_roberta/checkpoint-3372",
"epoch": 4.0,
"global_step": 3372,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.59,
"learning_rate": 8.92132907519561e-05,
"loss": 1.7123,
"step": 500
},
{
"epoch": 1.0,
"eval_accuracy_balanced": 0.6744778154481599,
"eval_accuracy_not_balanced": 0.7375055613228533,
"eval_f1_macro": 0.6774596453859705,
"eval_f1_weighted": 0.7344846513012891,
"eval_loss": 0.8972207307815552,
"eval_precision": 0.7429861548781078,
"eval_recall": 0.7375055613228533,
"eval_runtime": 29.1161,
"eval_samples_per_second": 231.59,
"step": 843
},
{
"epoch": 1.19,
"learning_rate": 7.368172899151806e-05,
"loss": 0.8779,
"step": 1000
},
{
"epoch": 1.78,
"learning_rate": 5.815016723108002e-05,
"loss": 0.7389,
"step": 1500
},
{
"epoch": 2.0,
"eval_accuracy_balanced": 0.744417109661457,
"eval_accuracy_not_balanced": 0.7655346285036334,
"eval_f1_macro": 0.7393973656051112,
"eval_f1_weighted": 0.7626792308967099,
"eval_loss": 0.8118156790733337,
"eval_precision": 0.7652843843532866,
"eval_recall": 0.7655346285036334,
"eval_runtime": 29.1071,
"eval_samples_per_second": 231.661,
"step": 1686
},
{
"epoch": 2.37,
"learning_rate": 4.261860547064198e-05,
"loss": 0.5835,
"step": 2000
},
{
"epoch": 2.97,
"learning_rate": 2.708704371020394e-05,
"loss": 0.4919,
"step": 2500
},
{
"epoch": 3.0,
"eval_accuracy_balanced": 0.7503794754553327,
"eval_accuracy_not_balanced": 0.773987839240694,
"eval_f1_macro": 0.7470579664348881,
"eval_f1_weighted": 0.7724065863470936,
"eval_loss": 0.7920669913291931,
"eval_precision": 0.7736999040473431,
"eval_recall": 0.773987839240694,
"eval_runtime": 29.1029,
"eval_samples_per_second": 231.695,
"step": 2529
},
{
"epoch": 3.56,
"learning_rate": 1.15554819497659e-05,
"loss": 0.33,
"step": 3000
},
{
"epoch": 4.0,
"eval_accuracy_balanced": 0.7558827552193487,
"eval_accuracy_not_balanced": 0.7773987839240694,
"eval_f1_macro": 0.7509844357682027,
"eval_f1_weighted": 0.7760847284277537,
"eval_loss": 0.853062629699707,
"eval_precision": 0.7759580640894472,
"eval_recall": 0.7773987839240694,
"eval_runtime": 29.115,
"eval_samples_per_second": 231.599,
"step": 3372
}
],
"max_steps": 3372,
"num_train_epochs": 4,
"total_flos": 27219994048880640,
"trial_name": null,
"trial_params": null
}