longformer-simple / checkpoint-41 /trainer_state.json
Theoreticallyhugo's picture
Training in progress, epoch 1, checkpoint
7bfcc3d verified
{
"best_metric": 0.5843302011489868,
"best_model_checkpoint": "longformer-simple/checkpoint-41",
"epoch": 1.0,
"eval_steps": 500,
"global_step": 41,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_Claim": {
"f1-score": 0.21931818181818183,
"precision": 0.48984771573604063,
"recall": 0.14128843338213762,
"support": 4098.0
},
"eval_MajorClaim": {
"f1-score": 0.5428571428571428,
"precision": 0.5396243701328447,
"recall": 0.5461288827074641,
"support": 2157.0
},
"eval_O": {
"f1-score": 0.8746832169640548,
"precision": 0.8916069169126951,
"recall": 0.858390011166379,
"support": 9851.0
},
"eval_Premise": {
"f1-score": 0.8596746372645179,
"precision": 0.7743724104313917,
"recall": 0.9660965412390726,
"support": 13155.0
},
"eval_accuracy": 0.7833635214107515,
"eval_loss": 0.5843302011489868,
"eval_macro avg": {
"f1-score": 0.6241332947259743,
"precision": 0.673862853303243,
"recall": 0.6279759671237634,
"support": 29261.0
},
"eval_runtime": 1.4428,
"eval_samples_per_second": 55.446,
"eval_steps_per_second": 6.931,
"eval_weighted avg": {
"f1-score": 0.7516910901801511,
"precision": 0.7566882370115429,
"recall": 0.7833635214107515,
"support": 29261.0
},
"step": 41
}
],
"logging_steps": 500,
"max_steps": 205,
"num_input_tokens_seen": 0,
"num_train_epochs": 5,
"save_steps": 500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": false
},
"attributes": {}
}
},
"total_flos": 143788732726800.0,
"train_batch_size": 8,
"trial_name": null,
"trial_params": null
}