MSLacerda's picture
MSLacerda/attribute_minig_mslacerda
2803ec7 verified
raw
history blame contribute delete
No virus
5.01 kB
{
"best_metric": 0.6368208527565002,
"best_model_checkpoint": "../experiments/attribute_minig_mslacerda/run-1/checkpoint-473",
"epoch": 11.0,
"eval_steps": 500,
"global_step": 473,
"is_hyper_param_search": true,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_accuracy": 0.03543543543543543,
"eval_f1": 0.004940711462450594,
"eval_loss": 4.673229217529297,
"eval_precision": 0.004108463434675432,
"eval_recall": 0.006195786864931847,
"eval_runtime": 0.3918,
"eval_samples_per_second": 742.66,
"eval_steps_per_second": 94.428,
"step": 43
},
{
"epoch": 2.0,
"eval_accuracy": 0.12612612612612611,
"eval_f1": 0.019381056580181303,
"eval_loss": 4.209076881408691,
"eval_precision": 0.019558359621451103,
"eval_recall": 0.019206939281288724,
"eval_runtime": 0.3924,
"eval_samples_per_second": 741.507,
"eval_steps_per_second": 94.281,
"step": 86
},
{
"epoch": 3.0,
"eval_accuracy": 0.3282282282282282,
"eval_f1": 0.10037453183520599,
"eval_loss": 3.259751319885254,
"eval_precision": 0.1268939393939394,
"eval_recall": 0.08302354399008674,
"eval_runtime": 0.4015,
"eval_samples_per_second": 724.86,
"eval_steps_per_second": 92.164,
"step": 129
},
{
"epoch": 4.0,
"eval_accuracy": 0.4903903903903904,
"eval_f1": 0.2385254788579689,
"eval_loss": 2.3082196712493896,
"eval_precision": 0.2862098872506505,
"eval_recall": 0.20446096654275092,
"eval_runtime": 0.3924,
"eval_samples_per_second": 741.662,
"eval_steps_per_second": 94.301,
"step": 172
},
{
"epoch": 5.0,
"eval_accuracy": 0.5990990990990991,
"eval_f1": 0.3480905711388983,
"eval_loss": 1.7047184705734253,
"eval_precision": 0.3828996282527881,
"eval_recall": 0.3190830235439901,
"eval_runtime": 0.395,
"eval_samples_per_second": 736.685,
"eval_steps_per_second": 93.668,
"step": 215
},
{
"epoch": 6.0,
"eval_accuracy": 0.6927927927927928,
"eval_f1": 0.4707024927160893,
"eval_loss": 1.2966375350952148,
"eval_precision": 0.4928813559322034,
"eval_recall": 0.45043370508054525,
"eval_runtime": 0.3855,
"eval_samples_per_second": 754.812,
"eval_steps_per_second": 95.973,
"step": 258
},
{
"epoch": 7.0,
"eval_accuracy": 0.7678678678678679,
"eval_f1": 0.5833596962986396,
"eval_loss": 1.0009989738464355,
"eval_precision": 0.5959922430510666,
"eval_recall": 0.5712515489467163,
"eval_runtime": 0.6988,
"eval_samples_per_second": 416.416,
"eval_steps_per_second": 52.946,
"step": 301
},
{
"epoch": 8.0,
"eval_accuracy": 0.8144144144144144,
"eval_f1": 0.6510903426791277,
"eval_loss": 0.8084700107574463,
"eval_precision": 0.6547619047619048,
"eval_recall": 0.6474597273853779,
"eval_runtime": 0.3918,
"eval_samples_per_second": 742.642,
"eval_steps_per_second": 94.425,
"step": 344
},
{
"epoch": 9.0,
"eval_accuracy": 0.8366366366366367,
"eval_f1": 0.6894850447116867,
"eval_loss": 0.7090229988098145,
"eval_precision": 0.6863106200122775,
"eval_recall": 0.6926889714993805,
"eval_runtime": 0.4014,
"eval_samples_per_second": 724.894,
"eval_steps_per_second": 92.169,
"step": 387
},
{
"epoch": 10.0,
"eval_accuracy": 0.8426426426426427,
"eval_f1": 0.7053378586855908,
"eval_loss": 0.6727187037467957,
"eval_precision": 0.702519975414874,
"eval_recall": 0.70817843866171,
"eval_runtime": 0.3949,
"eval_samples_per_second": 736.903,
"eval_steps_per_second": 93.696,
"step": 430
},
{
"epoch": 11.0,
"eval_accuracy": 0.8552552552552553,
"eval_f1": 0.7300613496932516,
"eval_loss": 0.6368208527565002,
"eval_precision": 0.7229647630619684,
"eval_recall": 0.7372986369268897,
"eval_runtime": 0.3928,
"eval_samples_per_second": 740.915,
"eval_steps_per_second": 94.206,
"step": 473
}
],
"logging_steps": 500,
"max_steps": 559,
"num_input_tokens_seen": 0,
"num_train_epochs": 13,
"save_steps": 500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": false
},
"attributes": {}
}
},
"total_flos": 0,
"train_batch_size": 32,
"trial_name": null,
"trial_params": {
"learning_rate": 3.979306441518639e-05,
"num_train_epochs": 13,
"per_device_train_batch_size": 32,
"warmup_steps": 286,
"weight_decay": 0.144636026358464
}
}