|
{ |
|
"best_metric": 76.75840978593273, |
|
"best_model_checkpoint": "outputs/lora/t5-base/superglue-boolq/checkpoint-200", |
|
"epoch": 1.0, |
|
"global_step": 295, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.34, |
|
"eval_accuracy": 73.27217125382262, |
|
"eval_average_metrics": 73.27217125382262, |
|
"eval_loss": 0.22932085394859314, |
|
"eval_runtime": 6.9751, |
|
"eval_samples_per_second": 234.404, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 0.68, |
|
"eval_accuracy": 76.75840978593273, |
|
"eval_average_metrics": 76.75840978593273, |
|
"eval_loss": 0.20979416370391846, |
|
"eval_runtime": 6.9617, |
|
"eval_samples_per_second": 234.856, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"step": 295, |
|
"total_flos": 2875122627969024.0, |
|
"train_loss": 0.6385218733448094, |
|
"train_runtime": 76.4806, |
|
"train_samples_per_second": 123.26, |
|
"train_steps_per_second": 3.857 |
|
} |
|
], |
|
"max_steps": 295, |
|
"num_train_epochs": 1, |
|
"total_flos": 2875122627969024.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|