|
{ |
|
"best_metric": 0.17856432497501373, |
|
"best_model_checkpoint": "bioformer8L_caption_reference_RTX6000/checkpoint-1230", |
|
"epoch": 2.0, |
|
"eval_steps": 500, |
|
"global_step": 2460, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.4065040650406504, |
|
"grad_norm": 8.241156578063965, |
|
"learning_rate": 2.75609756097561e-05, |
|
"loss": 0.2277, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 0.8130081300813008, |
|
"grad_norm": 2.205291986465454, |
|
"learning_rate": 2.5121951219512197e-05, |
|
"loss": 0.177, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.9276147633166343, |
|
"eval_f1": 0.9222332155896071, |
|
"eval_f1_medical": 0.9426906265177271, |
|
"eval_f1_non_medical": 0.9017758046614872, |
|
"eval_loss": 0.17856432497501373, |
|
"eval_precision": 0.9277090451077986, |
|
"eval_recall": 0.9177374028102576, |
|
"eval_runtime": 37.413, |
|
"eval_samples_per_second": 261.433, |
|
"eval_steps_per_second": 8.179, |
|
"step": 1230 |
|
}, |
|
{ |
|
"epoch": 1.2195121951219512, |
|
"grad_norm": 3.5154032707214355, |
|
"learning_rate": 2.2682926829268295e-05, |
|
"loss": 0.1466, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 1.6260162601626016, |
|
"grad_norm": 3.8458199501037598, |
|
"learning_rate": 2.024390243902439e-05, |
|
"loss": 0.1232, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.929352826909314, |
|
"eval_f1": 0.9248187483559904, |
|
"eval_f1_medical": 0.9432816219322006, |
|
"eval_f1_non_medical": 0.9063558747797804, |
|
"eval_loss": 0.20747286081314087, |
|
"eval_precision": 0.9255804539078865, |
|
"eval_recall": 0.9240820913256004, |
|
"eval_runtime": 37.4622, |
|
"eval_samples_per_second": 261.09, |
|
"eval_steps_per_second": 8.168, |
|
"step": 2460 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 6150, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 5, |
|
"save_steps": 500, |
|
"stateful_callbacks": { |
|
"TrainerControl": { |
|
"args": { |
|
"should_epoch_stop": false, |
|
"should_evaluate": false, |
|
"should_log": false, |
|
"should_save": true, |
|
"should_training_stop": false |
|
}, |
|
"attributes": {} |
|
} |
|
}, |
|
"total_flos": 6162603809728128.0, |
|
"train_batch_size": 32, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|