|
{ |
|
"best_metric": 1.2208830118179321, |
|
"best_model_checkpoint": "facial_age_image_detection/checkpoint-3120", |
|
"epoch": 13.0, |
|
"eval_steps": 500, |
|
"global_step": 3120, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.5914377871175838, |
|
"eval_loss": 1.247507929801941, |
|
"eval_runtime": 105.4075, |
|
"eval_samples_per_second": 97.061, |
|
"eval_steps_per_second": 3.036, |
|
"step": 240 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.599159417456749, |
|
"eval_loss": 1.2387152910232544, |
|
"eval_runtime": 105.6722, |
|
"eval_samples_per_second": 96.818, |
|
"eval_steps_per_second": 3.028, |
|
"step": 480 |
|
}, |
|
{ |
|
"epoch": 2.08, |
|
"grad_norm": 16.16035270690918, |
|
"learning_rate": 6.112676056338028e-07, |
|
"loss": 0.8178, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.593979083178575, |
|
"eval_loss": 1.240220069885254, |
|
"eval_runtime": 106.9319, |
|
"eval_samples_per_second": 95.678, |
|
"eval_steps_per_second": 2.993, |
|
"step": 720 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.5982797380510214, |
|
"eval_loss": 1.2350324392318726, |
|
"eval_runtime": 105.7769, |
|
"eval_samples_per_second": 96.722, |
|
"eval_steps_per_second": 3.025, |
|
"step": 960 |
|
}, |
|
{ |
|
"epoch": 4.17, |
|
"grad_norm": 12.192686080932617, |
|
"learning_rate": 5.126760563380281e-07, |
|
"loss": 0.8038, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.5962271527709901, |
|
"eval_loss": 1.2324706315994263, |
|
"eval_runtime": 105.7457, |
|
"eval_samples_per_second": 96.751, |
|
"eval_steps_per_second": 3.026, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.5964226370833741, |
|
"eval_loss": 1.2318035364151, |
|
"eval_runtime": 105.5068, |
|
"eval_samples_per_second": 96.97, |
|
"eval_steps_per_second": 3.033, |
|
"step": 1440 |
|
}, |
|
{ |
|
"epoch": 6.25, |
|
"grad_norm": 12.383950233459473, |
|
"learning_rate": 4.140845070422535e-07, |
|
"loss": 0.7976, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_accuracy": 0.5976932851138697, |
|
"eval_loss": 1.2295589447021484, |
|
"eval_runtime": 106.676, |
|
"eval_samples_per_second": 95.907, |
|
"eval_steps_per_second": 3.0, |
|
"step": 1680 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.5974978008014857, |
|
"eval_loss": 1.2282449007034302, |
|
"eval_runtime": 105.9543, |
|
"eval_samples_per_second": 96.561, |
|
"eval_steps_per_second": 3.02, |
|
"step": 1920 |
|
}, |
|
{ |
|
"epoch": 8.33, |
|
"grad_norm": 12.568708419799805, |
|
"learning_rate": 3.1549295774647887e-07, |
|
"loss": 0.7888, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_accuracy": 0.6013097448929723, |
|
"eval_loss": 1.2256407737731934, |
|
"eval_runtime": 105.7499, |
|
"eval_samples_per_second": 96.747, |
|
"eval_steps_per_second": 3.026, |
|
"step": 2160 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_accuracy": 0.6001368390186688, |
|
"eval_loss": 1.2228951454162598, |
|
"eval_runtime": 106.2182, |
|
"eval_samples_per_second": 96.321, |
|
"eval_steps_per_second": 3.013, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 10.42, |
|
"grad_norm": 10.32869815826416, |
|
"learning_rate": 2.169014084507042e-07, |
|
"loss": 0.7785, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_accuracy": 0.5989639331443651, |
|
"eval_loss": 1.223892331123352, |
|
"eval_runtime": 105.6089, |
|
"eval_samples_per_second": 96.876, |
|
"eval_steps_per_second": 3.03, |
|
"step": 2640 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_accuracy": 0.599452643925325, |
|
"eval_loss": 1.2233675718307495, |
|
"eval_runtime": 105.2752, |
|
"eval_samples_per_second": 97.183, |
|
"eval_steps_per_second": 3.04, |
|
"step": 2880 |
|
}, |
|
{ |
|
"epoch": 12.5, |
|
"grad_norm": 10.018258094787598, |
|
"learning_rate": 1.1830985915492958e-07, |
|
"loss": 0.7763, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_accuracy": 0.5997458703939009, |
|
"eval_loss": 1.2208830118179321, |
|
"eval_runtime": 106.4062, |
|
"eval_samples_per_second": 96.15, |
|
"eval_steps_per_second": 3.007, |
|
"step": 3120 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 3600, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 15, |
|
"save_steps": 500, |
|
"total_flos": 1.5461399088864369e+19, |
|
"train_batch_size": 64, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|