|
{ |
|
"best_metric": 0.4894636273384094, |
|
"best_model_checkpoint": "autotrain-sentiment-analyzer-reddit/checkpoint-691", |
|
"epoch": 1.0, |
|
"eval_steps": 500, |
|
"global_step": 691, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.05, |
|
"grad_norm": 10.44394588470459, |
|
"learning_rate": 8.173076923076923e-06, |
|
"loss": 0.3149, |
|
"step": 34 |
|
}, |
|
{ |
|
"epoch": 0.1, |
|
"grad_norm": 12.510290145874023, |
|
"learning_rate": 1.6346153846153847e-05, |
|
"loss": 0.3768, |
|
"step": 68 |
|
}, |
|
{ |
|
"epoch": 0.15, |
|
"grad_norm": 10.982364654541016, |
|
"learning_rate": 2.4519230769230768e-05, |
|
"loss": 0.3113, |
|
"step": 102 |
|
}, |
|
{ |
|
"epoch": 0.2, |
|
"grad_norm": 14.942676544189453, |
|
"learning_rate": 3.269230769230769e-05, |
|
"loss": 0.4581, |
|
"step": 136 |
|
}, |
|
{ |
|
"epoch": 0.25, |
|
"grad_norm": 15.461087226867676, |
|
"learning_rate": 4.0865384615384615e-05, |
|
"loss": 0.5979, |
|
"step": 170 |
|
}, |
|
{ |
|
"epoch": 0.3, |
|
"grad_norm": 51.596256256103516, |
|
"learning_rate": 4.9038461538461536e-05, |
|
"loss": 0.548, |
|
"step": 204 |
|
}, |
|
{ |
|
"epoch": 0.34, |
|
"grad_norm": 21.773590087890625, |
|
"learning_rate": 4.9195710455764076e-05, |
|
"loss": 0.5489, |
|
"step": 238 |
|
}, |
|
{ |
|
"epoch": 0.39, |
|
"grad_norm": 11.456461906433105, |
|
"learning_rate": 4.8284182305630025e-05, |
|
"loss": 0.6068, |
|
"step": 272 |
|
}, |
|
{ |
|
"epoch": 0.44, |
|
"grad_norm": 15.925763130187988, |
|
"learning_rate": 4.737265415549598e-05, |
|
"loss": 0.5067, |
|
"step": 306 |
|
}, |
|
{ |
|
"epoch": 0.49, |
|
"grad_norm": 15.808685302734375, |
|
"learning_rate": 4.6461126005361935e-05, |
|
"loss": 0.5312, |
|
"step": 340 |
|
}, |
|
{ |
|
"epoch": 0.54, |
|
"grad_norm": 53.43648910522461, |
|
"learning_rate": 4.554959785522788e-05, |
|
"loss": 0.4574, |
|
"step": 374 |
|
}, |
|
{ |
|
"epoch": 0.59, |
|
"grad_norm": 4.778822898864746, |
|
"learning_rate": 4.463806970509384e-05, |
|
"loss": 0.6492, |
|
"step": 408 |
|
}, |
|
{ |
|
"epoch": 0.64, |
|
"grad_norm": 9.234722137451172, |
|
"learning_rate": 4.3726541554959786e-05, |
|
"loss": 0.6046, |
|
"step": 442 |
|
}, |
|
{ |
|
"epoch": 0.69, |
|
"grad_norm": 8.603498458862305, |
|
"learning_rate": 4.281501340482574e-05, |
|
"loss": 0.5429, |
|
"step": 476 |
|
}, |
|
{ |
|
"epoch": 0.74, |
|
"grad_norm": 23.032926559448242, |
|
"learning_rate": 4.1903485254691696e-05, |
|
"loss": 0.5069, |
|
"step": 510 |
|
}, |
|
{ |
|
"epoch": 0.79, |
|
"grad_norm": 3.559593915939331, |
|
"learning_rate": 4.0991957104557644e-05, |
|
"loss": 0.5562, |
|
"step": 544 |
|
}, |
|
{ |
|
"epoch": 0.84, |
|
"grad_norm": 14.31966495513916, |
|
"learning_rate": 4.008042895442359e-05, |
|
"loss": 0.4328, |
|
"step": 578 |
|
}, |
|
{ |
|
"epoch": 0.89, |
|
"grad_norm": 16.031381607055664, |
|
"learning_rate": 3.916890080428954e-05, |
|
"loss": 0.5084, |
|
"step": 612 |
|
}, |
|
{ |
|
"epoch": 0.93, |
|
"grad_norm": 6.348935127258301, |
|
"learning_rate": 3.8257372654155496e-05, |
|
"loss": 0.5242, |
|
"step": 646 |
|
}, |
|
{ |
|
"epoch": 0.98, |
|
"grad_norm": 20.074831008911133, |
|
"learning_rate": 3.734584450402145e-05, |
|
"loss": 0.5023, |
|
"step": 680 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.8096960926193922, |
|
"eval_f1_macro": 0.7895193987806856, |
|
"eval_f1_micro": 0.8096960926193921, |
|
"eval_f1_weighted": 0.8045465713974906, |
|
"eval_loss": 0.4894636273384094, |
|
"eval_precision_macro": 0.814875613105015, |
|
"eval_precision_micro": 0.8096960926193922, |
|
"eval_precision_weighted": 0.8193628961020867, |
|
"eval_recall_macro": 0.7801134533159866, |
|
"eval_recall_micro": 0.8096960926193922, |
|
"eval_recall_weighted": 0.8096960926193922, |
|
"eval_runtime": 321.1321, |
|
"eval_samples_per_second": 4.304, |
|
"eval_steps_per_second": 0.271, |
|
"step": 691 |
|
} |
|
], |
|
"logging_steps": 34, |
|
"max_steps": 2073, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 3, |
|
"save_steps": 500, |
|
"total_flos": 363491186591232.0, |
|
"train_batch_size": 8, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|