|
{ |
|
"best_metric": 0.9426312247644684, |
|
"best_model_checkpoint": "cq-bert-model-repo/checkpoint-3042", |
|
"epoch": 1.0, |
|
"global_step": 3042, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.16436554898093358, |
|
"learning_rate": 1.671268902038133e-05, |
|
"loss": 0.2786270751953125, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 0.32873109796186717, |
|
"learning_rate": 1.3425378040762658e-05, |
|
"loss": 0.24325125122070312, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 0.4930966469428008, |
|
"learning_rate": 1.0138067061143987e-05, |
|
"loss": 0.21087245178222655, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 0.6574621959237343, |
|
"learning_rate": 6.850756081525313e-06, |
|
"loss": 0.19398100280761718, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 0.821827744904668, |
|
"learning_rate": 3.563445101906641e-06, |
|
"loss": 0.20912657165527343, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 0.9861932938856016, |
|
"learning_rate": 2.7613412228796843e-07, |
|
"loss": 0.19943014526367187, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.9426312247644684, |
|
"eval_f1": 0.8816383200277681, |
|
"eval_loss": 0.18397130072116852, |
|
"step": 3042 |
|
} |
|
], |
|
"max_steps": 3042, |
|
"num_train_epochs": 1, |
|
"total_flos": 1321583063589120, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|