|
{ |
|
"best_metric": 2.3307483196258545, |
|
"best_model_checkpoint": "add_BERT_no_pretrain_stsb/checkpoint-270", |
|
"epoch": 11.0, |
|
"global_step": 495, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"learning_rate": 3.9200000000000004e-05, |
|
"loss": 2.4937, |
|
"step": 45 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_combined_score": 0.03484396955490256, |
|
"eval_loss": 2.637270927429199, |
|
"eval_pearson": 0.041015241553137224, |
|
"eval_runtime": 2.7912, |
|
"eval_samples_per_second": 537.4, |
|
"eval_spearmanr": 0.028672697556667882, |
|
"eval_steps_per_second": 4.299, |
|
"step": 45 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"learning_rate": 3.8400000000000005e-05, |
|
"loss": 2.22, |
|
"step": 90 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_combined_score": 0.06629060639069365, |
|
"eval_loss": 2.4288177490234375, |
|
"eval_pearson": 0.07402195261812716, |
|
"eval_runtime": 2.8138, |
|
"eval_samples_per_second": 533.087, |
|
"eval_spearmanr": 0.058559260163260116, |
|
"eval_steps_per_second": 4.265, |
|
"step": 90 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"learning_rate": 3.76e-05, |
|
"loss": 2.1554, |
|
"step": 135 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_combined_score": 0.055355126341372324, |
|
"eval_loss": 2.3868918418884277, |
|
"eval_pearson": 0.06089199058890605, |
|
"eval_runtime": 2.8061, |
|
"eval_samples_per_second": 534.558, |
|
"eval_spearmanr": 0.04981826209383859, |
|
"eval_steps_per_second": 4.276, |
|
"step": 135 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"learning_rate": 3.680000000000001e-05, |
|
"loss": 2.0556, |
|
"step": 180 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_combined_score": 0.07587737081449714, |
|
"eval_loss": 2.5739591121673584, |
|
"eval_pearson": 0.0800115043320288, |
|
"eval_runtime": 2.8092, |
|
"eval_samples_per_second": 533.959, |
|
"eval_spearmanr": 0.07174323729696545, |
|
"eval_steps_per_second": 4.272, |
|
"step": 180 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"learning_rate": 3.6e-05, |
|
"loss": 2.0221, |
|
"step": 225 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_combined_score": 0.07517103861970047, |
|
"eval_loss": 2.465646266937256, |
|
"eval_pearson": 0.08491360492393328, |
|
"eval_runtime": 2.8092, |
|
"eval_samples_per_second": 533.96, |
|
"eval_spearmanr": 0.06542847231546765, |
|
"eval_steps_per_second": 4.272, |
|
"step": 225 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"learning_rate": 3.52e-05, |
|
"loss": 2.0403, |
|
"step": 270 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_combined_score": 0.06472344315426198, |
|
"eval_loss": 2.3307483196258545, |
|
"eval_pearson": 0.07194759835590063, |
|
"eval_runtime": 2.8052, |
|
"eval_samples_per_second": 534.716, |
|
"eval_spearmanr": 0.05749928795262334, |
|
"eval_steps_per_second": 4.278, |
|
"step": 270 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"learning_rate": 3.44e-05, |
|
"loss": 2.1732, |
|
"step": 315 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_combined_score": 0.06413160396195583, |
|
"eval_loss": 2.5174152851104736, |
|
"eval_pearson": 0.06991174129088629, |
|
"eval_runtime": 2.8054, |
|
"eval_samples_per_second": 534.68, |
|
"eval_spearmanr": 0.058351466633025366, |
|
"eval_steps_per_second": 4.277, |
|
"step": 315 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"learning_rate": 3.3600000000000004e-05, |
|
"loss": 2.0399, |
|
"step": 360 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_combined_score": 0.06615269419943948, |
|
"eval_loss": 2.5648128986358643, |
|
"eval_pearson": 0.07178384296600182, |
|
"eval_runtime": 2.8071, |
|
"eval_samples_per_second": 534.35, |
|
"eval_spearmanr": 0.06052154543287713, |
|
"eval_steps_per_second": 4.275, |
|
"step": 360 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"learning_rate": 3.28e-05, |
|
"loss": 2.0765, |
|
"step": 405 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_combined_score": 0.05558546651483845, |
|
"eval_loss": 2.3373327255249023, |
|
"eval_pearson": 0.06209781802846023, |
|
"eval_runtime": 2.8097, |
|
"eval_samples_per_second": 533.863, |
|
"eval_spearmanr": 0.04907311500121666, |
|
"eval_steps_per_second": 4.271, |
|
"step": 405 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"learning_rate": 3.2000000000000005e-05, |
|
"loss": 2.0538, |
|
"step": 450 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_combined_score": 0.04471248717433318, |
|
"eval_loss": 2.6402227878570557, |
|
"eval_pearson": 0.04634878343613905, |
|
"eval_runtime": 2.8018, |
|
"eval_samples_per_second": 535.361, |
|
"eval_spearmanr": 0.04307619091252732, |
|
"eval_steps_per_second": 4.283, |
|
"step": 450 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"learning_rate": 3.1200000000000006e-05, |
|
"loss": 2.0147, |
|
"step": 495 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_combined_score": 0.05055556341697049, |
|
"eval_loss": 2.4726502895355225, |
|
"eval_pearson": 0.05397516518599763, |
|
"eval_runtime": 2.8161, |
|
"eval_samples_per_second": 532.645, |
|
"eval_spearmanr": 0.04713596164794335, |
|
"eval_steps_per_second": 4.261, |
|
"step": 495 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"step": 495, |
|
"total_flos": 9031970478620672.0, |
|
"train_loss": 2.1222905785146384, |
|
"train_runtime": 469.3728, |
|
"train_samples_per_second": 612.413, |
|
"train_steps_per_second": 4.794 |
|
} |
|
], |
|
"max_steps": 2250, |
|
"num_train_epochs": 50, |
|
"total_flos": 9031970478620672.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|