|
{ |
|
"best_metric": 1.528552770614624, |
|
"best_model_checkpoint": "/home2/s5431786/jb-internship-repr/results/Salesforce-codet5-small-java-small-selected-wo-tokens/checkpoint-2000", |
|
"epoch": 2.7743098904147594, |
|
"global_step": 20000, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.28, |
|
"learning_rate": 9.94363646983237e-05, |
|
"loss": 2.1009, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 0.28, |
|
"eval_exact_match": 0.31785774198959904, |
|
"eval_loss": 1.528552770614624, |
|
"eval_rouge1": 0.5232290073169683, |
|
"eval_rouge2": 0.24795642157242634, |
|
"eval_rougeL": 0.5233033679411545, |
|
"eval_runtime": 163.446, |
|
"eval_samples_per_second": 145.883, |
|
"eval_steps_per_second": 1.523, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 0.55, |
|
"learning_rate": 9.359558437007184e-05, |
|
"loss": 1.3098, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 0.55, |
|
"eval_exact_match": 0.29667840966280823, |
|
"eval_loss": 1.5582195520401, |
|
"eval_rouge1": 0.499918373090859, |
|
"eval_rouge2": 0.22982882883486827, |
|
"eval_rougeL": 0.49974542584946463, |
|
"eval_runtime": 169.5108, |
|
"eval_samples_per_second": 140.664, |
|
"eval_steps_per_second": 1.469, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 0.83, |
|
"learning_rate": 8.775480404182e-05, |
|
"loss": 1.1968, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 0.83, |
|
"eval_exact_match": 0.321003187384667, |
|
"eval_loss": 1.551592469215393, |
|
"eval_rouge1": 0.5260578932396776, |
|
"eval_rouge2": 0.25462429236963685, |
|
"eval_rougeL": 0.5257669098334219, |
|
"eval_runtime": 163.9432, |
|
"eval_samples_per_second": 145.441, |
|
"eval_steps_per_second": 1.519, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 1.11, |
|
"learning_rate": 8.191402371356814e-05, |
|
"loss": 1.1145, |
|
"step": 8000 |
|
}, |
|
{ |
|
"epoch": 1.11, |
|
"eval_exact_match": 0.31735447072638817, |
|
"eval_loss": 1.572016954421997, |
|
"eval_rouge1": 0.5094747473558878, |
|
"eval_rouge2": 0.2465356707776194, |
|
"eval_rougeL": 0.5091592701411148, |
|
"eval_runtime": 163.415, |
|
"eval_samples_per_second": 145.911, |
|
"eval_steps_per_second": 1.524, |
|
"step": 8000 |
|
}, |
|
{ |
|
"epoch": 1.39, |
|
"learning_rate": 7.607908416564453e-05, |
|
"loss": 1.0477, |
|
"step": 10000 |
|
}, |
|
{ |
|
"epoch": 1.39, |
|
"eval_exact_match": 0.33387854386847843, |
|
"eval_loss": 1.5617761611938477, |
|
"eval_rouge1": 0.5280223151246797, |
|
"eval_rouge2": 0.2615585801921996, |
|
"eval_rougeL": 0.5274734242132477, |
|
"eval_runtime": 165.805, |
|
"eval_samples_per_second": 143.807, |
|
"eval_steps_per_second": 1.502, |
|
"step": 10000 |
|
}, |
|
{ |
|
"epoch": 1.66, |
|
"learning_rate": 7.023830383739268e-05, |
|
"loss": 1.0219, |
|
"step": 12000 |
|
}, |
|
{ |
|
"epoch": 1.66, |
|
"eval_exact_match": 0.32372924006039255, |
|
"eval_loss": 1.5944069623947144, |
|
"eval_rouge1": 0.5133412941637794, |
|
"eval_rouge2": 0.24304376784560536, |
|
"eval_rougeL": 0.5128045498112566, |
|
"eval_runtime": 164.4858, |
|
"eval_samples_per_second": 144.961, |
|
"eval_steps_per_second": 1.514, |
|
"step": 12000 |
|
}, |
|
{ |
|
"epoch": 1.94, |
|
"learning_rate": 6.440044389930495e-05, |
|
"loss": 1.0027, |
|
"step": 14000 |
|
}, |
|
{ |
|
"epoch": 1.94, |
|
"eval_exact_match": 0.3238550578761953, |
|
"eval_loss": 1.5750421285629272, |
|
"eval_rouge1": 0.5206336041126007, |
|
"eval_rouge2": 0.24470678869584325, |
|
"eval_rougeL": 0.5202257107678057, |
|
"eval_runtime": 161.6161, |
|
"eval_samples_per_second": 147.535, |
|
"eval_steps_per_second": 1.541, |
|
"step": 14000 |
|
}, |
|
{ |
|
"epoch": 2.22, |
|
"learning_rate": 5.856258396121722e-05, |
|
"loss": 0.9263, |
|
"step": 16000 |
|
}, |
|
{ |
|
"epoch": 2.22, |
|
"eval_exact_match": 0.33018788793826537, |
|
"eval_loss": 1.5776818990707397, |
|
"eval_rouge1": 0.5179861628783158, |
|
"eval_rouge2": 0.24451742588852704, |
|
"eval_rougeL": 0.5176686731279507, |
|
"eval_runtime": 165.4256, |
|
"eval_samples_per_second": 144.137, |
|
"eval_steps_per_second": 1.505, |
|
"step": 16000 |
|
}, |
|
{ |
|
"epoch": 2.5, |
|
"learning_rate": 5.272180363296537e-05, |
|
"loss": 0.9054, |
|
"step": 18000 |
|
}, |
|
{ |
|
"epoch": 2.5, |
|
"eval_exact_match": 0.3242325113236034, |
|
"eval_loss": 1.6233525276184082, |
|
"eval_rouge1": 0.5204582779286969, |
|
"eval_rouge2": 0.24576987021627228, |
|
"eval_rougeL": 0.520011433933161, |
|
"eval_runtime": 164.3556, |
|
"eval_samples_per_second": 145.076, |
|
"eval_steps_per_second": 1.515, |
|
"step": 18000 |
|
}, |
|
{ |
|
"epoch": 2.77, |
|
"learning_rate": 4.688102330471351e-05, |
|
"loss": 0.8921, |
|
"step": 20000 |
|
}, |
|
{ |
|
"epoch": 2.77, |
|
"eval_exact_match": 0.3301459486663312, |
|
"eval_loss": 1.5790328979492188, |
|
"eval_rouge1": 0.5328535938777187, |
|
"eval_rouge2": 0.2582260548148201, |
|
"eval_rougeL": 0.5322687769671152, |
|
"eval_runtime": 166.1094, |
|
"eval_samples_per_second": 143.544, |
|
"eval_steps_per_second": 1.499, |
|
"step": 20000 |
|
} |
|
], |
|
"max_steps": 36045, |
|
"num_train_epochs": 5, |
|
"total_flos": 2.5983189730197504e+17, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|