r1_iterater / checkpoint-405 /trainer_state.json
owanr's picture
Upload 53 files
7e270f3
raw
history blame
4.3 kB
{
"best_metric": 0.13342921435832977,
"best_model_checkpoint": "/home/dongyeop/owan0002/revision-preference/code/preference_classifier/coedit_t5/output_r1_iter_wo_p/checkpoint-405",
"epoch": 15.0,
"global_step": 405,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_bleu": 0.0,
"eval_gen_len": 2.9953,
"eval_loss": 0.2727777659893036,
"eval_runtime": 10.2846,
"eval_samples_per_second": 164.517,
"eval_steps_per_second": 1.361,
"step": 27
},
{
"epoch": 2.0,
"eval_bleu": 0.0,
"eval_gen_len": 2.6791,
"eval_loss": 0.26499590277671814,
"eval_runtime": 9.934,
"eval_samples_per_second": 170.324,
"eval_steps_per_second": 1.409,
"step": 54
},
{
"epoch": 3.0,
"eval_bleu": 0.0,
"eval_gen_len": 2.1874,
"eval_loss": 0.2637251317501068,
"eval_runtime": 9.8272,
"eval_samples_per_second": 172.175,
"eval_steps_per_second": 1.425,
"step": 81
},
{
"epoch": 4.0,
"eval_bleu": 0.0,
"eval_gen_len": 2.2973,
"eval_loss": 0.24176451563835144,
"eval_runtime": 9.7849,
"eval_samples_per_second": 172.92,
"eval_steps_per_second": 1.431,
"step": 108
},
{
"epoch": 5.0,
"eval_bleu": 0.0,
"eval_gen_len": 2.2494,
"eval_loss": 0.2737601399421692,
"eval_runtime": 10.431,
"eval_samples_per_second": 162.209,
"eval_steps_per_second": 1.342,
"step": 135
},
{
"epoch": 6.0,
"eval_bleu": 0.0,
"eval_gen_len": 2.3812,
"eval_loss": 0.19136066734790802,
"eval_runtime": 9.9867,
"eval_samples_per_second": 169.425,
"eval_steps_per_second": 1.402,
"step": 162
},
{
"epoch": 7.0,
"eval_bleu": 0.0,
"eval_gen_len": 2.3983,
"eval_loss": 0.16406123340129852,
"eval_runtime": 9.9234,
"eval_samples_per_second": 170.505,
"eval_steps_per_second": 1.411,
"step": 189
},
{
"epoch": 8.0,
"eval_bleu": 0.0,
"eval_gen_len": 2.3995,
"eval_loss": 0.16948193311691284,
"eval_runtime": 10.0828,
"eval_samples_per_second": 167.811,
"eval_steps_per_second": 1.389,
"step": 216
},
{
"epoch": 9.0,
"eval_bleu": 0.0,
"eval_gen_len": 2.4167,
"eval_loss": 0.15213139355182648,
"eval_runtime": 9.7652,
"eval_samples_per_second": 173.268,
"eval_steps_per_second": 1.434,
"step": 243
},
{
"epoch": 10.0,
"eval_bleu": 0.0,
"eval_gen_len": 2.4167,
"eval_loss": 0.15690775215625763,
"eval_runtime": 9.8519,
"eval_samples_per_second": 171.743,
"eval_steps_per_second": 1.421,
"step": 270
},
{
"epoch": 11.0,
"eval_bleu": 0.0,
"eval_gen_len": 2.4137,
"eval_loss": 0.16145527362823486,
"eval_runtime": 9.771,
"eval_samples_per_second": 173.166,
"eval_steps_per_second": 1.433,
"step": 297
},
{
"epoch": 12.0,
"eval_bleu": 0.0,
"eval_gen_len": 2.4238,
"eval_loss": 0.1473228484392166,
"eval_runtime": 9.9975,
"eval_samples_per_second": 169.242,
"eval_steps_per_second": 1.4,
"step": 324
},
{
"epoch": 13.0,
"eval_bleu": 0.0,
"eval_gen_len": 2.4255,
"eval_loss": 0.13761219382286072,
"eval_runtime": 9.8987,
"eval_samples_per_second": 170.931,
"eval_steps_per_second": 1.414,
"step": 351
},
{
"epoch": 14.0,
"eval_bleu": 0.0,
"eval_gen_len": 2.419,
"eval_loss": 0.14949482679367065,
"eval_runtime": 10.1968,
"eval_samples_per_second": 165.935,
"eval_steps_per_second": 1.373,
"step": 378
},
{
"epoch": 15.0,
"eval_bleu": 0.0,
"eval_gen_len": 2.432,
"eval_loss": 0.13342921435832977,
"eval_runtime": 9.9102,
"eval_samples_per_second": 170.734,
"eval_steps_per_second": 1.413,
"step": 405
}
],
"max_steps": 540,
"num_train_epochs": 20,
"total_flos": 1.863941138457559e+17,
"trial_name": null,
"trial_params": null
}