|
{ |
|
"best_metric": 0.26493218541145325, |
|
"best_model_checkpoint": "./outputs/google/flan-t5-small_02112024_16_44_29/checkpoint-10275", |
|
"epoch": 8.0, |
|
"global_step": 16440, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.24, |
|
"learning_rate": 4.9513381995133826e-05, |
|
"loss": 0.6278, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 0.49, |
|
"learning_rate": 4.9026763990267643e-05, |
|
"loss": 0.4278, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 0.73, |
|
"learning_rate": 4.854014598540147e-05, |
|
"loss": 0.3906, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 0.97, |
|
"learning_rate": 4.8053527980535284e-05, |
|
"loss": 0.3726, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_f1": 0.3402346555086388, |
|
"eval_loss": 0.31867411732673645, |
|
"eval_precision": 0.3932500949967925, |
|
"eval_recall": 0.34399184859663345, |
|
"eval_runtime": 24.9698, |
|
"eval_samples_per_second": 36.564, |
|
"eval_steps_per_second": 4.606, |
|
"step": 2055 |
|
}, |
|
{ |
|
"epoch": 1.22, |
|
"learning_rate": 4.75669099756691e-05, |
|
"loss": 0.3505, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 1.46, |
|
"learning_rate": 4.708029197080292e-05, |
|
"loss": 0.3385, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 1.7, |
|
"learning_rate": 4.659367396593674e-05, |
|
"loss": 0.3299, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 1.95, |
|
"learning_rate": 4.610705596107056e-05, |
|
"loss": 0.316, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_f1": 0.44100378584011557, |
|
"eval_loss": 0.29325029253959656, |
|
"eval_precision": 0.5725633373653386, |
|
"eval_recall": 0.41354031034704636, |
|
"eval_runtime": 30.7804, |
|
"eval_samples_per_second": 29.662, |
|
"eval_steps_per_second": 3.736, |
|
"step": 4110 |
|
}, |
|
{ |
|
"epoch": 2.19, |
|
"learning_rate": 4.5620437956204383e-05, |
|
"loss": 0.3077, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 2.43, |
|
"learning_rate": 4.51338199513382e-05, |
|
"loss": 0.2965, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 2.68, |
|
"learning_rate": 4.4647201946472024e-05, |
|
"loss": 0.3038, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 2.92, |
|
"learning_rate": 4.416058394160584e-05, |
|
"loss": 0.2948, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_f1": 0.49142134605574894, |
|
"eval_loss": 0.27041032910346985, |
|
"eval_precision": 0.5482614717698139, |
|
"eval_recall": 0.4672472050791782, |
|
"eval_runtime": 32.1755, |
|
"eval_samples_per_second": 28.376, |
|
"eval_steps_per_second": 3.574, |
|
"step": 6165 |
|
}, |
|
{ |
|
"epoch": 3.16, |
|
"learning_rate": 4.3673965936739665e-05, |
|
"loss": 0.286, |
|
"step": 6500 |
|
}, |
|
{ |
|
"epoch": 3.41, |
|
"learning_rate": 4.318734793187348e-05, |
|
"loss": 0.2794, |
|
"step": 7000 |
|
}, |
|
{ |
|
"epoch": 3.65, |
|
"learning_rate": 4.27007299270073e-05, |
|
"loss": 0.2684, |
|
"step": 7500 |
|
}, |
|
{ |
|
"epoch": 3.89, |
|
"learning_rate": 4.221411192214112e-05, |
|
"loss": 0.2759, |
|
"step": 8000 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_f1": 0.5152580961177389, |
|
"eval_loss": 0.2656283974647522, |
|
"eval_precision": 0.561024311684815, |
|
"eval_recall": 0.4928332834870085, |
|
"eval_runtime": 32.9996, |
|
"eval_samples_per_second": 27.667, |
|
"eval_steps_per_second": 3.485, |
|
"step": 8220 |
|
}, |
|
{ |
|
"epoch": 4.14, |
|
"learning_rate": 4.172749391727494e-05, |
|
"loss": 0.2628, |
|
"step": 8500 |
|
}, |
|
{ |
|
"epoch": 4.38, |
|
"learning_rate": 4.124087591240876e-05, |
|
"loss": 0.2583, |
|
"step": 9000 |
|
}, |
|
{ |
|
"epoch": 4.62, |
|
"learning_rate": 4.075425790754258e-05, |
|
"loss": 0.2567, |
|
"step": 9500 |
|
}, |
|
{ |
|
"epoch": 4.87, |
|
"learning_rate": 4.02676399026764e-05, |
|
"loss": 0.2563, |
|
"step": 10000 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_f1": 0.5254077620147211, |
|
"eval_loss": 0.26493218541145325, |
|
"eval_precision": 0.5869446986868645, |
|
"eval_recall": 0.49228704075934504, |
|
"eval_runtime": 31.0527, |
|
"eval_samples_per_second": 29.402, |
|
"eval_steps_per_second": 3.703, |
|
"step": 10275 |
|
}, |
|
{ |
|
"epoch": 5.11, |
|
"learning_rate": 3.978102189781022e-05, |
|
"loss": 0.2553, |
|
"step": 10500 |
|
}, |
|
{ |
|
"epoch": 5.35, |
|
"learning_rate": 3.929440389294404e-05, |
|
"loss": 0.2482, |
|
"step": 11000 |
|
}, |
|
{ |
|
"epoch": 5.6, |
|
"learning_rate": 3.8807785888077864e-05, |
|
"loss": 0.2412, |
|
"step": 11500 |
|
}, |
|
{ |
|
"epoch": 5.84, |
|
"learning_rate": 3.832116788321168e-05, |
|
"loss": 0.2376, |
|
"step": 12000 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_f1": 0.5293819723661756, |
|
"eval_loss": 0.2736237049102783, |
|
"eval_precision": 0.5698156189027613, |
|
"eval_recall": 0.5158894882436182, |
|
"eval_runtime": 33.8492, |
|
"eval_samples_per_second": 26.973, |
|
"eval_steps_per_second": 3.397, |
|
"step": 12330 |
|
}, |
|
{ |
|
"epoch": 6.08, |
|
"learning_rate": 3.78345498783455e-05, |
|
"loss": 0.234, |
|
"step": 12500 |
|
}, |
|
{ |
|
"epoch": 6.33, |
|
"learning_rate": 3.734793187347932e-05, |
|
"loss": 0.2259, |
|
"step": 13000 |
|
}, |
|
{ |
|
"epoch": 6.57, |
|
"learning_rate": 3.686131386861314e-05, |
|
"loss": 0.2312, |
|
"step": 13500 |
|
}, |
|
{ |
|
"epoch": 6.81, |
|
"learning_rate": 3.637469586374696e-05, |
|
"loss": 0.2306, |
|
"step": 14000 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_f1": 0.5377831918627073, |
|
"eval_loss": 0.27052244544029236, |
|
"eval_precision": 0.5662163692648797, |
|
"eval_recall": 0.5227524158025398, |
|
"eval_runtime": 33.9607, |
|
"eval_samples_per_second": 26.884, |
|
"eval_steps_per_second": 3.386, |
|
"step": 14385 |
|
}, |
|
{ |
|
"epoch": 7.06, |
|
"learning_rate": 3.588807785888078e-05, |
|
"loss": 0.2355, |
|
"step": 14500 |
|
}, |
|
{ |
|
"epoch": 7.3, |
|
"learning_rate": 3.5401459854014604e-05, |
|
"loss": 0.2126, |
|
"step": 15000 |
|
}, |
|
{ |
|
"epoch": 7.54, |
|
"learning_rate": 3.491484184914842e-05, |
|
"loss": 0.2236, |
|
"step": 15500 |
|
}, |
|
{ |
|
"epoch": 7.79, |
|
"learning_rate": 3.4428223844282245e-05, |
|
"loss": 0.2186, |
|
"step": 16000 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_f1": 0.5354115040070326, |
|
"eval_loss": 0.28732189536094666, |
|
"eval_precision": 0.5835637777117146, |
|
"eval_recall": 0.5252217659081543, |
|
"eval_runtime": 35.8593, |
|
"eval_samples_per_second": 25.461, |
|
"eval_steps_per_second": 3.207, |
|
"step": 16440 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"step": 16440, |
|
"total_flos": 5028888562409472.0, |
|
"train_loss": 0.288517827129132, |
|
"train_runtime": 1921.0513, |
|
"train_samples_per_second": 106.934, |
|
"train_steps_per_second": 26.743 |
|
} |
|
], |
|
"max_steps": 51375, |
|
"num_train_epochs": 25, |
|
"total_flos": 5028888562409472.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|