{ "best_metric": 1.7871696949005127, "best_model_checkpoint": "/home3/s5431786/nlp-final-project/results/google-flan-t5-small-e-snli-generation-label_and_explanation-selected-b64/checkpoint-2000", "epoch": 2.096924510717614, "global_step": 18000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.23, "learning_rate": 0.0004659832246039143, "loss": 1.4692, "step": 2000 }, { "epoch": 0.23, "eval_accuracy": 0.8211745580166633, "eval_bertscore_f1": 0.9286575317503936, "eval_bleu": 0.38561860316652036, "eval_f1": 0.8203013643438366, "eval_loss": 1.7871696949005127, "eval_rouge1": 0.5787165816995035, "eval_rouge2": 0.3685417962966523, "eval_rougeL": 0.5239321926914862, "eval_rougeLsum": 0.5257244126819034, "eval_runtime": 153.5231, "eval_samples_per_second": 64.108, "eval_steps_per_second": 1.003, "step": 2000 }, { "epoch": 0.47, "learning_rate": 0.0009319664492078286, "loss": 1.2505, "step": 4000 }, { "epoch": 0.47, "eval_accuracy": 0.8262548262548263, "eval_bertscore_f1": 0.9307863125590817, "eval_bleu": 0.39038732251575425, "eval_f1": 0.8263713441477889, "eval_loss": 1.8808104991912842, "eval_rouge1": 0.5869703246365517, "eval_rouge2": 0.3748641547543645, "eval_rougeL": 0.5321311878885444, "eval_rougeLsum": 0.5336937989329478, "eval_runtime": 142.4217, "eval_samples_per_second": 69.105, "eval_steps_per_second": 1.081, "step": 4000 }, { "epoch": 0.7, "learning_rate": 0.0009790552803256977, "loss": 1.2003, "step": 6000 }, { "epoch": 0.7, "eval_accuracy": 0.8474903474903475, "eval_bertscore_f1": 0.9325015043987053, "eval_bleu": 0.40037514315917067, "eval_f1": 0.8480955479827984, "eval_loss": 1.8476512432098389, "eval_rouge1": 0.5984358503927201, "eval_rouge2": 0.39129615048248045, "eval_rougeL": 0.5452371782543385, "eval_rougeLsum": 0.5468731108541084, "eval_runtime": 144.1204, "eval_samples_per_second": 68.29, "eval_steps_per_second": 1.069, "step": 6000 }, { "epoch": 0.93, "learning_rate": 0.0009545298474518076, "loss": 1.1624, "step": 8000 }, { "epoch": 0.93, "eval_accuracy": 0.8598862019914651, "eval_bertscore_f1": 0.9334783476558407, "eval_bleu": 0.4024137500087889, "eval_f1": 0.8587313635433268, "eval_loss": 1.8243632316589355, "eval_rouge1": 0.602912531326099, "eval_rouge2": 0.39282903833995186, "eval_rougeL": 0.5440694412996867, "eval_rougeLsum": 0.5457091432223387, "eval_runtime": 142.2899, "eval_samples_per_second": 69.169, "eval_steps_per_second": 1.082, "step": 8000 }, { "epoch": 1.16, "learning_rate": 0.0009300044145779173, "loss": 1.1155, "step": 10000 }, { "epoch": 1.16, "eval_accuracy": 0.8695387116439748, "eval_bertscore_f1": 0.9330506412037212, "eval_bleu": 0.4022160428281426, "eval_f1": 0.868816289704145, "eval_loss": 1.8499114513397217, "eval_rouge1": 0.6082846765097942, "eval_rouge2": 0.4018899263767985, "eval_rougeL": 0.5518885347721499, "eval_rougeLsum": 0.5540212762276107, "eval_runtime": 150.2024, "eval_samples_per_second": 65.525, "eval_steps_per_second": 1.025, "step": 10000 }, { "epoch": 1.4, "learning_rate": 0.0009054789817040271, "loss": 1.0913, "step": 12000 }, { "epoch": 1.4, "eval_accuracy": 0.8691322901849218, "eval_bertscore_f1": 0.9338201101633912, "eval_bleu": 0.4012059786299585, "eval_f1": 0.8686267742768865, "eval_loss": 1.870266079902649, "eval_rouge1": 0.6062872493545299, "eval_rouge2": 0.39947246134905595, "eval_rougeL": 0.5500107773403655, "eval_rougeLsum": 0.5520562338476832, "eval_runtime": 151.4558, "eval_samples_per_second": 64.983, "eval_steps_per_second": 1.017, "step": 12000 }, { "epoch": 1.63, "learning_rate": 0.0008809535488301369, "loss": 1.0846, "step": 14000 }, { "epoch": 1.63, "eval_accuracy": 0.8750254013411908, "eval_bertscore_f1": 0.9330909099915095, "eval_bleu": 0.39881326611406565, "eval_f1": 0.875070205358106, "eval_loss": 1.832938551902771, "eval_rouge1": 0.6061633599628911, "eval_rouge2": 0.39694115489567416, "eval_rougeL": 0.550297473532996, "eval_rougeLsum": 0.5523036866159814, "eval_runtime": 154.4147, "eval_samples_per_second": 63.737, "eval_steps_per_second": 0.997, "step": 14000 }, { "epoch": 1.86, "learning_rate": 0.0008564281159562467, "loss": 1.0715, "step": 16000 }, { "epoch": 1.86, "eval_accuracy": 0.8753302174354806, "eval_bertscore_f1": 0.9349365859854345, "eval_bleu": 0.4116280426691763, "eval_f1": 0.8747037856852112, "eval_loss": 1.8349922895431519, "eval_rouge1": 0.6123794030106426, "eval_rouge2": 0.4063097561396414, "eval_rougeL": 0.5556039799857393, "eval_rougeLsum": 0.5576074204448696, "eval_runtime": 148.6901, "eval_samples_per_second": 66.191, "eval_steps_per_second": 1.036, "step": 16000 }, { "epoch": 2.1, "learning_rate": 0.0008319026830823564, "loss": 1.046, "step": 18000 }, { "epoch": 2.1, "eval_accuracy": 0.8814265393212761, "eval_bertscore_f1": 0.933173856183393, "eval_bleu": 0.4004651404942737, "eval_f1": 0.8813416551856146, "eval_loss": 1.8824745416641235, "eval_rouge1": 0.609629583349967, "eval_rouge2": 0.4060413051850321, "eval_rougeL": 0.5545586773158176, "eval_rougeLsum": 0.5564322531473485, "eval_runtime": 157.9661, "eval_samples_per_second": 62.304, "eval_steps_per_second": 0.975, "step": 18000 } ], "max_steps": 85840, "num_train_epochs": 10, "total_flos": 2.4686695794763776e+16, "trial_name": null, "trial_params": null }