{ "best_metric": 62.27396685546466, "best_model_checkpoint": "outputs/bitfit/t5-base/superglue-multirc/checkpoint-2400", "epoch": 3.0, "global_step": 2556, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.23, "eval_average_metrics": 58.45389071733288, "eval_em": 49.88986784140969, "eval_f1": 67.01791359325607, "eval_loss": 0.21679049730300903, "eval_runtime": 23.0565, "eval_samples_per_second": 105.133, "step": 200 }, { "epoch": 0.47, "eval_average_metrics": 61.27063054507724, "eval_em": 51.98237885462555, "eval_f1": 70.55888223552893, "eval_loss": 0.2198609709739685, "eval_runtime": 23.4946, "eval_samples_per_second": 103.173, "step": 400 }, { "epoch": 0.59, "learning_rate": 0.0002413145539906103, "loss": 0.2582, "step": 500 }, { "epoch": 0.7, "eval_average_metrics": 59.16978670550705, "eval_em": 49.779735682819386, "eval_f1": 68.55983772819472, "eval_loss": 0.20913197100162506, "eval_runtime": 23.7161, "eval_samples_per_second": 102.209, "step": 600 }, { "epoch": 0.94, "eval_average_metrics": 61.270356888999785, "eval_em": 51.43171806167401, "eval_f1": 71.10899571632555, "eval_loss": 0.20762182772159576, "eval_runtime": 26.3745, "eval_samples_per_second": 91.907, "step": 800 }, { "epoch": 1.17, "learning_rate": 0.00018262910798122063, "loss": 0.1865, "step": 1000 }, { "epoch": 1.17, "eval_average_metrics": 61.45286279488806, "eval_em": 51.87224669603524, "eval_f1": 71.03347889374089, "eval_loss": 0.2089201658964157, "eval_runtime": 24.8833, "eval_samples_per_second": 97.415, "step": 1000 }, { "epoch": 1.41, "eval_average_metrics": 61.79826184816632, "eval_em": 52.202643171806166, "eval_f1": 71.39388052452648, "eval_loss": 0.20319344103336334, "eval_runtime": 25.4876, "eval_samples_per_second": 95.105, "step": 1200 }, { "epoch": 1.64, "eval_average_metrics": 62.13396621755072, "eval_em": 52.53303964757709, "eval_f1": 71.73489278752436, "eval_loss": 0.21759574115276337, "eval_runtime": 26.3526, "eval_samples_per_second": 91.983, "step": 1400 }, { "epoch": 1.76, "learning_rate": 0.00012394366197183098, "loss": 0.1745, "step": 1500 }, { "epoch": 1.88, "eval_average_metrics": 62.159955413411296, "eval_em": 52.09251101321586, "eval_f1": 72.22739981360672, "eval_loss": 0.21236789226531982, "eval_runtime": 22.8791, "eval_samples_per_second": 105.948, "step": 1600 }, { "epoch": 2.11, "eval_average_metrics": 61.48864179183695, "eval_em": 51.651982378854626, "eval_f1": 71.32530120481927, "eval_loss": 0.2192794233560562, "eval_runtime": 23.8863, "eval_samples_per_second": 101.481, "step": 1800 }, { "epoch": 2.35, "learning_rate": 6.525821596244131e-05, "loss": 0.1692, "step": 2000 }, { "epoch": 2.35, "eval_average_metrics": 62.06655934464116, "eval_em": 52.75330396475771, "eval_f1": 71.37981472452462, "eval_loss": 0.2168177217245102, "eval_runtime": 23.5217, "eval_samples_per_second": 103.054, "step": 2000 }, { "epoch": 2.58, "eval_average_metrics": 62.263646102553764, "eval_em": 52.31277533039648, "eval_f1": 72.21451687471105, "eval_loss": 0.22297202050685883, "eval_runtime": 22.3978, "eval_samples_per_second": 108.225, "step": 2200 }, { "epoch": 2.82, "eval_average_metrics": 62.27396685546466, "eval_em": 52.6431718061674, "eval_f1": 71.90476190476191, "eval_loss": 0.22205480933189392, "eval_runtime": 23.6577, "eval_samples_per_second": 102.461, "step": 2400 }, { "epoch": 2.93, "learning_rate": 6.5727699530516425e-06, "loss": 0.1589, "step": 2500 }, { "epoch": 3.0, "step": 2556, "total_flos": 2.511166406964019e+16, "train_loss": 0.18877839930180654, "train_runtime": 1478.3404, "train_samples_per_second": 55.284, "train_steps_per_second": 1.729 } ], "max_steps": 2556, "num_train_epochs": 3, "total_flos": 2.511166406964019e+16, "trial_name": null, "trial_params": null }