{ "best_metric": 0.9174279061436503, "best_model_checkpoint": "DynamicFreightPackinglist_Jun24/checkpoint-3000", "epoch": 2.657218777679362, "global_step": 3000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.09, "eval_accuracy": 0.8657594809519709, "eval_f1": 0.294485668558126, "eval_loss": 0.6096277832984924, "eval_precision": 0.3776119402985075, "eval_recall": 0.24135463868352014, "eval_runtime": 37.7163, "eval_samples_per_second": 10.181, "eval_steps_per_second": 5.091, "step": 100 }, { "epoch": 0.18, "eval_accuracy": 0.9066833175437086, "eval_f1": 0.42788946412963086, "eval_loss": 0.466012567281723, "eval_precision": 0.49051950053954063, "eval_recall": 0.37944192702122587, "eval_runtime": 37.9564, "eval_samples_per_second": 10.117, "eval_steps_per_second": 5.058, "step": 200 }, { "epoch": 0.27, "eval_accuracy": 0.9190566416903511, "eval_f1": 0.45627078849540204, "eval_loss": 0.3901040554046631, "eval_precision": 0.5035267021736001, "eval_recall": 0.4171237777247794, "eval_runtime": 37.9745, "eval_samples_per_second": 10.112, "eval_steps_per_second": 5.056, "step": 300 }, { "epoch": 0.35, "eval_accuracy": 0.9322768638934343, "eval_f1": 0.5466886577010912, "eval_loss": 0.3380320370197296, "eval_precision": 0.5840336134453782, "eval_recall": 0.5138325781063677, "eval_runtime": 37.9718, "eval_samples_per_second": 10.113, "eval_steps_per_second": 5.056, "step": 400 }, { "epoch": 0.44, "learning_rate": 8.333333333333334e-06, "loss": 0.4269, "step": 500 }, { "epoch": 0.44, "eval_accuracy": 0.9360233112278586, "eval_f1": 0.5705544933078396, "eval_loss": 0.2771761417388916, "eval_precision": 0.6128148959474261, "eval_recall": 0.5337467207250179, "eval_runtime": 38.0237, "eval_samples_per_second": 10.099, "eval_steps_per_second": 5.049, "step": 500 }, { "epoch": 0.53, "eval_accuracy": 0.9542962133608934, "eval_f1": 0.6891029650944577, "eval_loss": 0.2250644564628601, "eval_precision": 0.7247368421052631, "eval_recall": 0.6568089673264965, "eval_runtime": 37.8718, "eval_samples_per_second": 10.139, "eval_steps_per_second": 5.07, "step": 600 }, { "epoch": 0.62, "eval_accuracy": 0.9598082278299314, "eval_f1": 0.730193368491241, "eval_loss": 0.2054944485425949, "eval_precision": 0.7425718160522747, "eval_recall": 0.7182208442642499, "eval_runtime": 37.7502, "eval_samples_per_second": 10.172, "eval_steps_per_second": 5.086, "step": 700 }, { "epoch": 0.71, "eval_accuracy": 0.9699853587115667, "eval_f1": 0.7988021024324654, "eval_loss": 0.16418181359767914, "eval_precision": 0.819332998996991, "eval_recall": 0.7792749821130456, "eval_runtime": 37.9005, "eval_samples_per_second": 10.132, "eval_steps_per_second": 5.066, "step": 800 }, { "epoch": 0.8, "eval_accuracy": 0.9699710045072202, "eval_f1": 0.7916867469879518, "eval_loss": 0.1568066030740738, "eval_precision": 0.7999756513270027, "eval_recall": 0.783567851180539, "eval_runtime": 37.6869, "eval_samples_per_second": 10.189, "eval_steps_per_second": 5.095, "step": 900 }, { "epoch": 0.89, "learning_rate": 6.666666666666667e-06, "loss": 0.2059, "step": 1000 }, { "epoch": 0.89, "eval_accuracy": 0.9699135876898344, "eval_f1": 0.8125, "eval_loss": 0.15771125257015228, "eval_precision": 0.828826593897296, "eval_recall": 0.7968041974719771, "eval_runtime": 37.8726, "eval_samples_per_second": 10.139, "eval_steps_per_second": 5.07, "step": 1000 }, { "epoch": 0.97, "eval_accuracy": 0.9756839778371085, "eval_f1": 0.844042306046341, "eval_loss": 0.1233619749546051, "eval_precision": 0.8660143018441852, "eval_recall": 0.8231576436918674, "eval_runtime": 37.8462, "eval_samples_per_second": 10.146, "eval_steps_per_second": 5.073, "step": 1100 }, { "epoch": 1.06, "eval_accuracy": 0.9739327649068412, "eval_f1": 0.8383422200678624, "eval_loss": 0.13158756494522095, "eval_precision": 0.852180339985218, "eval_recall": 0.8249463391366564, "eval_runtime": 37.9995, "eval_samples_per_second": 10.105, "eval_steps_per_second": 5.053, "step": 1200 }, { "epoch": 1.15, "eval_accuracy": 0.9773921281543364, "eval_f1": 0.8546778437251422, "eval_loss": 0.12233193963766098, "eval_precision": 0.8777177328138746, "eval_recall": 0.8328165990937276, "eval_runtime": 37.8677, "eval_samples_per_second": 10.141, "eval_steps_per_second": 5.07, "step": 1300 }, { "epoch": 1.24, "eval_accuracy": 0.9784830476846669, "eval_f1": 0.8620398310199154, "eval_loss": 0.1114952489733696, "eval_precision": 0.8726783968719453, "eval_recall": 0.8516575244455045, "eval_runtime": 37.8077, "eval_samples_per_second": 10.157, "eval_steps_per_second": 5.078, "step": 1400 }, { "epoch": 1.33, "learning_rate": 5e-06, "loss": 0.1384, "step": 1500 }, { "epoch": 1.33, "eval_accuracy": 0.9778801711021158, "eval_f1": 0.8650332474689989, "eval_loss": 0.10301075130701065, "eval_precision": 0.8691465029493198, "eval_recall": 0.8609587407584068, "eval_runtime": 37.7478, "eval_samples_per_second": 10.173, "eval_steps_per_second": 5.086, "step": 1500 }, { "epoch": 1.42, "eval_accuracy": 0.9811529296931071, "eval_f1": 0.8748258947495913, "eval_loss": 0.09539026767015457, "eval_precision": 0.8887658422542144, "eval_recall": 0.8613164798473647, "eval_runtime": 37.6325, "eval_samples_per_second": 10.204, "eval_steps_per_second": 5.102, "step": 1600 }, { "epoch": 1.51, "eval_accuracy": 0.9819711193408549, "eval_f1": 0.8838249516441005, "eval_loss": 0.09302261471748352, "eval_precision": 0.8961755332189262, "eval_recall": 0.8718101597901264, "eval_runtime": 37.72, "eval_samples_per_second": 10.18, "eval_steps_per_second": 5.09, "step": 1700 }, { "epoch": 1.59, "eval_accuracy": 0.9812821175322252, "eval_f1": 0.8815182901275221, "eval_loss": 0.09258309751749039, "eval_precision": 0.8851749428880606, "eval_recall": 0.8778917243024088, "eval_runtime": 37.682, "eval_samples_per_second": 10.191, "eval_steps_per_second": 5.095, "step": 1800 }, { "epoch": 1.68, "eval_accuracy": 0.9810380960583355, "eval_f1": 0.8837905834431532, "eval_loss": 0.0902891755104065, "eval_precision": 0.8879393355801637, "eval_recall": 0.8796804197471977, "eval_runtime": 37.6694, "eval_samples_per_second": 10.194, "eval_steps_per_second": 5.097, "step": 1900 }, { "epoch": 1.77, "learning_rate": 3.3333333333333333e-06, "loss": 0.0968, "step": 2000 }, { "epoch": 1.77, "eval_accuracy": 0.9826314127407918, "eval_f1": 0.8884760592077666, "eval_loss": 0.08607935905456543, "eval_precision": 0.8930249367546079, "eval_recall": 0.8839732888146912, "eval_runtime": 37.6927, "eval_samples_per_second": 10.188, "eval_steps_per_second": 5.094, "step": 2000 }, { "epoch": 1.86, "eval_accuracy": 0.9845692303275629, "eval_f1": 0.8967495219885278, "eval_loss": 0.07529100030660629, "eval_precision": 0.8986826347305389, "eval_recall": 0.8948247078464107, "eval_runtime": 37.5991, "eval_samples_per_second": 10.213, "eval_steps_per_second": 5.107, "step": 2100 }, { "epoch": 1.95, "eval_accuracy": 0.9830046220537996, "eval_f1": 0.8961644162982435, "eval_loss": 0.08021637052297592, "eval_precision": 0.8979885057471264, "eval_recall": 0.8943477223944669, "eval_runtime": 37.5671, "eval_samples_per_second": 10.222, "eval_steps_per_second": 5.111, "step": 2200 }, { "epoch": 2.04, "eval_accuracy": 0.9849137312318779, "eval_f1": 0.9005910800644815, "eval_loss": 0.07370590418577194, "eval_precision": 0.9018294870261868, "eval_recall": 0.899356069639876, "eval_runtime": 37.6512, "eval_samples_per_second": 10.199, "eval_steps_per_second": 5.099, "step": 2300 }, { "epoch": 2.13, "eval_accuracy": 0.9839807079493583, "eval_f1": 0.9032528103324563, "eval_loss": 0.07483410835266113, "eval_precision": 0.9058527224754138, "eval_recall": 0.9006677796327212, "eval_runtime": 37.6471, "eval_samples_per_second": 10.2, "eval_steps_per_second": 5.1, "step": 2400 }, { "epoch": 2.21, "learning_rate": 1.6666666666666667e-06, "loss": 0.0918, "step": 2500 }, { "epoch": 2.21, "eval_accuracy": 0.985301294749232, "eval_f1": 0.907269366092194, "eval_loss": 0.07416214793920517, "eval_precision": 0.9074317070261243, "eval_recall": 0.9071070832339614, "eval_runtime": 37.7271, "eval_samples_per_second": 10.178, "eval_steps_per_second": 5.089, "step": 2500 }, { "epoch": 2.3, "eval_accuracy": 0.986693652570838, "eval_f1": 0.9162969180956949, "eval_loss": 0.06871066987514496, "eval_precision": 0.9214905933429812, "eval_recall": 0.911161459575483, "eval_runtime": 37.5742, "eval_samples_per_second": 10.22, "eval_steps_per_second": 5.11, "step": 2600 }, { "epoch": 2.39, "eval_accuracy": 0.9862773806447909, "eval_f1": 0.9115873679183333, "eval_loss": 0.06786704063415527, "eval_precision": 0.9127316198445905, "eval_recall": 0.9104459813975674, "eval_runtime": 37.6479, "eval_samples_per_second": 10.2, "eval_steps_per_second": 5.1, "step": 2700 }, { "epoch": 2.48, "eval_accuracy": 0.9870381534751529, "eval_f1": 0.9173381080274545, "eval_loss": 0.06866415590047836, "eval_precision": 0.9182698052336002, "eval_recall": 0.9164082995468639, "eval_runtime": 37.6027, "eval_samples_per_second": 10.212, "eval_steps_per_second": 5.106, "step": 2800 }, { "epoch": 2.57, "eval_accuracy": 0.9870237992708064, "eval_f1": 0.9173084960296136, "eval_loss": 0.06812075525522232, "eval_precision": 0.918569891187373, "eval_recall": 0.916050560457906, "eval_runtime": 37.5601, "eval_samples_per_second": 10.224, "eval_steps_per_second": 5.112, "step": 2900 }, { "epoch": 2.66, "learning_rate": 0.0, "loss": 0.074, "step": 3000 }, { "epoch": 2.66, "eval_accuracy": 0.9870812160881922, "eval_f1": 0.9174279061436503, "eval_loss": 0.06755248457193375, "eval_precision": 0.9186894655028099, "eval_recall": 0.916169806820892, "eval_runtime": 37.5655, "eval_samples_per_second": 10.222, "eval_steps_per_second": 5.111, "step": 3000 } ], "max_steps": 3000, "num_train_epochs": 3, "total_flos": 1592999774208000.0, "trial_name": null, "trial_params": null }