{ "best_metric": 0.9160090191657272, "best_model_checkpoint": "swinv2-base-patch4-window12-192-22k-finetuned-lora-ISIC-2019/checkpoint-4875", "epoch": 99.2, "eval_steps": 500, "global_step": 6200, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.16, "learning_rate": 0.0009983870967741936, "loss": 1.4282, "step": 10 }, { "epoch": 0.32, "learning_rate": 0.0009970967741935483, "loss": 1.1082, "step": 20 }, { "epoch": 0.48, "learning_rate": 0.0009954838709677419, "loss": 1.0397, "step": 30 }, { "epoch": 0.64, "learning_rate": 0.0009938709677419356, "loss": 0.9258, "step": 40 }, { "epoch": 0.8, "learning_rate": 0.0009922580645161292, "loss": 0.8897, "step": 50 }, { "epoch": 0.96, "learning_rate": 0.0009906451612903225, "loss": 0.8488, "step": 60 }, { "epoch": 0.99, "step": 62, "train_accuracy": 0.718556119571348, "train_f1": 0.6867379798585972, "train_loss": 0.770628809928894, "train_precision": 0.708956589572109, "train_recall": 0.718556119571348, "train_runtime": 291.5866, "train_samples_per_second": 54.725, "train_steps_per_second": 0.857 }, { "epoch": 0.99, "eval_accuracy": 0.7153325817361894, "eval_f1": 0.6823083139813236, "eval_loss": 0.7977813482284546, "eval_precision": 0.7199162830832594, "eval_recall": 0.7153325817361894, "eval_runtime": 49.2679, "eval_samples_per_second": 36.007, "eval_steps_per_second": 0.568, "step": 62 }, { "epoch": 1.12, "learning_rate": 0.000989032258064516, "loss": 0.7836, "step": 70 }, { "epoch": 1.28, "learning_rate": 0.0009874193548387096, "loss": 0.772, "step": 80 }, { "epoch": 1.44, "learning_rate": 0.0009858064516129032, "loss": 0.8074, "step": 90 }, { "epoch": 1.6, "learning_rate": 0.0009841935483870968, "loss": 0.7912, "step": 100 }, { "epoch": 1.76, "learning_rate": 0.0009825806451612903, "loss": 0.7762, "step": 110 }, { "epoch": 1.92, "learning_rate": 0.0009809677419354839, "loss": 0.7795, "step": 120 }, { "epoch": 2.0, "step": 125, "train_accuracy": 0.7600426145265401, "train_f1": 0.7540133314127565, "train_loss": 0.6639156937599182, "train_precision": 0.7611520386158022, "train_recall": 0.7600426145265401, "train_runtime": 254.6664, "train_samples_per_second": 62.658, "train_steps_per_second": 0.982 }, { "epoch": 2.0, "eval_accuracy": 0.7497181510710259, "eval_f1": 0.7388896367994308, "eval_loss": 0.6961308717727661, "eval_precision": 0.7541740918352317, "eval_recall": 0.7497181510710259, "eval_runtime": 48.7662, "eval_samples_per_second": 36.378, "eval_steps_per_second": 0.574, "step": 125 }, { "epoch": 2.08, "learning_rate": 0.0009793548387096774, "loss": 0.7586, "step": 130 }, { "epoch": 2.24, "learning_rate": 0.000977741935483871, "loss": 0.705, "step": 140 }, { "epoch": 2.4, "learning_rate": 0.0009761290322580644, "loss": 0.6983, "step": 150 }, { "epoch": 2.56, "learning_rate": 0.0009745161290322581, "loss": 0.6913, "step": 160 }, { "epoch": 2.72, "learning_rate": 0.0009729032258064517, "loss": 0.6849, "step": 170 }, { "epoch": 2.88, "learning_rate": 0.0009714516129032258, "loss": 0.7169, "step": 180 }, { "epoch": 2.99, "step": 187, "train_accuracy": 0.7776524409350128, "train_f1": 0.7639537137185656, "train_loss": 0.6073001027107239, "train_precision": 0.7743141490761454, "train_recall": 0.7776524409350128, "train_runtime": 256.1493, "train_samples_per_second": 62.296, "train_steps_per_second": 0.976 }, { "epoch": 2.99, "eval_accuracy": 0.7717023675310034, "eval_f1": 0.7547317483415474, "eval_loss": 0.6364655494689941, "eval_precision": 0.7658539052724858, "eval_recall": 0.7717023675310034, "eval_runtime": 48.4464, "eval_samples_per_second": 36.618, "eval_steps_per_second": 0.578, "step": 187 }, { "epoch": 3.04, "learning_rate": 0.0009698387096774194, "loss": 0.6428, "step": 190 }, { "epoch": 3.2, "learning_rate": 0.0009682258064516129, "loss": 0.6604, "step": 200 }, { "epoch": 3.36, "learning_rate": 0.0009666129032258064, "loss": 0.6531, "step": 210 }, { "epoch": 3.52, "learning_rate": 0.000965, "loss": 0.643, "step": 220 }, { "epoch": 3.68, "learning_rate": 0.0009633870967741936, "loss": 0.6918, "step": 230 }, { "epoch": 3.84, "learning_rate": 0.0009617741935483872, "loss": 0.6442, "step": 240 }, { "epoch": 4.0, "learning_rate": 0.0009601612903225807, "loss": 0.6576, "step": 250 }, { "epoch": 4.0, "step": 250, "train_accuracy": 0.7903114620542708, "train_f1": 0.7760264280771675, "train_loss": 0.5970289707183838, "train_precision": 0.7953318203400003, "train_recall": 0.7903114620542708, "train_runtime": 256.7891, "train_samples_per_second": 62.14, "train_steps_per_second": 0.974 }, { "epoch": 4.0, "eval_accuracy": 0.790304396843292, "eval_f1": 0.7777020089235339, "eval_loss": 0.6154965162277222, "eval_precision": 0.7982692040791739, "eval_recall": 0.790304396843292, "eval_runtime": 46.9309, "eval_samples_per_second": 37.8, "eval_steps_per_second": 0.597, "step": 250 }, { "epoch": 4.16, "learning_rate": 0.0009585483870967742, "loss": 0.6104, "step": 260 }, { "epoch": 4.32, "learning_rate": 0.0009569354838709677, "loss": 0.5991, "step": 270 }, { "epoch": 4.48, "learning_rate": 0.0009553225806451613, "loss": 0.625, "step": 280 }, { "epoch": 4.64, "learning_rate": 0.0009537096774193548, "loss": 0.6223, "step": 290 }, { "epoch": 4.8, "learning_rate": 0.0009520967741935485, "loss": 0.6309, "step": 300 }, { "epoch": 4.96, "learning_rate": 0.000950483870967742, "loss": 0.6164, "step": 310 }, { "epoch": 4.99, "step": 312, "train_accuracy": 0.8017797831672621, "train_f1": 0.7931150004910923, "train_loss": 0.5476173758506775, "train_precision": 0.7996150347194898, "train_recall": 0.8017797831672621, "train_runtime": 254.273, "train_samples_per_second": 62.755, "train_steps_per_second": 0.983 }, { "epoch": 4.99, "eval_accuracy": 0.7733934611048479, "eval_f1": 0.7627200347192373, "eval_loss": 0.5989590883255005, "eval_precision": 0.7799215570339676, "eval_recall": 0.7733934611048479, "eval_runtime": 46.2691, "eval_samples_per_second": 38.341, "eval_steps_per_second": 0.605, "step": 312 }, { "epoch": 5.12, "learning_rate": 0.0009488709677419355, "loss": 0.6067, "step": 320 }, { "epoch": 5.28, "learning_rate": 0.0009472580645161291, "loss": 0.6144, "step": 330 }, { "epoch": 5.44, "learning_rate": 0.0009456451612903226, "loss": 0.5815, "step": 340 }, { "epoch": 5.6, "learning_rate": 0.0009440322580645162, "loss": 0.6036, "step": 350 }, { "epoch": 5.76, "learning_rate": 0.0009424193548387096, "loss": 0.5748, "step": 360 }, { "epoch": 5.92, "learning_rate": 0.0009408064516129032, "loss": 0.5779, "step": 370 }, { "epoch": 6.0, "step": 375, "train_accuracy": 0.8046625305508555, "train_f1": 0.8003331690711911, "train_loss": 0.5287690758705139, "train_precision": 0.8066353914139762, "train_recall": 0.8046625305508555, "train_runtime": 254.1046, "train_samples_per_second": 62.797, "train_steps_per_second": 0.984 }, { "epoch": 6.0, "eval_accuracy": 0.7745208568207441, "eval_f1": 0.7668632966865262, "eval_loss": 0.602535605430603, "eval_precision": 0.7770132133553053, "eval_recall": 0.7745208568207441, "eval_runtime": 38.0169, "eval_samples_per_second": 46.663, "eval_steps_per_second": 0.737, "step": 375 }, { "epoch": 6.08, "learning_rate": 0.0009391935483870969, "loss": 0.5808, "step": 380 }, { "epoch": 6.24, "learning_rate": 0.0009375806451612904, "loss": 0.5692, "step": 390 }, { "epoch": 6.4, "learning_rate": 0.0009359677419354839, "loss": 0.5525, "step": 400 }, { "epoch": 6.56, "learning_rate": 0.0009343548387096774, "loss": 0.562, "step": 410 }, { "epoch": 6.72, "learning_rate": 0.000932741935483871, "loss": 0.5858, "step": 420 }, { "epoch": 6.88, "learning_rate": 0.0009311290322580645, "loss": 0.5647, "step": 430 }, { "epoch": 6.99, "step": 437, "train_accuracy": 0.8250924359215391, "train_f1": 0.8156580365652172, "train_loss": 0.4726848304271698, "train_precision": 0.8244531001171268, "train_recall": 0.8250924359215391, "train_runtime": 254.8694, "train_samples_per_second": 62.609, "train_steps_per_second": 0.981 }, { "epoch": 6.99, "eval_accuracy": 0.8094701240135288, "eval_f1": 0.8000649092582361, "eval_loss": 0.5391651391983032, "eval_precision": 0.8082600629133598, "eval_recall": 0.8094701240135288, "eval_runtime": 33.5973, "eval_samples_per_second": 52.802, "eval_steps_per_second": 0.833, "step": 437 }, { "epoch": 7.04, "learning_rate": 0.0009295161290322581, "loss": 0.5795, "step": 440 }, { "epoch": 7.2, "learning_rate": 0.0009279032258064515, "loss": 0.535, "step": 450 }, { "epoch": 7.36, "learning_rate": 0.0009262903225806451, "loss": 0.5441, "step": 460 }, { "epoch": 7.52, "learning_rate": 0.0009246774193548388, "loss": 0.5329, "step": 470 }, { "epoch": 7.68, "learning_rate": 0.0009230645161290323, "loss": 0.5191, "step": 480 }, { "epoch": 7.84, "learning_rate": 0.0009214516129032259, "loss": 0.5428, "step": 490 }, { "epoch": 8.0, "learning_rate": 0.0009198387096774193, "loss": 0.5062, "step": 500 }, { "epoch": 8.0, "step": 500, "train_accuracy": 0.8309832675314909, "train_f1": 0.8223807681274183, "train_loss": 0.4595116674900055, "train_precision": 0.8314452738097804, "train_recall": 0.8309832675314909, "train_runtime": 254.2706, "train_samples_per_second": 62.756, "train_steps_per_second": 0.983 }, { "epoch": 8.0, "eval_accuracy": 0.8015783540022547, "eval_f1": 0.7895223836045016, "eval_loss": 0.5510557293891907, "eval_precision": 0.8031324191974503, "eval_recall": 0.8015783540022547, "eval_runtime": 33.1712, "eval_samples_per_second": 53.48, "eval_steps_per_second": 0.844, "step": 500 }, { "epoch": 8.16, "learning_rate": 0.0009182258064516129, "loss": 0.5424, "step": 510 }, { "epoch": 8.32, "learning_rate": 0.0009166129032258065, "loss": 0.5172, "step": 520 }, { "epoch": 8.48, "learning_rate": 0.000915, "loss": 0.5081, "step": 530 }, { "epoch": 8.64, "learning_rate": 0.0009133870967741935, "loss": 0.5357, "step": 540 }, { "epoch": 8.8, "learning_rate": 0.0009117741935483871, "loss": 0.5317, "step": 550 }, { "epoch": 8.96, "learning_rate": 0.0009101612903225807, "loss": 0.5479, "step": 560 }, { "epoch": 8.99, "step": 562, "train_accuracy": 0.8421382465375697, "train_f1": 0.8356541787788663, "train_loss": 0.4283278286457062, "train_precision": 0.8418489980800979, "train_recall": 0.8421382465375697, "train_runtime": 253.325, "train_samples_per_second": 62.99, "train_steps_per_second": 0.987 }, { "epoch": 8.99, "eval_accuracy": 0.8156708004509583, "eval_f1": 0.8099706186065314, "eval_loss": 0.5151851773262024, "eval_precision": 0.8175937941832333, "eval_recall": 0.8156708004509583, "eval_runtime": 29.3964, "eval_samples_per_second": 60.347, "eval_steps_per_second": 0.952, "step": 562 }, { "epoch": 9.12, "learning_rate": 0.0009087096774193548, "loss": 0.4922, "step": 570 }, { "epoch": 9.28, "learning_rate": 0.0009070967741935484, "loss": 0.4682, "step": 580 }, { "epoch": 9.44, "learning_rate": 0.0009054838709677419, "loss": 0.5159, "step": 590 }, { "epoch": 9.6, "learning_rate": 0.0009038709677419356, "loss": 0.5072, "step": 600 }, { "epoch": 9.76, "learning_rate": 0.0009022580645161291, "loss": 0.4946, "step": 610 }, { "epoch": 9.92, "learning_rate": 0.0009006451612903226, "loss": 0.504, "step": 620 }, { "epoch": 10.0, "step": 625, "train_accuracy": 0.8490317728896409, "train_f1": 0.8425370562453873, "train_loss": 0.4146420955657959, "train_precision": 0.8499471633168426, "train_recall": 0.8490317728896409, "train_runtime": 252.5657, "train_samples_per_second": 63.18, "train_steps_per_second": 0.99 }, { "epoch": 10.0, "eval_accuracy": 0.8246899661781285, "eval_f1": 0.8181338629292875, "eval_loss": 0.4954419434070587, "eval_precision": 0.8265610533827844, "eval_recall": 0.8246899661781285, "eval_runtime": 29.7136, "eval_samples_per_second": 59.703, "eval_steps_per_second": 0.942, "step": 625 }, { "epoch": 10.08, "learning_rate": 0.0008990322580645162, "loss": 0.4777, "step": 630 }, { "epoch": 10.24, "learning_rate": 0.0008974193548387097, "loss": 0.4595, "step": 640 }, { "epoch": 10.4, "learning_rate": 0.0008958064516129032, "loss": 0.4765, "step": 650 }, { "epoch": 10.56, "learning_rate": 0.0008941935483870967, "loss": 0.481, "step": 660 }, { "epoch": 10.72, "learning_rate": 0.0008925806451612903, "loss": 0.4936, "step": 670 }, { "epoch": 10.88, "learning_rate": 0.0008909677419354839, "loss": 0.4928, "step": 680 }, { "epoch": 10.99, "step": 687, "train_accuracy": 0.8662029203484364, "train_f1": 0.8651095243578739, "train_loss": 0.36719974875450134, "train_precision": 0.8661939607708877, "train_recall": 0.8662029203484364, "train_runtime": 248.0205, "train_samples_per_second": 64.337, "train_steps_per_second": 1.008 }, { "epoch": 10.99, "eval_accuracy": 0.8325817361894025, "eval_f1": 0.8330415565435833, "eval_loss": 0.4721773862838745, "eval_precision": 0.8382637561400605, "eval_recall": 0.8325817361894025, "eval_runtime": 29.1932, "eval_samples_per_second": 60.768, "eval_steps_per_second": 0.959, "step": 687 }, { "epoch": 11.04, "learning_rate": 0.0008893548387096775, "loss": 0.4791, "step": 690 }, { "epoch": 11.2, "learning_rate": 0.000887741935483871, "loss": 0.471, "step": 700 }, { "epoch": 11.36, "learning_rate": 0.0008861290322580645, "loss": 0.4514, "step": 710 }, { "epoch": 11.52, "learning_rate": 0.0008845161290322581, "loss": 0.4554, "step": 720 }, { "epoch": 11.68, "learning_rate": 0.0008829032258064516, "loss": 0.4778, "step": 730 }, { "epoch": 11.84, "learning_rate": 0.0008812903225806452, "loss": 0.4214, "step": 740 }, { "epoch": 12.0, "learning_rate": 0.0008796774193548387, "loss": 0.4555, "step": 750 }, { "epoch": 12.0, "step": 750, "train_accuracy": 0.8760418625054834, "train_f1": 0.8735297151164703, "train_loss": 0.341611385345459, "train_precision": 0.8749284746900984, "train_recall": 0.8760418625054834, "train_runtime": 251.381, "train_samples_per_second": 63.477, "train_steps_per_second": 0.995 }, { "epoch": 12.0, "eval_accuracy": 0.846674182638106, "eval_f1": 0.8431872563091386, "eval_loss": 0.43833523988723755, "eval_precision": 0.8434438125814474, "eval_recall": 0.846674182638106, "eval_runtime": 29.6753, "eval_samples_per_second": 59.78, "eval_steps_per_second": 0.944, "step": 750 }, { "epoch": 12.16, "learning_rate": 0.0008780645161290322, "loss": 0.4597, "step": 760 }, { "epoch": 12.32, "learning_rate": 0.0008764516129032259, "loss": 0.4253, "step": 770 }, { "epoch": 12.48, "learning_rate": 0.0008748387096774194, "loss": 0.473, "step": 780 }, { "epoch": 12.64, "learning_rate": 0.0008732258064516129, "loss": 0.4244, "step": 790 }, { "epoch": 12.8, "learning_rate": 0.0008716129032258064, "loss": 0.4602, "step": 800 }, { "epoch": 12.96, "learning_rate": 0.00087, "loss": 0.4345, "step": 810 }, { "epoch": 12.99, "step": 812, "train_accuracy": 0.8737857993357148, "train_f1": 0.8699664840253412, "train_loss": 0.3363898992538452, "train_precision": 0.8723546877750733, "train_recall": 0.8737857993357148, "train_runtime": 254.2635, "train_samples_per_second": 62.758, "train_steps_per_second": 0.983 }, { "epoch": 12.99, "eval_accuracy": 0.8511837655016911, "eval_f1": 0.8464360738395965, "eval_loss": 0.44016385078430176, "eval_precision": 0.8479714249543402, "eval_recall": 0.8511837655016911, "eval_runtime": 29.6817, "eval_samples_per_second": 59.767, "eval_steps_per_second": 0.943, "step": 812 }, { "epoch": 13.12, "learning_rate": 0.0008683870967741936, "loss": 0.4296, "step": 820 }, { "epoch": 13.28, "learning_rate": 0.0008667741935483871, "loss": 0.4024, "step": 830 }, { "epoch": 13.44, "learning_rate": 0.0008651612903225806, "loss": 0.4268, "step": 840 }, { "epoch": 13.6, "learning_rate": 0.0008635483870967742, "loss": 0.411, "step": 850 }, { "epoch": 13.76, "learning_rate": 0.0008619354838709678, "loss": 0.4179, "step": 860 }, { "epoch": 13.92, "learning_rate": 0.0008603225806451614, "loss": 0.4398, "step": 870 }, { "epoch": 14.0, "step": 875, "train_accuracy": 0.880553988845021, "train_f1": 0.8770183301442244, "train_loss": 0.3260194957256317, "train_precision": 0.8807172403068199, "train_recall": 0.880553988845021, "train_runtime": 252.7172, "train_samples_per_second": 63.142, "train_steps_per_second": 0.989 }, { "epoch": 14.0, "eval_accuracy": 0.8494926719278467, "eval_f1": 0.8469368583418073, "eval_loss": 0.44426438212394714, "eval_precision": 0.8497246468797232, "eval_recall": 0.8494926719278467, "eval_runtime": 29.5345, "eval_samples_per_second": 60.065, "eval_steps_per_second": 0.948, "step": 875 }, { "epoch": 14.08, "learning_rate": 0.0008587096774193549, "loss": 0.4153, "step": 880 }, { "epoch": 14.24, "learning_rate": 0.0008570967741935484, "loss": 0.4065, "step": 890 }, { "epoch": 14.4, "learning_rate": 0.0008554838709677419, "loss": 0.4045, "step": 900 }, { "epoch": 14.56, "learning_rate": 0.0008538709677419355, "loss": 0.3879, "step": 910 }, { "epoch": 14.72, "learning_rate": 0.000852258064516129, "loss": 0.4095, "step": 920 }, { "epoch": 14.88, "learning_rate": 0.0008506451612903226, "loss": 0.405, "step": 930 }, { "epoch": 14.99, "step": 937, "train_accuracy": 0.8919596415366297, "train_f1": 0.8898750533747908, "train_loss": 0.29893702268600464, "train_precision": 0.8905204704311594, "train_recall": 0.8919596415366297, "train_runtime": 255.1579, "train_samples_per_second": 62.538, "train_steps_per_second": 0.98 }, { "epoch": 14.99, "eval_accuracy": 0.8568207440811725, "eval_f1": 0.8543462911384269, "eval_loss": 0.4096240699291229, "eval_precision": 0.8552780691368613, "eval_recall": 0.8568207440811725, "eval_runtime": 29.6726, "eval_samples_per_second": 59.786, "eval_steps_per_second": 0.944, "step": 937 }, { "epoch": 15.04, "learning_rate": 0.0008490322580645162, "loss": 0.4047, "step": 940 }, { "epoch": 15.2, "learning_rate": 0.0008474193548387097, "loss": 0.4049, "step": 950 }, { "epoch": 15.36, "learning_rate": 0.0008458064516129033, "loss": 0.39, "step": 960 }, { "epoch": 15.52, "learning_rate": 0.0008441935483870968, "loss": 0.4253, "step": 970 }, { "epoch": 15.68, "learning_rate": 0.0008425806451612903, "loss": 0.3707, "step": 980 }, { "epoch": 15.84, "learning_rate": 0.0008409677419354838, "loss": 0.389, "step": 990 }, { "epoch": 16.0, "learning_rate": 0.0008393548387096774, "loss": 0.4069, "step": 1000 }, { "epoch": 16.0, "step": 1000, "train_accuracy": 0.8934636836498089, "train_f1": 0.8909693605701321, "train_loss": 0.2904220521450043, "train_precision": 0.893519044249712, "train_recall": 0.8934636836498089, "train_runtime": 254.2734, "train_samples_per_second": 62.755, "train_steps_per_second": 0.983 }, { "epoch": 16.0, "eval_accuracy": 0.8500563697857948, "eval_f1": 0.8452271271553625, "eval_loss": 0.4389975965023041, "eval_precision": 0.851487739267586, "eval_recall": 0.8500563697857948, "eval_runtime": 29.5522, "eval_samples_per_second": 60.029, "eval_steps_per_second": 0.947, "step": 1000 }, { "epoch": 16.16, "learning_rate": 0.0008377419354838711, "loss": 0.389, "step": 1010 }, { "epoch": 16.32, "learning_rate": 0.0008361290322580646, "loss": 0.3682, "step": 1020 }, { "epoch": 16.48, "learning_rate": 0.0008345161290322581, "loss": 0.3746, "step": 1030 }, { "epoch": 16.64, "learning_rate": 0.0008329032258064516, "loss": 0.3817, "step": 1040 }, { "epoch": 16.8, "learning_rate": 0.0008312903225806452, "loss": 0.3652, "step": 1050 }, { "epoch": 16.96, "learning_rate": 0.0008296774193548387, "loss": 0.3774, "step": 1060 }, { "epoch": 16.99, "step": 1062, "train_accuracy": 0.9058093626621545, "train_f1": 0.9046539806661633, "train_loss": 0.2608683109283447, "train_precision": 0.9049170910236276, "train_recall": 0.9058093626621545, "train_runtime": 253.2237, "train_samples_per_second": 63.015, "train_steps_per_second": 0.987 }, { "epoch": 16.99, "eval_accuracy": 0.8579481397970687, "eval_f1": 0.8563523858127897, "eval_loss": 0.415022075176239, "eval_precision": 0.8576310002165511, "eval_recall": 0.8579481397970687, "eval_runtime": 29.5963, "eval_samples_per_second": 59.94, "eval_steps_per_second": 0.946, "step": 1062 }, { "epoch": 17.12, "learning_rate": 0.0008280645161290323, "loss": 0.3537, "step": 1070 }, { "epoch": 17.28, "learning_rate": 0.0008264516129032257, "loss": 0.3743, "step": 1080 }, { "epoch": 17.44, "learning_rate": 0.0008248387096774194, "loss": 0.3648, "step": 1090 }, { "epoch": 17.6, "learning_rate": 0.000823225806451613, "loss": 0.3659, "step": 1100 }, { "epoch": 17.76, "learning_rate": 0.0008216129032258065, "loss": 0.3713, "step": 1110 }, { "epoch": 17.92, "learning_rate": 0.00082, "loss": 0.3631, "step": 1120 }, { "epoch": 18.0, "step": 1125, "train_accuracy": 0.9117628626934887, "train_f1": 0.9111752276141204, "train_loss": 0.24888941645622253, "train_precision": 0.9116531142476182, "train_recall": 0.9117628626934887, "train_runtime": 253.2878, "train_samples_per_second": 62.999, "train_steps_per_second": 0.987 }, { "epoch": 18.0, "eval_accuracy": 0.85456595264938, "eval_f1": 0.8546917151279523, "eval_loss": 0.42011961340904236, "eval_precision": 0.858590913110437, "eval_recall": 0.85456595264938, "eval_runtime": 29.5881, "eval_samples_per_second": 59.956, "eval_steps_per_second": 0.946, "step": 1125 }, { "epoch": 18.08, "learning_rate": 0.0008183870967741935, "loss": 0.3537, "step": 1130 }, { "epoch": 18.24, "learning_rate": 0.0008167741935483871, "loss": 0.3214, "step": 1140 }, { "epoch": 18.4, "learning_rate": 0.0008151612903225807, "loss": 0.3464, "step": 1150 }, { "epoch": 18.56, "learning_rate": 0.0008135483870967742, "loss": 0.3503, "step": 1160 }, { "epoch": 18.72, "learning_rate": 0.0008119354838709677, "loss": 0.3745, "step": 1170 }, { "epoch": 18.88, "learning_rate": 0.0008103225806451613, "loss": 0.3458, "step": 1180 }, { "epoch": 18.99, "step": 1187, "train_accuracy": 0.912326878485931, "train_f1": 0.9113314150149505, "train_loss": 0.24995951354503632, "train_precision": 0.9115719864017833, "train_recall": 0.912326878485931, "train_runtime": 254.6215, "train_samples_per_second": 62.669, "train_steps_per_second": 0.982 }, { "epoch": 18.99, "eval_accuracy": 0.8562570462232244, "eval_f1": 0.8542249820828076, "eval_loss": 0.40477874875068665, "eval_precision": 0.8544614619611243, "eval_recall": 0.8562570462232244, "eval_runtime": 29.856, "eval_samples_per_second": 59.418, "eval_steps_per_second": 0.938, "step": 1187 }, { "epoch": 19.04, "learning_rate": 0.0008087096774193549, "loss": 0.3953, "step": 1190 }, { "epoch": 19.2, "learning_rate": 0.0008070967741935484, "loss": 0.3386, "step": 1200 }, { "epoch": 19.36, "learning_rate": 0.000805483870967742, "loss": 0.3322, "step": 1210 }, { "epoch": 19.52, "learning_rate": 0.0008038709677419355, "loss": 0.3425, "step": 1220 }, { "epoch": 19.68, "learning_rate": 0.000802258064516129, "loss": 0.3448, "step": 1230 }, { "epoch": 19.84, "learning_rate": 0.0008006451612903226, "loss": 0.3534, "step": 1240 }, { "epoch": 20.0, "learning_rate": 0.0007990322580645161, "loss": 0.3361, "step": 1250 }, { "epoch": 20.0, "step": 1250, "train_accuracy": 0.9059346995049194, "train_f1": 0.9033631776657957, "train_loss": 0.2528255581855774, "train_precision": 0.9064546977324616, "train_recall": 0.9059346995049194, "train_runtime": 252.7613, "train_samples_per_second": 63.131, "train_steps_per_second": 0.989 }, { "epoch": 20.0, "eval_accuracy": 0.8596392333709132, "eval_f1": 0.8566333454163209, "eval_loss": 0.4370974004268646, "eval_precision": 0.8585278408293291, "eval_recall": 0.8596392333709132, "eval_runtime": 29.8096, "eval_samples_per_second": 59.511, "eval_steps_per_second": 0.939, "step": 1250 }, { "epoch": 20.16, "learning_rate": 0.0007974193548387097, "loss": 0.3154, "step": 1260 }, { "epoch": 20.32, "learning_rate": 0.0007958064516129032, "loss": 0.3478, "step": 1270 }, { "epoch": 20.48, "learning_rate": 0.0007941935483870968, "loss": 0.3385, "step": 1280 }, { "epoch": 20.64, "learning_rate": 0.0007925806451612904, "loss": 0.3327, "step": 1290 }, { "epoch": 20.8, "learning_rate": 0.0007909677419354839, "loss": 0.3398, "step": 1300 }, { "epoch": 20.96, "learning_rate": 0.0007893548387096774, "loss": 0.3386, "step": 1310 }, { "epoch": 20.99, "step": 1312, "train_accuracy": 0.9205991101084163, "train_f1": 0.9202297733826367, "train_loss": 0.22639435529708862, "train_precision": 0.9204915599848654, "train_recall": 0.9205991101084163, "train_runtime": 253.7128, "train_samples_per_second": 62.894, "train_steps_per_second": 0.985 }, { "epoch": 20.99, "eval_accuracy": 0.8686583990980834, "eval_f1": 0.8680154821185954, "eval_loss": 0.39551448822021484, "eval_precision": 0.8689593382775722, "eval_recall": 0.8686583990980834, "eval_runtime": 29.773, "eval_samples_per_second": 59.584, "eval_steps_per_second": 0.94, "step": 1312 }, { "epoch": 21.12, "learning_rate": 0.0007877419354838709, "loss": 0.3038, "step": 1320 }, { "epoch": 21.28, "learning_rate": 0.0007861290322580645, "loss": 0.3157, "step": 1330 }, { "epoch": 21.44, "learning_rate": 0.0007845161290322582, "loss": 0.318, "step": 1340 }, { "epoch": 21.6, "learning_rate": 0.0007829032258064517, "loss": 0.2993, "step": 1350 }, { "epoch": 21.76, "learning_rate": 0.0007812903225806452, "loss": 0.3185, "step": 1360 }, { "epoch": 21.92, "learning_rate": 0.0007796774193548387, "loss": 0.3091, "step": 1370 }, { "epoch": 22.0, "step": 1375, "train_accuracy": 0.9207871153725637, "train_f1": 0.919568201335574, "train_loss": 0.21673625707626343, "train_precision": 0.9203664780549666, "train_recall": 0.9207871153725637, "train_runtime": 249.1604, "train_samples_per_second": 64.043, "train_steps_per_second": 1.003 }, { "epoch": 22.0, "eval_accuracy": 0.8680947012401353, "eval_f1": 0.8657724581221397, "eval_loss": 0.4277941584587097, "eval_precision": 0.8671942484944011, "eval_recall": 0.8680947012401353, "eval_runtime": 29.1495, "eval_samples_per_second": 60.859, "eval_steps_per_second": 0.961, "step": 1375 }, { "epoch": 22.08, "learning_rate": 0.0007780645161290323, "loss": 0.3109, "step": 1380 }, { "epoch": 22.24, "learning_rate": 0.0007764516129032258, "loss": 0.3082, "step": 1390 }, { "epoch": 22.4, "learning_rate": 0.0007748387096774193, "loss": 0.3133, "step": 1400 }, { "epoch": 22.56, "learning_rate": 0.0007732258064516128, "loss": 0.3217, "step": 1410 }, { "epoch": 22.72, "learning_rate": 0.0007716129032258065, "loss": 0.3145, "step": 1420 }, { "epoch": 22.88, "learning_rate": 0.0007700000000000001, "loss": 0.3081, "step": 1430 }, { "epoch": 22.99, "step": 1437, "train_accuracy": 0.9301247101585511, "train_f1": 0.9298726796945993, "train_loss": 0.2020701915025711, "train_precision": 0.9301061473852973, "train_recall": 0.9301247101585511, "train_runtime": 248.5533, "train_samples_per_second": 64.2, "train_steps_per_second": 1.006 }, { "epoch": 22.99, "eval_accuracy": 0.8675310033821871, "eval_f1": 0.8662116604826631, "eval_loss": 0.39544782042503357, "eval_precision": 0.866086748268126, "eval_recall": 0.8675310033821871, "eval_runtime": 29.2034, "eval_samples_per_second": 60.746, "eval_steps_per_second": 0.959, "step": 1437 }, { "epoch": 23.04, "learning_rate": 0.0007683870967741936, "loss": 0.3357, "step": 1440 }, { "epoch": 23.2, "learning_rate": 0.0007667741935483871, "loss": 0.2981, "step": 1450 }, { "epoch": 23.36, "learning_rate": 0.0007651612903225806, "loss": 0.2823, "step": 1460 }, { "epoch": 23.52, "learning_rate": 0.0007635483870967742, "loss": 0.3036, "step": 1470 }, { "epoch": 23.68, "learning_rate": 0.0007619354838709678, "loss": 0.3097, "step": 1480 }, { "epoch": 23.84, "learning_rate": 0.0007603225806451613, "loss": 0.3004, "step": 1490 }, { "epoch": 24.0, "learning_rate": 0.0007587096774193549, "loss": 0.3031, "step": 1500 }, { "epoch": 24.0, "step": 1500, "train_accuracy": 0.9242965469699819, "train_f1": 0.9232184701149497, "train_loss": 0.20474377274513245, "train_precision": 0.9253522346156541, "train_recall": 0.9242965469699819, "train_runtime": 248.6452, "train_samples_per_second": 64.176, "train_steps_per_second": 1.005 }, { "epoch": 24.0, "eval_accuracy": 0.8720405862457723, "eval_f1": 0.8716583234363133, "eval_loss": 0.42239370942115784, "eval_precision": 0.8734092383360484, "eval_recall": 0.8720405862457723, "eval_runtime": 29.0555, "eval_samples_per_second": 61.055, "eval_steps_per_second": 0.964, "step": 1500 }, { "epoch": 24.16, "learning_rate": 0.0007570967741935484, "loss": 0.2858, "step": 1510 }, { "epoch": 24.32, "learning_rate": 0.000755483870967742, "loss": 0.2999, "step": 1520 }, { "epoch": 24.48, "learning_rate": 0.0007538709677419355, "loss": 0.3135, "step": 1530 }, { "epoch": 24.64, "learning_rate": 0.000752258064516129, "loss": 0.2951, "step": 1540 }, { "epoch": 24.8, "learning_rate": 0.0007506451612903225, "loss": 0.3136, "step": 1550 }, { "epoch": 24.96, "learning_rate": 0.0007490322580645161, "loss": 0.2918, "step": 1560 }, { "epoch": 24.99, "step": 1562, "train_accuracy": 0.9315660838503478, "train_f1": 0.9309767971055543, "train_loss": 0.1887647807598114, "train_precision": 0.9311524146378474, "train_recall": 0.9315660838503478, "train_runtime": 249.2905, "train_samples_per_second": 64.01, "train_steps_per_second": 1.003 }, { "epoch": 24.99, "eval_accuracy": 0.8680947012401353, "eval_f1": 0.8669054461224185, "eval_loss": 0.43037477135658264, "eval_precision": 0.8673301666844889, "eval_recall": 0.8680947012401353, "eval_runtime": 29.0965, "eval_samples_per_second": 60.97, "eval_steps_per_second": 0.962, "step": 1562 }, { "epoch": 25.12, "learning_rate": 0.0007474193548387097, "loss": 0.2943, "step": 1570 }, { "epoch": 25.28, "learning_rate": 0.0007458064516129033, "loss": 0.2796, "step": 1580 }, { "epoch": 25.44, "learning_rate": 0.0007441935483870968, "loss": 0.2712, "step": 1590 }, { "epoch": 25.6, "learning_rate": 0.0007425806451612903, "loss": 0.2862, "step": 1600 }, { "epoch": 25.76, "learning_rate": 0.0007409677419354839, "loss": 0.2833, "step": 1610 }, { "epoch": 25.92, "learning_rate": 0.0007393548387096775, "loss": 0.2594, "step": 1620 }, { "epoch": 26.0, "step": 1625, "train_accuracy": 0.934824841762236, "train_f1": 0.9340766757397655, "train_loss": 0.18092262744903564, "train_precision": 0.9349816666427498, "train_recall": 0.934824841762236, "train_runtime": 249.0812, "train_samples_per_second": 64.063, "train_steps_per_second": 1.004 }, { "epoch": 26.0, "eval_accuracy": 0.8776775648252536, "eval_f1": 0.8766912677805229, "eval_loss": 0.421634703874588, "eval_precision": 0.8774332235361698, "eval_recall": 0.8776775648252536, "eval_runtime": 30.0967, "eval_samples_per_second": 58.943, "eval_steps_per_second": 0.93, "step": 1625 }, { "epoch": 26.08, "learning_rate": 0.000737741935483871, "loss": 0.2729, "step": 1630 }, { "epoch": 26.24, "learning_rate": 0.0007361290322580645, "loss": 0.2801, "step": 1640 }, { "epoch": 26.4, "learning_rate": 0.000734516129032258, "loss": 0.2653, "step": 1650 }, { "epoch": 26.56, "learning_rate": 0.0007329032258064517, "loss": 0.3044, "step": 1660 }, { "epoch": 26.72, "learning_rate": 0.0007312903225806452, "loss": 0.2751, "step": 1670 }, { "epoch": 26.88, "learning_rate": 0.0007296774193548388, "loss": 0.3028, "step": 1680 }, { "epoch": 26.99, "step": 1687, "train_accuracy": 0.93670489440371, "train_f1": 0.9361197667432394, "train_loss": 0.1785627156496048, "train_precision": 0.9365292015778245, "train_recall": 0.93670489440371, "train_runtime": 255.0897, "train_samples_per_second": 62.554, "train_steps_per_second": 0.98 }, { "epoch": 26.99, "eval_accuracy": 0.8810597519729425, "eval_f1": 0.8793922695566861, "eval_loss": 0.40421751141548157, "eval_precision": 0.8798634255905717, "eval_recall": 0.8810597519729425, "eval_runtime": 45.5693, "eval_samples_per_second": 38.93, "eval_steps_per_second": 0.614, "step": 1687 }, { "epoch": 27.04, "learning_rate": 0.0007280645161290323, "loss": 0.2499, "step": 1690 }, { "epoch": 27.2, "learning_rate": 0.0007264516129032258, "loss": 0.2792, "step": 1700 }, { "epoch": 27.36, "learning_rate": 0.0007248387096774194, "loss": 0.2792, "step": 1710 }, { "epoch": 27.52, "learning_rate": 0.0007232258064516129, "loss": 0.2865, "step": 1720 }, { "epoch": 27.68, "learning_rate": 0.0007216129032258064, "loss": 0.2845, "step": 1730 }, { "epoch": 27.84, "learning_rate": 0.0007199999999999999, "loss": 0.2861, "step": 1740 }, { "epoch": 28.0, "learning_rate": 0.0007183870967741936, "loss": 0.2758, "step": 1750 }, { "epoch": 28.0, "step": 1750, "train_accuracy": 0.938459610202419, "train_f1": 0.9377525981628592, "train_loss": 0.1685272455215454, "train_precision": 0.9389554252034343, "train_recall": 0.938459610202419, "train_runtime": 253.2422, "train_samples_per_second": 63.011, "train_steps_per_second": 0.987 }, { "epoch": 28.0, "eval_accuracy": 0.8680947012401353, "eval_f1": 0.8681614791663694, "eval_loss": 0.41954031586647034, "eval_precision": 0.8691594298818118, "eval_recall": 0.8680947012401353, "eval_runtime": 47.5593, "eval_samples_per_second": 37.301, "eval_steps_per_second": 0.589, "step": 1750 }, { "epoch": 28.16, "learning_rate": 0.0007167741935483872, "loss": 0.2659, "step": 1760 }, { "epoch": 28.32, "learning_rate": 0.0007151612903225807, "loss": 0.2522, "step": 1770 }, { "epoch": 28.48, "learning_rate": 0.0007135483870967742, "loss": 0.2755, "step": 1780 }, { "epoch": 28.64, "learning_rate": 0.0007119354838709677, "loss": 0.2736, "step": 1790 }, { "epoch": 28.8, "learning_rate": 0.0007103225806451613, "loss": 0.2847, "step": 1800 }, { "epoch": 28.96, "learning_rate": 0.0007087096774193548, "loss": 0.2833, "step": 1810 }, { "epoch": 28.99, "step": 1812, "train_accuracy": 0.9406530049508053, "train_f1": 0.9397675181987466, "train_loss": 0.16751761734485626, "train_precision": 0.9410854777530413, "train_recall": 0.9406530049508053, "train_runtime": 254.9572, "train_samples_per_second": 62.587, "train_steps_per_second": 0.981 }, { "epoch": 28.99, "eval_accuracy": 0.8759864712514093, "eval_f1": 0.872766620485809, "eval_loss": 0.37792226672172546, "eval_precision": 0.8741418008848874, "eval_recall": 0.8759864712514093, "eval_runtime": 41.0022, "eval_samples_per_second": 43.266, "eval_steps_per_second": 0.683, "step": 1812 }, { "epoch": 29.12, "learning_rate": 0.0007070967741935484, "loss": 0.2487, "step": 1820 }, { "epoch": 29.28, "learning_rate": 0.000705483870967742, "loss": 0.2712, "step": 1830 }, { "epoch": 29.44, "learning_rate": 0.0007038709677419355, "loss": 0.243, "step": 1840 }, { "epoch": 29.6, "learning_rate": 0.0007022580645161291, "loss": 0.2438, "step": 1850 }, { "epoch": 29.76, "learning_rate": 0.0007006451612903226, "loss": 0.2834, "step": 1860 }, { "epoch": 29.92, "learning_rate": 0.0006990322580645161, "loss": 0.2414, "step": 1870 }, { "epoch": 30.0, "step": 1875, "train_accuracy": 0.9470451839318168, "train_f1": 0.9467087754155913, "train_loss": 0.15353631973266602, "train_precision": 0.9468910650190296, "train_recall": 0.9470451839318168, "train_runtime": 255.1175, "train_samples_per_second": 62.548, "train_steps_per_second": 0.98 }, { "epoch": 30.0, "eval_accuracy": 0.8799323562570462, "eval_f1": 0.8785953814489085, "eval_loss": 0.4351659119129181, "eval_precision": 0.8796722516525893, "eval_recall": 0.8799323562570462, "eval_runtime": 38.7284, "eval_samples_per_second": 45.806, "eval_steps_per_second": 0.723, "step": 1875 }, { "epoch": 30.08, "learning_rate": 0.0006974193548387096, "loss": 0.2458, "step": 1880 }, { "epoch": 30.24, "learning_rate": 0.0006958064516129032, "loss": 0.2436, "step": 1890 }, { "epoch": 30.4, "learning_rate": 0.0006941935483870968, "loss": 0.2279, "step": 1900 }, { "epoch": 30.56, "learning_rate": 0.0006925806451612904, "loss": 0.2496, "step": 1910 }, { "epoch": 30.72, "learning_rate": 0.0006909677419354839, "loss": 0.2527, "step": 1920 }, { "epoch": 30.88, "learning_rate": 0.0006893548387096774, "loss": 0.2508, "step": 1930 }, { "epoch": 30.99, "step": 1937, "train_accuracy": 0.945729147082785, "train_f1": 0.9452594948649355, "train_loss": 0.14930781722068787, "train_precision": 0.9455852542228912, "train_recall": 0.945729147082785, "train_runtime": 254.6951, "train_samples_per_second": 62.651, "train_steps_per_second": 0.982 }, { "epoch": 30.99, "eval_accuracy": 0.887260428410372, "eval_f1": 0.8853880807732613, "eval_loss": 0.418369859457016, "eval_precision": 0.8856923487657594, "eval_recall": 0.887260428410372, "eval_runtime": 39.5926, "eval_samples_per_second": 44.806, "eval_steps_per_second": 0.707, "step": 1937 }, { "epoch": 31.04, "learning_rate": 0.000687741935483871, "loss": 0.2344, "step": 1940 }, { "epoch": 31.2, "learning_rate": 0.0006861290322580645, "loss": 0.2417, "step": 1950 }, { "epoch": 31.36, "learning_rate": 0.0006845161290322581, "loss": 0.252, "step": 1960 }, { "epoch": 31.52, "learning_rate": 0.0006829032258064516, "loss": 0.2465, "step": 1970 }, { "epoch": 31.68, "learning_rate": 0.0006812903225806451, "loss": 0.2405, "step": 1980 }, { "epoch": 31.84, "learning_rate": 0.0006796774193548388, "loss": 0.2275, "step": 1990 }, { "epoch": 32.0, "learning_rate": 0.0006780645161290323, "loss": 0.2509, "step": 2000 }, { "epoch": 32.0, "step": 2000, "train_accuracy": 0.9509932944789121, "train_f1": 0.950617708879211, "train_loss": 0.14158745110034943, "train_precision": 0.9510854186462011, "train_recall": 0.9509932944789121, "train_runtime": 255.2742, "train_samples_per_second": 62.509, "train_steps_per_second": 0.979 }, { "epoch": 32.0, "eval_accuracy": 0.8889515219842165, "eval_f1": 0.8871024769373068, "eval_loss": 0.41492128372192383, "eval_precision": 0.8891530304505318, "eval_recall": 0.8889515219842165, "eval_runtime": 35.6073, "eval_samples_per_second": 49.821, "eval_steps_per_second": 0.786, "step": 2000 }, { "epoch": 32.16, "learning_rate": 0.0006764516129032258, "loss": 0.22, "step": 2010 }, { "epoch": 32.32, "learning_rate": 0.0006748387096774193, "loss": 0.243, "step": 2020 }, { "epoch": 32.48, "learning_rate": 0.0006732258064516129, "loss": 0.2465, "step": 2030 }, { "epoch": 32.64, "learning_rate": 0.0006716129032258065, "loss": 0.2352, "step": 2040 }, { "epoch": 32.8, "learning_rate": 0.00067, "loss": 0.2314, "step": 2050 }, { "epoch": 32.96, "learning_rate": 0.0006683870967741935, "loss": 0.2425, "step": 2060 }, { "epoch": 32.99, "step": 2062, "train_accuracy": 0.9521839944851789, "train_f1": 0.9519406193802002, "train_loss": 0.13532106578350067, "train_precision": 0.9520376150741188, "train_recall": 0.9521839944851789, "train_runtime": 253.863, "train_samples_per_second": 62.857, "train_steps_per_second": 0.985 }, { "epoch": 32.99, "eval_accuracy": 0.8900789177001127, "eval_f1": 0.8892207946311137, "eval_loss": 0.41321179270744324, "eval_precision": 0.889613661345136, "eval_recall": 0.8900789177001127, "eval_runtime": 34.1249, "eval_samples_per_second": 51.985, "eval_steps_per_second": 0.821, "step": 2062 }, { "epoch": 33.12, "learning_rate": 0.0006667741935483871, "loss": 0.2533, "step": 2070 }, { "epoch": 33.28, "learning_rate": 0.0006651612903225807, "loss": 0.2495, "step": 2080 }, { "epoch": 33.44, "learning_rate": 0.0006635483870967743, "loss": 0.2216, "step": 2090 }, { "epoch": 33.6, "learning_rate": 0.0006619354838709678, "loss": 0.2334, "step": 2100 }, { "epoch": 33.76, "learning_rate": 0.0006603225806451613, "loss": 0.209, "step": 2110 }, { "epoch": 33.92, "learning_rate": 0.0006587096774193548, "loss": 0.2319, "step": 2120 }, { "epoch": 34.0, "step": 2125, "train_accuracy": 0.9527480102776211, "train_f1": 0.9523272165039456, "train_loss": 0.13454996049404144, "train_precision": 0.9527286937272258, "train_recall": 0.9527480102776211, "train_runtime": 253.9192, "train_samples_per_second": 62.843, "train_steps_per_second": 0.985 }, { "epoch": 34.0, "eval_accuracy": 0.8906426155580609, "eval_f1": 0.8896475365939425, "eval_loss": 0.3986554443836212, "eval_precision": 0.889369678049395, "eval_recall": 0.8906426155580609, "eval_runtime": 32.2322, "eval_samples_per_second": 55.038, "eval_steps_per_second": 0.869, "step": 2125 }, { "epoch": 34.08, "learning_rate": 0.0006570967741935484, "loss": 0.2142, "step": 2130 }, { "epoch": 34.24, "learning_rate": 0.0006554838709677419, "loss": 0.195, "step": 2140 }, { "epoch": 34.4, "learning_rate": 0.0006538709677419356, "loss": 0.2257, "step": 2150 }, { "epoch": 34.56, "learning_rate": 0.000652258064516129, "loss": 0.2191, "step": 2160 }, { "epoch": 34.72, "learning_rate": 0.0006506451612903226, "loss": 0.2472, "step": 2170 }, { "epoch": 34.88, "learning_rate": 0.0006490322580645162, "loss": 0.256, "step": 2180 }, { "epoch": 34.99, "step": 2187, "train_accuracy": 0.956633452403334, "train_f1": 0.9563227521739598, "train_loss": 0.13102850317955017, "train_precision": 0.9566100366343153, "train_recall": 0.956633452403334, "train_runtime": 255.8713, "train_samples_per_second": 62.363, "train_steps_per_second": 0.977 }, { "epoch": 34.99, "eval_accuracy": 0.8878241262683202, "eval_f1": 0.8863562863477997, "eval_loss": 0.40525099635124207, "eval_precision": 0.8863594064224781, "eval_recall": 0.8878241262683202, "eval_runtime": 29.2139, "eval_samples_per_second": 60.725, "eval_steps_per_second": 0.958, "step": 2187 }, { "epoch": 35.04, "learning_rate": 0.0006474193548387097, "loss": 0.2196, "step": 2190 }, { "epoch": 35.2, "learning_rate": 0.0006458064516129032, "loss": 0.208, "step": 2200 }, { "epoch": 35.36, "learning_rate": 0.0006441935483870967, "loss": 0.2125, "step": 2210 }, { "epoch": 35.52, "learning_rate": 0.0006425806451612903, "loss": 0.234, "step": 2220 }, { "epoch": 35.68, "learning_rate": 0.0006409677419354839, "loss": 0.2161, "step": 2230 }, { "epoch": 35.84, "learning_rate": 0.0006393548387096775, "loss": 0.2384, "step": 2240 }, { "epoch": 36.0, "learning_rate": 0.000637741935483871, "loss": 0.2005, "step": 2250 }, { "epoch": 36.0, "step": 2250, "train_accuracy": 0.9563201102964216, "train_f1": 0.9559487475587907, "train_loss": 0.1280374825000763, "train_precision": 0.95649817681943, "train_recall": 0.9563201102964216, "train_runtime": 249.7425, "train_samples_per_second": 63.894, "train_steps_per_second": 1.001 }, { "epoch": 36.0, "eval_accuracy": 0.8906426155580609, "eval_f1": 0.8889303745678712, "eval_loss": 0.42412662506103516, "eval_precision": 0.8905735232548874, "eval_recall": 0.8906426155580609, "eval_runtime": 29.236, "eval_samples_per_second": 60.679, "eval_steps_per_second": 0.958, "step": 2250 }, { "epoch": 36.16, "learning_rate": 0.0006361290322580645, "loss": 0.2062, "step": 2260 }, { "epoch": 36.32, "learning_rate": 0.0006345161290322581, "loss": 0.2251, "step": 2270 }, { "epoch": 36.48, "learning_rate": 0.0006329032258064516, "loss": 0.2086, "step": 2280 }, { "epoch": 36.64, "learning_rate": 0.0006312903225806452, "loss": 0.2239, "step": 2290 }, { "epoch": 36.8, "learning_rate": 0.0006296774193548387, "loss": 0.2053, "step": 2300 }, { "epoch": 36.96, "learning_rate": 0.0006280645161290322, "loss": 0.2151, "step": 2310 }, { "epoch": 36.99, "step": 2312, "train_accuracy": 0.9576361471454534, "train_f1": 0.9574828276125282, "train_loss": 0.12214481085538864, "train_precision": 0.9575674620543635, "train_recall": 0.9576361471454534, "train_runtime": 250.154, "train_samples_per_second": 63.789, "train_steps_per_second": 0.999 }, { "epoch": 36.99, "eval_accuracy": 0.8928974069898534, "eval_f1": 0.8924893933635943, "eval_loss": 0.44935598969459534, "eval_precision": 0.89342937260661, "eval_recall": 0.8928974069898534, "eval_runtime": 28.948, "eval_samples_per_second": 61.282, "eval_steps_per_second": 0.967, "step": 2312 }, { "epoch": 37.12, "learning_rate": 0.0006264516129032259, "loss": 0.2049, "step": 2320 }, { "epoch": 37.28, "learning_rate": 0.0006248387096774194, "loss": 0.2165, "step": 2330 }, { "epoch": 37.44, "learning_rate": 0.0006232258064516129, "loss": 0.2106, "step": 2340 }, { "epoch": 37.6, "learning_rate": 0.0006216129032258064, "loss": 0.211, "step": 2350 }, { "epoch": 37.76, "learning_rate": 0.00062, "loss": 0.1914, "step": 2360 }, { "epoch": 37.92, "learning_rate": 0.0006183870967741936, "loss": 0.2264, "step": 2370 }, { "epoch": 38.0, "step": 2375, "train_accuracy": 0.9594535313655449, "train_f1": 0.9591420123249457, "train_loss": 0.11748312413692474, "train_precision": 0.9594846416905936, "train_recall": 0.9594535313655449, "train_runtime": 250.2463, "train_samples_per_second": 63.765, "train_steps_per_second": 0.999 }, { "epoch": 38.0, "eval_accuracy": 0.8889515219842165, "eval_f1": 0.8874516370478664, "eval_loss": 0.39475908875465393, "eval_precision": 0.8871997983000491, "eval_recall": 0.8889515219842165, "eval_runtime": 29.3223, "eval_samples_per_second": 60.5, "eval_steps_per_second": 0.955, "step": 2375 }, { "epoch": 38.08, "learning_rate": 0.0006167741935483871, "loss": 0.2018, "step": 2380 }, { "epoch": 38.24, "learning_rate": 0.0006151612903225806, "loss": 0.2047, "step": 2390 }, { "epoch": 38.4, "learning_rate": 0.0006135483870967742, "loss": 0.1931, "step": 2400 }, { "epoch": 38.56, "learning_rate": 0.0006119354838709678, "loss": 0.1973, "step": 2410 }, { "epoch": 38.72, "learning_rate": 0.0006103225806451613, "loss": 0.1901, "step": 2420 }, { "epoch": 38.88, "learning_rate": 0.0006087096774193549, "loss": 0.2128, "step": 2430 }, { "epoch": 38.99, "step": 2437, "train_accuracy": 0.9598295418938397, "train_f1": 0.959583924650842, "train_loss": 0.12042330950498581, "train_precision": 0.9599378088639902, "train_recall": 0.9598295418938397, "train_runtime": 250.3192, "train_samples_per_second": 63.747, "train_steps_per_second": 0.999 }, { "epoch": 38.99, "eval_accuracy": 0.8934611048478016, "eval_f1": 0.8921610181685623, "eval_loss": 0.4096975028514862, "eval_precision": 0.8925841926833548, "eval_recall": 0.8934611048478016, "eval_runtime": 29.0714, "eval_samples_per_second": 61.022, "eval_steps_per_second": 0.963, "step": 2437 }, { "epoch": 39.04, "learning_rate": 0.0006070967741935484, "loss": 0.2022, "step": 2440 }, { "epoch": 39.2, "learning_rate": 0.0006054838709677419, "loss": 0.2015, "step": 2450 }, { "epoch": 39.36, "learning_rate": 0.0006038709677419355, "loss": 0.1906, "step": 2460 }, { "epoch": 39.52, "learning_rate": 0.000602258064516129, "loss": 0.2003, "step": 2470 }, { "epoch": 39.68, "learning_rate": 0.0006006451612903226, "loss": 0.2248, "step": 2480 }, { "epoch": 39.84, "learning_rate": 0.0005990322580645161, "loss": 0.1946, "step": 2490 }, { "epoch": 40.0, "learning_rate": 0.0005974193548387097, "loss": 0.2025, "step": 2500 }, { "epoch": 40.0, "step": 2500, "train_accuracy": 0.9597668734724573, "train_f1": 0.9596223430089906, "train_loss": 0.11334564536809921, "train_precision": 0.9597271475233058, "train_recall": 0.9597668734724573, "train_runtime": 249.5517, "train_samples_per_second": 63.943, "train_steps_per_second": 1.002 }, { "epoch": 40.0, "eval_accuracy": 0.8906426155580609, "eval_f1": 0.8896192336703185, "eval_loss": 0.4116363823413849, "eval_precision": 0.8906240785065708, "eval_recall": 0.8906426155580609, "eval_runtime": 29.0689, "eval_samples_per_second": 61.027, "eval_steps_per_second": 0.963, "step": 2500 }, { "epoch": 40.16, "learning_rate": 0.0005958064516129033, "loss": 0.1783, "step": 2510 }, { "epoch": 40.32, "learning_rate": 0.0005941935483870968, "loss": 0.1915, "step": 2520 }, { "epoch": 40.48, "learning_rate": 0.0005925806451612903, "loss": 0.2113, "step": 2530 }, { "epoch": 40.64, "learning_rate": 0.0005909677419354838, "loss": 0.1906, "step": 2540 }, { "epoch": 40.8, "learning_rate": 0.0005893548387096774, "loss": 0.1835, "step": 2550 }, { "epoch": 40.96, "learning_rate": 0.0005877419354838711, "loss": 0.2171, "step": 2560 }, { "epoch": 40.99, "step": 2562, "train_accuracy": 0.9614589208497838, "train_f1": 0.9612864417727561, "train_loss": 0.11530015617609024, "train_precision": 0.9614218707043837, "train_recall": 0.9614589208497838, "train_runtime": 250.011, "train_samples_per_second": 63.825, "train_steps_per_second": 1.0 }, { "epoch": 40.99, "eval_accuracy": 0.8917700112739572, "eval_f1": 0.890807210174242, "eval_loss": 0.39598962664604187, "eval_precision": 0.8908114942653367, "eval_recall": 0.8917700112739572, "eval_runtime": 29.1379, "eval_samples_per_second": 60.883, "eval_steps_per_second": 0.961, "step": 2562 }, { "epoch": 41.12, "learning_rate": 0.0005861290322580646, "loss": 0.1964, "step": 2570 }, { "epoch": 41.28, "learning_rate": 0.0005845161290322581, "loss": 0.1827, "step": 2580 }, { "epoch": 41.44, "learning_rate": 0.0005829032258064516, "loss": 0.2079, "step": 2590 }, { "epoch": 41.6, "learning_rate": 0.0005812903225806452, "loss": 0.2013, "step": 2600 }, { "epoch": 41.76, "learning_rate": 0.0005796774193548387, "loss": 0.2037, "step": 2610 }, { "epoch": 41.92, "learning_rate": 0.0005780645161290323, "loss": 0.2036, "step": 2620 }, { "epoch": 42.0, "step": 2625, "train_accuracy": 0.9622736103277558, "train_f1": 0.9620354688265563, "train_loss": 0.10922261327505112, "train_precision": 0.9625027768138478, "train_recall": 0.9622736103277558, "train_runtime": 249.7106, "train_samples_per_second": 63.902, "train_steps_per_second": 1.001 }, { "epoch": 42.0, "eval_accuracy": 0.8928974069898534, "eval_f1": 0.891600694267099, "eval_loss": 0.3954656422138214, "eval_precision": 0.8932440084981708, "eval_recall": 0.8928974069898534, "eval_runtime": 29.1604, "eval_samples_per_second": 60.836, "eval_steps_per_second": 0.96, "step": 2625 }, { "epoch": 42.08, "learning_rate": 0.0005764516129032257, "loss": 0.1971, "step": 2630 }, { "epoch": 42.24, "learning_rate": 0.0005748387096774194, "loss": 0.1976, "step": 2640 }, { "epoch": 42.4, "learning_rate": 0.000573225806451613, "loss": 0.2098, "step": 2650 }, { "epoch": 42.56, "learning_rate": 0.0005716129032258065, "loss": 0.1833, "step": 2660 }, { "epoch": 42.72, "learning_rate": 0.00057, "loss": 0.1936, "step": 2670 }, { "epoch": 42.88, "learning_rate": 0.0005683870967741935, "loss": 0.1849, "step": 2680 }, { "epoch": 42.99, "step": 2687, "train_accuracy": 0.9676004261452654, "train_f1": 0.9675534222659815, "train_loss": 0.10426949709653854, "train_precision": 0.9676367935294685, "train_recall": 0.9676004261452654, "train_runtime": 251.7545, "train_samples_per_second": 63.383, "train_steps_per_second": 0.993 }, { "epoch": 42.99, "eval_accuracy": 0.8996617812852311, "eval_f1": 0.8986036298251875, "eval_loss": 0.3904741108417511, "eval_precision": 0.8992691335353804, "eval_recall": 0.8996617812852311, "eval_runtime": 29.0995, "eval_samples_per_second": 60.963, "eval_steps_per_second": 0.962, "step": 2687 }, { "epoch": 43.04, "learning_rate": 0.0005667741935483871, "loss": 0.2041, "step": 2690 }, { "epoch": 43.2, "learning_rate": 0.0005651612903225807, "loss": 0.174, "step": 2700 }, { "epoch": 43.36, "learning_rate": 0.0005635483870967742, "loss": 0.1792, "step": 2710 }, { "epoch": 43.52, "learning_rate": 0.0005619354838709677, "loss": 0.1688, "step": 2720 }, { "epoch": 43.68, "learning_rate": 0.0005603225806451613, "loss": 0.1741, "step": 2730 }, { "epoch": 43.84, "learning_rate": 0.0005587096774193549, "loss": 0.2102, "step": 2740 }, { "epoch": 44.0, "learning_rate": 0.0005570967741935484, "loss": 0.1852, "step": 2750 }, { "epoch": 44.0, "step": 2750, "train_accuracy": 0.964843015604437, "train_f1": 0.9647050151290405, "train_loss": 0.10291223973035812, "train_precision": 0.9649053412080801, "train_recall": 0.964843015604437, "train_runtime": 250.3464, "train_samples_per_second": 63.74, "train_steps_per_second": 0.999 }, { "epoch": 44.0, "eval_accuracy": 0.891206313416009, "eval_f1": 0.8900612906872463, "eval_loss": 0.42409268021583557, "eval_precision": 0.891982003380522, "eval_recall": 0.891206313416009, "eval_runtime": 29.1706, "eval_samples_per_second": 60.815, "eval_steps_per_second": 0.96, "step": 2750 }, { "epoch": 44.16, "learning_rate": 0.000555483870967742, "loss": 0.1816, "step": 2760 }, { "epoch": 44.32, "learning_rate": 0.0005538709677419355, "loss": 0.1765, "step": 2770 }, { "epoch": 44.48, "learning_rate": 0.000552258064516129, "loss": 0.1748, "step": 2780 }, { "epoch": 44.64, "learning_rate": 0.0005506451612903226, "loss": 0.2168, "step": 2790 }, { "epoch": 44.8, "learning_rate": 0.0005490322580645161, "loss": 0.215, "step": 2800 }, { "epoch": 44.96, "learning_rate": 0.0005474193548387097, "loss": 0.1721, "step": 2810 }, { "epoch": 44.99, "step": 2812, "train_accuracy": 0.9665350629817635, "train_f1": 0.9664032195703065, "train_loss": 0.09303626418113708, "train_precision": 0.9665823467276443, "train_recall": 0.9665350629817635, "train_runtime": 250.871, "train_samples_per_second": 63.606, "train_steps_per_second": 0.997 }, { "epoch": 44.99, "eval_accuracy": 0.8962795941375423, "eval_f1": 0.8948599549258702, "eval_loss": 0.4103808104991913, "eval_precision": 0.8955637765539853, "eval_recall": 0.8962795941375423, "eval_runtime": 29.0827, "eval_samples_per_second": 60.998, "eval_steps_per_second": 0.963, "step": 2812 }, { "epoch": 45.12, "learning_rate": 0.0005458064516129032, "loss": 0.1553, "step": 2820 }, { "epoch": 45.28, "learning_rate": 0.0005441935483870968, "loss": 0.1801, "step": 2830 }, { "epoch": 45.44, "learning_rate": 0.0005425806451612904, "loss": 0.1815, "step": 2840 }, { "epoch": 45.6, "learning_rate": 0.0005409677419354839, "loss": 0.2039, "step": 2850 }, { "epoch": 45.76, "learning_rate": 0.0005393548387096774, "loss": 0.1867, "step": 2860 }, { "epoch": 45.92, "learning_rate": 0.0005377419354838709, "loss": 0.186, "step": 2870 }, { "epoch": 46.0, "step": 2875, "train_accuracy": 0.9643416682333772, "train_f1": 0.9642012339068207, "train_loss": 0.09887776523828506, "train_precision": 0.9644991194334305, "train_recall": 0.9643416682333772, "train_runtime": 254.5578, "train_samples_per_second": 62.685, "train_steps_per_second": 0.982 }, { "epoch": 46.0, "eval_accuracy": 0.8917700112739572, "eval_f1": 0.8901319153136237, "eval_loss": 0.4248127341270447, "eval_precision": 0.8912530636364911, "eval_recall": 0.8917700112739572, "eval_runtime": 29.5608, "eval_samples_per_second": 60.012, "eval_steps_per_second": 0.947, "step": 2875 }, { "epoch": 46.08, "learning_rate": 0.0005361290322580645, "loss": 0.1569, "step": 2880 }, { "epoch": 46.24, "learning_rate": 0.0005345161290322581, "loss": 0.1876, "step": 2890 }, { "epoch": 46.4, "learning_rate": 0.0005329032258064517, "loss": 0.1667, "step": 2900 }, { "epoch": 46.56, "learning_rate": 0.0005312903225806452, "loss": 0.169, "step": 2910 }, { "epoch": 46.72, "learning_rate": 0.0005296774193548387, "loss": 0.1803, "step": 2920 }, { "epoch": 46.88, "learning_rate": 0.0005280645161290323, "loss": 0.1811, "step": 2930 }, { "epoch": 46.99, "step": 2937, "train_accuracy": 0.9637149840195526, "train_f1": 0.9634798755891425, "train_loss": 0.10527843236923218, "train_precision": 0.9638723537275108, "train_recall": 0.9637149840195526, "train_runtime": 254.7727, "train_samples_per_second": 62.632, "train_steps_per_second": 0.981 }, { "epoch": 46.99, "eval_accuracy": 0.9013528748590756, "eval_f1": 0.8999103289546431, "eval_loss": 0.42358672618865967, "eval_precision": 0.9005857132412932, "eval_recall": 0.9013528748590756, "eval_runtime": 29.8042, "eval_samples_per_second": 59.522, "eval_steps_per_second": 0.939, "step": 2937 }, { "epoch": 47.04, "learning_rate": 0.0005264516129032258, "loss": 0.1698, "step": 2940 }, { "epoch": 47.2, "learning_rate": 0.0005248387096774193, "loss": 0.1744, "step": 2950 }, { "epoch": 47.36, "learning_rate": 0.0005232258064516128, "loss": 0.1718, "step": 2960 }, { "epoch": 47.52, "learning_rate": 0.0005216129032258065, "loss": 0.1777, "step": 2970 }, { "epoch": 47.68, "learning_rate": 0.0005200000000000001, "loss": 0.1872, "step": 2980 }, { "epoch": 47.84, "learning_rate": 0.0005183870967741936, "loss": 0.1586, "step": 2990 }, { "epoch": 48.0, "learning_rate": 0.0005167741935483871, "loss": 0.1891, "step": 3000 }, { "epoch": 48.0, "step": 3000, "train_accuracy": 0.9668484050886759, "train_f1": 0.966687633803237, "train_loss": 0.09668122977018356, "train_precision": 0.9668284956038484, "train_recall": 0.9668484050886759, "train_runtime": 255.4386, "train_samples_per_second": 62.469, "train_steps_per_second": 0.979 }, { "epoch": 48.0, "eval_accuracy": 0.90304396843292, "eval_f1": 0.9023176970973613, "eval_loss": 0.40747305750846863, "eval_precision": 0.902276892363872, "eval_recall": 0.90304396843292, "eval_runtime": 29.6296, "eval_samples_per_second": 59.873, "eval_steps_per_second": 0.945, "step": 3000 }, { "epoch": 48.16, "learning_rate": 0.0005151612903225806, "loss": 0.1566, "step": 3010 }, { "epoch": 48.32, "learning_rate": 0.0005135483870967742, "loss": 0.1511, "step": 3020 }, { "epoch": 48.48, "learning_rate": 0.0005119354838709677, "loss": 0.1914, "step": 3030 }, { "epoch": 48.64, "learning_rate": 0.0005103225806451613, "loss": 0.1828, "step": 3040 }, { "epoch": 48.8, "learning_rate": 0.0005087096774193549, "loss": 0.1749, "step": 3050 }, { "epoch": 48.96, "learning_rate": 0.0005070967741935484, "loss": 0.1791, "step": 3060 }, { "epoch": 48.99, "step": 3062, "train_accuracy": 0.9676630945666479, "train_f1": 0.9675103889274802, "train_loss": 0.09363168478012085, "train_precision": 0.9676662039614543, "train_recall": 0.9676630945666479, "train_runtime": 255.9566, "train_samples_per_second": 62.343, "train_steps_per_second": 0.977 }, { "epoch": 48.99, "eval_accuracy": 0.8996617812852311, "eval_f1": 0.8987006309929039, "eval_loss": 0.4219958186149597, "eval_precision": 0.8986787206496698, "eval_recall": 0.8996617812852311, "eval_runtime": 29.8773, "eval_samples_per_second": 59.376, "eval_steps_per_second": 0.937, "step": 3062 }, { "epoch": 49.12, "learning_rate": 0.000505483870967742, "loss": 0.1666, "step": 3070 }, { "epoch": 49.28, "learning_rate": 0.0005038709677419355, "loss": 0.1626, "step": 3080 }, { "epoch": 49.44, "learning_rate": 0.000502258064516129, "loss": 0.1771, "step": 3090 }, { "epoch": 49.6, "learning_rate": 0.0005006451612903225, "loss": 0.179, "step": 3100 }, { "epoch": 49.76, "learning_rate": 0.0004990322580645161, "loss": 0.1634, "step": 3110 }, { "epoch": 49.92, "learning_rate": 0.0004974193548387097, "loss": 0.1702, "step": 3120 }, { "epoch": 50.0, "step": 3125, "train_accuracy": 0.9695431472081218, "train_f1": 0.9694274832881341, "train_loss": 0.09215661138296127, "train_precision": 0.9695025177310069, "train_recall": 0.9695431472081218, "train_runtime": 257.2202, "train_samples_per_second": 62.036, "train_steps_per_second": 0.972 }, { "epoch": 50.0, "eval_accuracy": 0.8928974069898534, "eval_f1": 0.8922038394852897, "eval_loss": 0.4357841908931732, "eval_precision": 0.8922256622710033, "eval_recall": 0.8928974069898534, "eval_runtime": 30.2592, "eval_samples_per_second": 58.627, "eval_steps_per_second": 0.925, "step": 3125 }, { "epoch": 50.08, "learning_rate": 0.0004958064516129032, "loss": 0.1738, "step": 3130 }, { "epoch": 50.24, "learning_rate": 0.0004941935483870968, "loss": 0.1781, "step": 3140 }, { "epoch": 50.4, "learning_rate": 0.0004925806451612903, "loss": 0.1814, "step": 3150 }, { "epoch": 50.56, "learning_rate": 0.0004909677419354839, "loss": 0.1766, "step": 3160 }, { "epoch": 50.72, "learning_rate": 0.0004893548387096775, "loss": 0.1689, "step": 3170 }, { "epoch": 50.88, "learning_rate": 0.00048774193548387095, "loss": 0.1667, "step": 3180 }, { "epoch": 50.99, "step": 3187, "train_accuracy": 0.9679137682521777, "train_f1": 0.9678451858925848, "train_loss": 0.08850996196269989, "train_precision": 0.9680124054185439, "train_recall": 0.9679137682521777, "train_runtime": 259.9309, "train_samples_per_second": 61.389, "train_steps_per_second": 0.962 }, { "epoch": 50.99, "eval_accuracy": 0.8957158962795941, "eval_f1": 0.8947220269155864, "eval_loss": 0.4486236274242401, "eval_precision": 0.8959867186310805, "eval_recall": 0.8957158962795941, "eval_runtime": 30.0872, "eval_samples_per_second": 58.962, "eval_steps_per_second": 0.931, "step": 3187 }, { "epoch": 51.04, "learning_rate": 0.00048612903225806457, "loss": 0.1506, "step": 3190 }, { "epoch": 51.2, "learning_rate": 0.00048451612903225807, "loss": 0.1555, "step": 3200 }, { "epoch": 51.36, "learning_rate": 0.00048290322580645163, "loss": 0.164, "step": 3210 }, { "epoch": 51.52, "learning_rate": 0.00048129032258064513, "loss": 0.1574, "step": 3220 }, { "epoch": 51.68, "learning_rate": 0.0004796774193548387, "loss": 0.1554, "step": 3230 }, { "epoch": 51.84, "learning_rate": 0.0004780645161290323, "loss": 0.1653, "step": 3240 }, { "epoch": 52.0, "learning_rate": 0.0004764516129032258, "loss": 0.1733, "step": 3250 }, { "epoch": 52.0, "step": 3250, "train_accuracy": 0.9680391050949426, "train_f1": 0.9679543842076324, "train_loss": 0.09445594996213913, "train_precision": 0.9681396256853804, "train_recall": 0.9680391050949426, "train_runtime": 256.4705, "train_samples_per_second": 62.218, "train_steps_per_second": 0.975 }, { "epoch": 52.0, "eval_accuracy": 0.8990980834272829, "eval_f1": 0.8984372111101244, "eval_loss": 0.43172532320022583, "eval_precision": 0.8994814917612028, "eval_recall": 0.8990980834272829, "eval_runtime": 29.5992, "eval_samples_per_second": 59.934, "eval_steps_per_second": 0.946, "step": 3250 }, { "epoch": 52.16, "learning_rate": 0.00047483870967741937, "loss": 0.1639, "step": 3260 }, { "epoch": 52.32, "learning_rate": 0.00047322580645161287, "loss": 0.1541, "step": 3270 }, { "epoch": 52.48, "learning_rate": 0.0004716129032258065, "loss": 0.1554, "step": 3280 }, { "epoch": 52.64, "learning_rate": 0.00047, "loss": 0.175, "step": 3290 }, { "epoch": 52.8, "learning_rate": 0.00046838709677419354, "loss": 0.1697, "step": 3300 }, { "epoch": 52.96, "learning_rate": 0.0004667741935483871, "loss": 0.1704, "step": 3310 }, { "epoch": 52.99, "step": 3312, "train_accuracy": 0.9716112051137432, "train_f1": 0.9715237218187844, "train_loss": 0.08361362665891647, "train_precision": 0.9715640137675557, "train_recall": 0.9716112051137432, "train_runtime": 251.4627, "train_samples_per_second": 63.457, "train_steps_per_second": 0.994 }, { "epoch": 52.99, "eval_accuracy": 0.9052987598647125, "eval_f1": 0.9044568554057598, "eval_loss": 0.41901707649230957, "eval_precision": 0.9045753701091548, "eval_recall": 0.9052987598647125, "eval_runtime": 29.1923, "eval_samples_per_second": 60.769, "eval_steps_per_second": 0.959, "step": 3312 }, { "epoch": 53.12, "learning_rate": 0.00046516129032258066, "loss": 0.1537, "step": 3320 }, { "epoch": 53.28, "learning_rate": 0.0004635483870967742, "loss": 0.158, "step": 3330 }, { "epoch": 53.44, "learning_rate": 0.0004619354838709677, "loss": 0.1493, "step": 3340 }, { "epoch": 53.6, "learning_rate": 0.0004603225806451613, "loss": 0.1429, "step": 3350 }, { "epoch": 53.76, "learning_rate": 0.00045870967741935484, "loss": 0.1628, "step": 3360 }, { "epoch": 53.92, "learning_rate": 0.0004570967741935484, "loss": 0.1584, "step": 3370 }, { "epoch": 54.0, "step": 3375, "train_accuracy": 0.9703578366860939, "train_f1": 0.970311857800694, "train_loss": 0.08544992655515671, "train_precision": 0.9704579277168014, "train_recall": 0.9703578366860939, "train_runtime": 251.0811, "train_samples_per_second": 63.553, "train_steps_per_second": 0.996 }, { "epoch": 54.0, "eval_accuracy": 0.9052987598647125, "eval_f1": 0.904599065142192, "eval_loss": 0.4305163323879242, "eval_precision": 0.9055272931459877, "eval_recall": 0.9052987598647125, "eval_runtime": 29.1269, "eval_samples_per_second": 60.906, "eval_steps_per_second": 0.961, "step": 3375 }, { "epoch": 54.08, "learning_rate": 0.00045548387096774196, "loss": 0.1577, "step": 3380 }, { "epoch": 54.24, "learning_rate": 0.00045387096774193546, "loss": 0.168, "step": 3390 }, { "epoch": 54.4, "learning_rate": 0.00045225806451612907, "loss": 0.1541, "step": 3400 }, { "epoch": 54.56, "learning_rate": 0.0004506451612903226, "loss": 0.1443, "step": 3410 }, { "epoch": 54.72, "learning_rate": 0.00044903225806451613, "loss": 0.1363, "step": 3420 }, { "epoch": 54.88, "learning_rate": 0.0004474193548387097, "loss": 0.1763, "step": 3430 }, { "epoch": 54.99, "step": 3437, "train_accuracy": 0.9722378893275678, "train_f1": 0.9722304845282628, "train_loss": 0.08548293262720108, "train_precision": 0.9724014188580902, "train_recall": 0.9722378893275678, "train_runtime": 250.8193, "train_samples_per_second": 63.62, "train_steps_per_second": 0.997 }, { "epoch": 54.99, "eval_accuracy": 0.8940248027057497, "eval_f1": 0.8945776482571843, "eval_loss": 0.4349919259548187, "eval_precision": 0.896683319174708, "eval_recall": 0.8940248027057497, "eval_runtime": 29.0389, "eval_samples_per_second": 61.09, "eval_steps_per_second": 0.964, "step": 3437 }, { "epoch": 55.04, "learning_rate": 0.00044580645161290325, "loss": 0.163, "step": 3440 }, { "epoch": 55.2, "learning_rate": 0.0004441935483870968, "loss": 0.1468, "step": 3450 }, { "epoch": 55.36, "learning_rate": 0.0004425806451612903, "loss": 0.1356, "step": 3460 }, { "epoch": 55.52, "learning_rate": 0.00044096774193548387, "loss": 0.1485, "step": 3470 }, { "epoch": 55.68, "learning_rate": 0.00043935483870967743, "loss": 0.1444, "step": 3480 }, { "epoch": 55.84, "learning_rate": 0.000437741935483871, "loss": 0.1463, "step": 3490 }, { "epoch": 56.0, "learning_rate": 0.00043612903225806454, "loss": 0.1609, "step": 3500 }, { "epoch": 56.0, "step": 3500, "train_accuracy": 0.9711725261640659, "train_f1": 0.9710418724528065, "train_loss": 0.08499421924352646, "train_precision": 0.9711871907063745, "train_recall": 0.9711725261640659, "train_runtime": 251.6401, "train_samples_per_second": 63.412, "train_steps_per_second": 0.993 }, { "epoch": 56.0, "eval_accuracy": 0.90304396843292, "eval_f1": 0.901618221901619, "eval_loss": 0.4472709894180298, "eval_precision": 0.9023465256016576, "eval_recall": 0.90304396843292, "eval_runtime": 29.9118, "eval_samples_per_second": 59.308, "eval_steps_per_second": 0.936, "step": 3500 }, { "epoch": 56.16, "learning_rate": 0.00043451612903225805, "loss": 0.1393, "step": 3510 }, { "epoch": 56.32, "learning_rate": 0.00043290322580645166, "loss": 0.1481, "step": 3520 }, { "epoch": 56.48, "learning_rate": 0.00043129032258064516, "loss": 0.1449, "step": 3530 }, { "epoch": 56.64, "learning_rate": 0.0004296774193548387, "loss": 0.168, "step": 3540 }, { "epoch": 56.8, "learning_rate": 0.0004280645161290322, "loss": 0.1722, "step": 3550 }, { "epoch": 56.96, "learning_rate": 0.00042645161290322584, "loss": 0.1549, "step": 3560 }, { "epoch": 56.99, "step": 3562, "train_accuracy": 0.9697311524722693, "train_f1": 0.96954160239289, "train_loss": 0.0850997045636177, "train_precision": 0.9698850921890346, "train_recall": 0.9697311524722693, "train_runtime": 250.5824, "train_samples_per_second": 63.68, "train_steps_per_second": 0.998 }, { "epoch": 56.99, "eval_accuracy": 0.9041713641488163, "eval_f1": 0.9027359585690536, "eval_loss": 0.4477776885032654, "eval_precision": 0.9037863994127037, "eval_recall": 0.9041713641488163, "eval_runtime": 29.1274, "eval_samples_per_second": 60.905, "eval_steps_per_second": 0.961, "step": 3562 }, { "epoch": 57.12, "learning_rate": 0.0004248387096774194, "loss": 0.1415, "step": 3570 }, { "epoch": 57.28, "learning_rate": 0.0004232258064516129, "loss": 0.1557, "step": 3580 }, { "epoch": 57.44, "learning_rate": 0.00042161290322580646, "loss": 0.143, "step": 3590 }, { "epoch": 57.6, "learning_rate": 0.00042, "loss": 0.154, "step": 3600 }, { "epoch": 57.76, "learning_rate": 0.0004183870967741936, "loss": 0.1325, "step": 3610 }, { "epoch": 57.92, "learning_rate": 0.0004167741935483871, "loss": 0.1586, "step": 3620 }, { "epoch": 58.0, "step": 3625, "train_accuracy": 0.9711098577426834, "train_f1": 0.9710190406318763, "train_loss": 0.08111045509576797, "train_precision": 0.971108783894692, "train_recall": 0.9711098577426834, "train_runtime": 252.5322, "train_samples_per_second": 63.188, "train_steps_per_second": 0.99 }, { "epoch": 58.0, "eval_accuracy": 0.9024802705749718, "eval_f1": 0.9011546163080018, "eval_loss": 0.4446905255317688, "eval_precision": 0.9024443209930092, "eval_recall": 0.9024802705749718, "eval_runtime": 29.4234, "eval_samples_per_second": 60.292, "eval_steps_per_second": 0.952, "step": 3625 }, { "epoch": 58.08, "learning_rate": 0.00041516129032258064, "loss": 0.1589, "step": 3630 }, { "epoch": 58.24, "learning_rate": 0.00041354838709677425, "loss": 0.1368, "step": 3640 }, { "epoch": 58.4, "learning_rate": 0.00041193548387096775, "loss": 0.135, "step": 3650 }, { "epoch": 58.56, "learning_rate": 0.0004103225806451613, "loss": 0.1393, "step": 3660 }, { "epoch": 58.72, "learning_rate": 0.0004087096774193548, "loss": 0.1414, "step": 3670 }, { "epoch": 58.88, "learning_rate": 0.00040709677419354843, "loss": 0.1476, "step": 3680 }, { "epoch": 58.99, "step": 3687, "train_accuracy": 0.9716738735351257, "train_f1": 0.9716109081205196, "train_loss": 0.08109210431575775, "train_precision": 0.971619589233349, "train_recall": 0.9716738735351257, "train_runtime": 251.3717, "train_samples_per_second": 63.48, "train_steps_per_second": 0.995 }, { "epoch": 58.99, "eval_accuracy": 0.9007891770011274, "eval_f1": 0.8998310286529279, "eval_loss": 0.46749255061149597, "eval_precision": 0.9005611855026796, "eval_recall": 0.9007891770011274, "eval_runtime": 29.4648, "eval_samples_per_second": 60.207, "eval_steps_per_second": 0.95, "step": 3687 }, { "epoch": 59.04, "learning_rate": 0.00040548387096774193, "loss": 0.1469, "step": 3690 }, { "epoch": 59.2, "learning_rate": 0.0004038709677419355, "loss": 0.1285, "step": 3700 }, { "epoch": 59.36, "learning_rate": 0.00040225806451612905, "loss": 0.1543, "step": 3710 }, { "epoch": 59.52, "learning_rate": 0.00040064516129032255, "loss": 0.1576, "step": 3720 }, { "epoch": 59.68, "learning_rate": 0.00039903225806451616, "loss": 0.1639, "step": 3730 }, { "epoch": 59.84, "learning_rate": 0.00039741935483870967, "loss": 0.1602, "step": 3740 }, { "epoch": 60.0, "learning_rate": 0.0003958064516129032, "loss": 0.1308, "step": 3750 }, { "epoch": 60.0, "step": 3750, "train_accuracy": 0.9714231998495958, "train_f1": 0.9713301650863866, "train_loss": 0.08129285275936127, "train_precision": 0.9713703959271734, "train_recall": 0.9714231998495958, "train_runtime": 251.5017, "train_samples_per_second": 63.447, "train_steps_per_second": 0.994 }, { "epoch": 60.0, "eval_accuracy": 0.9047350620067643, "eval_f1": 0.9038436882672473, "eval_loss": 0.4706019163131714, "eval_precision": 0.9044402371933982, "eval_recall": 0.9047350620067643, "eval_runtime": 30.419, "eval_samples_per_second": 58.319, "eval_steps_per_second": 0.92, "step": 3750 }, { "epoch": 60.16, "learning_rate": 0.00039419354838709673, "loss": 0.1425, "step": 3760 }, { "epoch": 60.32, "learning_rate": 0.00039258064516129034, "loss": 0.1372, "step": 3770 }, { "epoch": 60.48, "learning_rate": 0.0003909677419354839, "loss": 0.1429, "step": 3780 }, { "epoch": 60.64, "learning_rate": 0.0003893548387096774, "loss": 0.1366, "step": 3790 }, { "epoch": 60.8, "learning_rate": 0.00038774193548387096, "loss": 0.1503, "step": 3800 }, { "epoch": 60.96, "learning_rate": 0.0003861290322580645, "loss": 0.1558, "step": 3810 }, { "epoch": 60.99, "step": 3812, "train_accuracy": 0.9736165945979821, "train_f1": 0.9735015663251901, "train_loss": 0.07483678311109543, "train_precision": 0.9736053164344912, "train_recall": 0.9736165945979821, "train_runtime": 250.9181, "train_samples_per_second": 63.594, "train_steps_per_second": 0.996 }, { "epoch": 60.99, "eval_accuracy": 0.9024802705749718, "eval_f1": 0.9010669627888577, "eval_loss": 0.45878297090530396, "eval_precision": 0.9016661622070999, "eval_recall": 0.9024802705749718, "eval_runtime": 30.1022, "eval_samples_per_second": 58.933, "eval_steps_per_second": 0.93, "step": 3812 }, { "epoch": 61.12, "learning_rate": 0.0003845161290322581, "loss": 0.1222, "step": 3820 }, { "epoch": 61.28, "learning_rate": 0.0003829032258064516, "loss": 0.1555, "step": 3830 }, { "epoch": 61.44, "learning_rate": 0.00038129032258064514, "loss": 0.1306, "step": 3840 }, { "epoch": 61.6, "learning_rate": 0.00037967741935483875, "loss": 0.1618, "step": 3850 }, { "epoch": 61.76, "learning_rate": 0.00037806451612903226, "loss": 0.1436, "step": 3860 }, { "epoch": 61.92, "learning_rate": 0.0003764516129032258, "loss": 0.1418, "step": 3870 }, { "epoch": 62.0, "step": 3875, "train_accuracy": 0.9729899103841574, "train_f1": 0.9729148616100128, "train_loss": 0.07707332819700241, "train_precision": 0.9730221901785945, "train_recall": 0.9729899103841574, "train_runtime": 254.0917, "train_samples_per_second": 62.8, "train_steps_per_second": 0.984 }, { "epoch": 62.0, "eval_accuracy": 0.9013528748590756, "eval_f1": 0.9008617353869077, "eval_loss": 0.4513218104839325, "eval_precision": 0.9012600116180024, "eval_recall": 0.9013528748590756, "eval_runtime": 29.9385, "eval_samples_per_second": 59.255, "eval_steps_per_second": 0.935, "step": 3875 }, { "epoch": 62.08, "learning_rate": 0.0003748387096774193, "loss": 0.173, "step": 3880 }, { "epoch": 62.24, "learning_rate": 0.00037322580645161293, "loss": 0.1304, "step": 3890 }, { "epoch": 62.4, "learning_rate": 0.0003716129032258065, "loss": 0.1579, "step": 3900 }, { "epoch": 62.56, "learning_rate": 0.00037, "loss": 0.1388, "step": 3910 }, { "epoch": 62.72, "learning_rate": 0.00036838709677419355, "loss": 0.152, "step": 3920 }, { "epoch": 62.88, "learning_rate": 0.0003667741935483871, "loss": 0.1283, "step": 3930 }, { "epoch": 62.99, "step": 3937, "train_accuracy": 0.9760606630318982, "train_f1": 0.9759960239064865, "train_loss": 0.07244587689638138, "train_precision": 0.9760629730336429, "train_recall": 0.9760606630318982, "train_runtime": 252.7156, "train_samples_per_second": 63.142, "train_steps_per_second": 0.989 }, { "epoch": 62.99, "eval_accuracy": 0.8990980834272829, "eval_f1": 0.8976577160373229, "eval_loss": 0.46622931957244873, "eval_precision": 0.8981920636717567, "eval_recall": 0.8990980834272829, "eval_runtime": 30.0055, "eval_samples_per_second": 59.122, "eval_steps_per_second": 0.933, "step": 3937 }, { "epoch": 63.04, "learning_rate": 0.00036516129032258067, "loss": 0.1423, "step": 3940 }, { "epoch": 63.2, "learning_rate": 0.0003635483870967742, "loss": 0.1345, "step": 3950 }, { "epoch": 63.36, "learning_rate": 0.00036193548387096773, "loss": 0.1225, "step": 3960 }, { "epoch": 63.52, "learning_rate": 0.00036032258064516134, "loss": 0.1399, "step": 3970 }, { "epoch": 63.68, "learning_rate": 0.00035870967741935485, "loss": 0.1409, "step": 3980 }, { "epoch": 63.84, "learning_rate": 0.0003570967741935484, "loss": 0.1431, "step": 3990 }, { "epoch": 64.0, "learning_rate": 0.0003554838709677419, "loss": 0.1375, "step": 4000 }, { "epoch": 64.0, "step": 4000, "train_accuracy": 0.9777527104092248, "train_f1": 0.9776952189068061, "train_loss": 0.07026933133602142, "train_precision": 0.9777982624530956, "train_recall": 0.9777527104092248, "train_runtime": 254.2798, "train_samples_per_second": 62.754, "train_steps_per_second": 0.983 }, { "epoch": 64.0, "eval_accuracy": 0.90304396843292, "eval_f1": 0.9018013838304384, "eval_loss": 0.43738722801208496, "eval_precision": 0.9018869567596777, "eval_recall": 0.90304396843292, "eval_runtime": 30.384, "eval_samples_per_second": 58.386, "eval_steps_per_second": 0.922, "step": 4000 }, { "epoch": 64.16, "learning_rate": 0.0003538709677419355, "loss": 0.121, "step": 4010 }, { "epoch": 64.32, "learning_rate": 0.000352258064516129, "loss": 0.1532, "step": 4020 }, { "epoch": 64.48, "learning_rate": 0.0003506451612903226, "loss": 0.1307, "step": 4030 }, { "epoch": 64.64, "learning_rate": 0.00034903225806451614, "loss": 0.1403, "step": 4040 }, { "epoch": 64.8, "learning_rate": 0.0003474193548387097, "loss": 0.1467, "step": 4050 }, { "epoch": 64.96, "learning_rate": 0.00034580645161290326, "loss": 0.1255, "step": 4060 }, { "epoch": 64.99, "step": 4062, "train_accuracy": 0.9758099893463683, "train_f1": 0.9757450720707583, "train_loss": 0.0738762691617012, "train_precision": 0.9758253961539621, "train_recall": 0.9758099893463683, "train_runtime": 270.7799, "train_samples_per_second": 58.93, "train_steps_per_second": 0.923 }, { "epoch": 64.99, "eval_accuracy": 0.9041713641488163, "eval_f1": 0.9027682806702938, "eval_loss": 0.43671032786369324, "eval_precision": 0.9029520225388282, "eval_recall": 0.9041713641488163, "eval_runtime": 46.2, "eval_samples_per_second": 38.398, "eval_steps_per_second": 0.606, "step": 4062 }, { "epoch": 65.12, "learning_rate": 0.00034419354838709676, "loss": 0.1398, "step": 4070 }, { "epoch": 65.28, "learning_rate": 0.0003425806451612903, "loss": 0.1294, "step": 4080 }, { "epoch": 65.44, "learning_rate": 0.0003409677419354839, "loss": 0.1192, "step": 4090 }, { "epoch": 65.6, "learning_rate": 0.00033935483870967744, "loss": 0.1274, "step": 4100 }, { "epoch": 65.76, "learning_rate": 0.000337741935483871, "loss": 0.1332, "step": 4110 }, { "epoch": 65.92, "learning_rate": 0.0003361290322580645, "loss": 0.1356, "step": 4120 }, { "epoch": 66.0, "step": 4125, "train_accuracy": 0.9761233314532807, "train_f1": 0.9759950169974181, "train_loss": 0.07223277539014816, "train_precision": 0.9761999631640097, "train_recall": 0.9761233314532807, "train_runtime": 254.9857, "train_samples_per_second": 62.58, "train_steps_per_second": 0.98 }, { "epoch": 66.0, "eval_accuracy": 0.9002254791431793, "eval_f1": 0.8985023992882097, "eval_loss": 0.47199180722236633, "eval_precision": 0.8998740225780659, "eval_recall": 0.9002254791431793, "eval_runtime": 46.4259, "eval_samples_per_second": 38.211, "eval_steps_per_second": 0.603, "step": 4125 }, { "epoch": 66.08, "learning_rate": 0.0003345161290322581, "loss": 0.1288, "step": 4130 }, { "epoch": 66.24, "learning_rate": 0.0003329032258064516, "loss": 0.1373, "step": 4140 }, { "epoch": 66.4, "learning_rate": 0.0003312903225806452, "loss": 0.1424, "step": 4150 }, { "epoch": 66.56, "learning_rate": 0.0003296774193548387, "loss": 0.1369, "step": 4160 }, { "epoch": 66.72, "learning_rate": 0.0003280645161290323, "loss": 0.1366, "step": 4170 }, { "epoch": 66.88, "learning_rate": 0.00032645161290322585, "loss": 0.1363, "step": 4180 }, { "epoch": 66.99, "step": 4187, "train_accuracy": 0.9745566209187191, "train_f1": 0.9744197447101088, "train_loss": 0.07206864655017853, "train_precision": 0.9746863463745119, "train_recall": 0.9745566209187191, "train_runtime": 255.3323, "train_samples_per_second": 62.495, "train_steps_per_second": 0.979 }, { "epoch": 66.99, "eval_accuracy": 0.8974069898534386, "eval_f1": 0.8958287812129277, "eval_loss": 0.4912644624710083, "eval_precision": 0.897064496045103, "eval_recall": 0.8974069898534386, "eval_runtime": 42.5384, "eval_samples_per_second": 41.703, "eval_steps_per_second": 0.658, "step": 4187 }, { "epoch": 67.04, "learning_rate": 0.00032483870967741935, "loss": 0.1427, "step": 4190 }, { "epoch": 67.2, "learning_rate": 0.0003232258064516129, "loss": 0.1423, "step": 4200 }, { "epoch": 67.36, "learning_rate": 0.00032161290322580647, "loss": 0.1346, "step": 4210 }, { "epoch": 67.52, "learning_rate": 0.00032, "loss": 0.1349, "step": 4220 }, { "epoch": 67.68, "learning_rate": 0.00031838709677419353, "loss": 0.1222, "step": 4230 }, { "epoch": 67.84, "learning_rate": 0.0003167741935483871, "loss": 0.1332, "step": 4240 }, { "epoch": 68.0, "learning_rate": 0.0003151612903225807, "loss": 0.1307, "step": 4250 }, { "epoch": 68.0, "step": 4250, "train_accuracy": 0.9771260261954001, "train_f1": 0.9770837683590446, "train_loss": 0.06861759722232819, "train_precision": 0.9771261688994373, "train_recall": 0.9771260261954001, "train_runtime": 258.9242, "train_samples_per_second": 61.628, "train_steps_per_second": 0.966 }, { "epoch": 68.0, "eval_accuracy": 0.9041713641488163, "eval_f1": 0.9032565731221586, "eval_loss": 0.440946489572525, "eval_precision": 0.9031641144165843, "eval_recall": 0.9041713641488163, "eval_runtime": 39.476, "eval_samples_per_second": 44.939, "eval_steps_per_second": 0.709, "step": 4250 }, { "epoch": 68.16, "learning_rate": 0.0003135483870967742, "loss": 0.1264, "step": 4260 }, { "epoch": 68.32, "learning_rate": 0.00031193548387096776, "loss": 0.1441, "step": 4270 }, { "epoch": 68.48, "learning_rate": 0.00031032258064516127, "loss": 0.127, "step": 4280 }, { "epoch": 68.64, "learning_rate": 0.0003087096774193548, "loss": 0.1392, "step": 4290 }, { "epoch": 68.8, "learning_rate": 0.0003070967741935484, "loss": 0.143, "step": 4300 }, { "epoch": 68.96, "learning_rate": 0.00030548387096774194, "loss": 0.1209, "step": 4310 }, { "epoch": 68.99, "step": 4312, "train_accuracy": 0.975621984082221, "train_f1": 0.9755696733303983, "train_loss": 0.07073085755109787, "train_precision": 0.9756366046304416, "train_recall": 0.975621984082221, "train_runtime": 256.8947, "train_samples_per_second": 62.115, "train_steps_per_second": 0.973 }, { "epoch": 68.99, "eval_accuracy": 0.9075535512965051, "eval_f1": 0.9068001649833212, "eval_loss": 0.4593234956264496, "eval_precision": 0.9074473642395492, "eval_recall": 0.9075535512965051, "eval_runtime": 44.7864, "eval_samples_per_second": 39.61, "eval_steps_per_second": 0.625, "step": 4312 }, { "epoch": 69.12, "learning_rate": 0.0003038709677419355, "loss": 0.1404, "step": 4320 }, { "epoch": 69.28, "learning_rate": 0.000302258064516129, "loss": 0.1417, "step": 4330 }, { "epoch": 69.44, "learning_rate": 0.0003006451612903226, "loss": 0.1137, "step": 4340 }, { "epoch": 69.6, "learning_rate": 0.0002990322580645161, "loss": 0.118, "step": 4350 }, { "epoch": 69.76, "learning_rate": 0.0002974193548387097, "loss": 0.1159, "step": 4360 }, { "epoch": 69.92, "learning_rate": 0.0002958064516129032, "loss": 0.1463, "step": 4370 }, { "epoch": 70.0, "step": 4375, "train_accuracy": 0.9780660525161371, "train_f1": 0.9780045954132663, "train_loss": 0.06600172072649002, "train_precision": 0.9780539223141508, "train_recall": 0.9780660525161371, "train_runtime": 257.4363, "train_samples_per_second": 61.984, "train_steps_per_second": 0.971 }, { "epoch": 70.0, "eval_accuracy": 0.9036076662908681, "eval_f1": 0.9023949767425765, "eval_loss": 0.4772753119468689, "eval_precision": 0.9028653821326578, "eval_recall": 0.9036076662908681, "eval_runtime": 40.3083, "eval_samples_per_second": 44.011, "eval_steps_per_second": 0.695, "step": 4375 }, { "epoch": 70.08, "learning_rate": 0.0002941935483870968, "loss": 0.1154, "step": 4380 }, { "epoch": 70.24, "learning_rate": 0.00029258064516129035, "loss": 0.1401, "step": 4390 }, { "epoch": 70.4, "learning_rate": 0.00029096774193548386, "loss": 0.1348, "step": 4400 }, { "epoch": 70.56, "learning_rate": 0.0002893548387096774, "loss": 0.1333, "step": 4410 }, { "epoch": 70.72, "learning_rate": 0.00028774193548387097, "loss": 0.1292, "step": 4420 }, { "epoch": 70.88, "learning_rate": 0.00028612903225806453, "loss": 0.1217, "step": 4430 }, { "epoch": 70.99, "step": 4437, "train_accuracy": 0.976562010402958, "train_f1": 0.976489238828708, "train_loss": 0.0662013366818428, "train_precision": 0.9765934380829007, "train_recall": 0.976562010402958, "train_runtime": 257.6318, "train_samples_per_second": 61.937, "train_steps_per_second": 0.97 }, { "epoch": 70.99, "eval_accuracy": 0.9098083427282976, "eval_f1": 0.9089720394690067, "eval_loss": 0.44329407811164856, "eval_precision": 0.9092946695808038, "eval_recall": 0.9098083427282976, "eval_runtime": 34.2569, "eval_samples_per_second": 51.785, "eval_steps_per_second": 0.817, "step": 4437 }, { "epoch": 71.04, "learning_rate": 0.0002845161290322581, "loss": 0.1271, "step": 4440 }, { "epoch": 71.2, "learning_rate": 0.0002829032258064516, "loss": 0.1108, "step": 4450 }, { "epoch": 71.36, "learning_rate": 0.0002812903225806452, "loss": 0.1156, "step": 4460 }, { "epoch": 71.52, "learning_rate": 0.0002796774193548387, "loss": 0.1385, "step": 4470 }, { "epoch": 71.68, "learning_rate": 0.00027806451612903227, "loss": 0.1333, "step": 4480 }, { "epoch": 71.84, "learning_rate": 0.00027645161290322577, "loss": 0.107, "step": 4490 }, { "epoch": 72.0, "learning_rate": 0.0002748387096774194, "loss": 0.1361, "step": 4500 }, { "epoch": 72.0, "step": 4500, "train_accuracy": 0.9758726577677508, "train_f1": 0.9758377736683368, "train_loss": 0.0710226520895958, "train_precision": 0.9758628894264394, "train_recall": 0.9758726577677508, "train_runtime": 260.0539, "train_samples_per_second": 61.36, "train_steps_per_second": 0.961 }, { "epoch": 72.0, "eval_accuracy": 0.9075535512965051, "eval_f1": 0.9071424091130842, "eval_loss": 0.43427780270576477, "eval_precision": 0.907402566021774, "eval_recall": 0.9075535512965051, "eval_runtime": 30.9428, "eval_samples_per_second": 57.332, "eval_steps_per_second": 0.905, "step": 4500 }, { "epoch": 72.16, "learning_rate": 0.00027322580645161294, "loss": 0.1166, "step": 4510 }, { "epoch": 72.32, "learning_rate": 0.00027161290322580645, "loss": 0.1422, "step": 4520 }, { "epoch": 72.48, "learning_rate": 0.00027, "loss": 0.1253, "step": 4530 }, { "epoch": 72.64, "learning_rate": 0.00026838709677419356, "loss": 0.1287, "step": 4540 }, { "epoch": 72.8, "learning_rate": 0.0002667741935483871, "loss": 0.1257, "step": 4550 }, { "epoch": 72.96, "learning_rate": 0.0002651612903225806, "loss": 0.1164, "step": 4560 }, { "epoch": 72.99, "step": 4562, "train_accuracy": 0.9780660525161371, "train_f1": 0.9780243494069962, "train_loss": 0.0632663145661354, "train_precision": 0.978042686088855, "train_recall": 0.9780660525161371, "train_runtime": 253.9785, "train_samples_per_second": 62.828, "train_steps_per_second": 0.984 }, { "epoch": 72.99, "eval_accuracy": 0.9013528748590756, "eval_f1": 0.90025705081473, "eval_loss": 0.4536808431148529, "eval_precision": 0.9003205156911865, "eval_recall": 0.9013528748590756, "eval_runtime": 30.6887, "eval_samples_per_second": 57.806, "eval_steps_per_second": 0.912, "step": 4562 }, { "epoch": 73.12, "learning_rate": 0.0002635483870967742, "loss": 0.1255, "step": 4570 }, { "epoch": 73.28, "learning_rate": 0.0002619354838709678, "loss": 0.1278, "step": 4580 }, { "epoch": 73.44, "learning_rate": 0.0002603225806451613, "loss": 0.1296, "step": 4590 }, { "epoch": 73.6, "learning_rate": 0.00025870967741935486, "loss": 0.1337, "step": 4600 }, { "epoch": 73.76, "learning_rate": 0.00025709677419354836, "loss": 0.1215, "step": 4610 }, { "epoch": 73.92, "learning_rate": 0.00025548387096774197, "loss": 0.1313, "step": 4620 }, { "epoch": 74.0, "step": 4625, "train_accuracy": 0.9766246788243405, "train_f1": 0.9765319317829301, "train_loss": 0.06763936579227448, "train_precision": 0.976670123477298, "train_recall": 0.9766246788243405, "train_runtime": 252.1633, "train_samples_per_second": 63.28, "train_steps_per_second": 0.991 }, { "epoch": 74.0, "eval_accuracy": 0.90304396843292, "eval_f1": 0.9020628517400072, "eval_loss": 0.44354888796806335, "eval_precision": 0.9022087129927616, "eval_recall": 0.90304396843292, "eval_runtime": 29.2384, "eval_samples_per_second": 60.674, "eval_steps_per_second": 0.958, "step": 4625 }, { "epoch": 74.08, "learning_rate": 0.0002538709677419355, "loss": 0.1295, "step": 4630 }, { "epoch": 74.24, "learning_rate": 0.00025225806451612903, "loss": 0.1257, "step": 4640 }, { "epoch": 74.4, "learning_rate": 0.0002506451612903226, "loss": 0.1009, "step": 4650 }, { "epoch": 74.56, "learning_rate": 0.00024903225806451615, "loss": 0.1254, "step": 4660 }, { "epoch": 74.72, "learning_rate": 0.00024741935483870965, "loss": 0.1291, "step": 4670 }, { "epoch": 74.88, "learning_rate": 0.00024580645161290327, "loss": 0.1291, "step": 4680 }, { "epoch": 74.99, "step": 4687, "train_accuracy": 0.97737669988093, "train_f1": 0.9773174710084362, "train_loss": 0.06480351090431213, "train_precision": 0.9773832839286731, "train_recall": 0.97737669988093, "train_runtime": 266.3469, "train_samples_per_second": 59.911, "train_steps_per_second": 0.939 }, { "epoch": 74.99, "eval_accuracy": 0.9052987598647125, "eval_f1": 0.9045329930179677, "eval_loss": 0.44802290201187134, "eval_precision": 0.9044815010640291, "eval_recall": 0.9052987598647125, "eval_runtime": 46.7594, "eval_samples_per_second": 37.939, "eval_steps_per_second": 0.599, "step": 4687 }, { "epoch": 75.04, "learning_rate": 0.00024419354838709677, "loss": 0.1316, "step": 4690 }, { "epoch": 75.2, "learning_rate": 0.00024258064516129033, "loss": 0.1315, "step": 4700 }, { "epoch": 75.36, "learning_rate": 0.0002409677419354839, "loss": 0.11, "step": 4710 }, { "epoch": 75.52, "learning_rate": 0.00023935483870967742, "loss": 0.1253, "step": 4720 }, { "epoch": 75.68, "learning_rate": 0.00023774193548387098, "loss": 0.1193, "step": 4730 }, { "epoch": 75.84, "learning_rate": 0.0002361290322580645, "loss": 0.1122, "step": 4740 }, { "epoch": 76.0, "learning_rate": 0.0002345161290322581, "loss": 0.132, "step": 4750 }, { "epoch": 76.0, "step": 4750, "train_accuracy": 0.9790060788368741, "train_f1": 0.9789581823313721, "train_loss": 0.060503240674734116, "train_precision": 0.9790325316940118, "train_recall": 0.9790060788368741, "train_runtime": 258.2855, "train_samples_per_second": 61.78, "train_steps_per_second": 0.968 }, { "epoch": 76.0, "eval_accuracy": 0.9058624577226606, "eval_f1": 0.904482480434317, "eval_loss": 0.46171513199806213, "eval_precision": 0.9050040535484158, "eval_recall": 0.9058624577226606, "eval_runtime": 42.9199, "eval_samples_per_second": 41.333, "eval_steps_per_second": 0.652, "step": 4750 }, { "epoch": 76.16, "learning_rate": 0.00023290322580645162, "loss": 0.1141, "step": 4760 }, { "epoch": 76.32, "learning_rate": 0.00023129032258064516, "loss": 0.111, "step": 4770 }, { "epoch": 76.48, "learning_rate": 0.0002296774193548387, "loss": 0.1362, "step": 4780 }, { "epoch": 76.64, "learning_rate": 0.00022806451612903224, "loss": 0.1303, "step": 4790 }, { "epoch": 76.8, "learning_rate": 0.0002264516129032258, "loss": 0.1128, "step": 4800 }, { "epoch": 76.96, "learning_rate": 0.00022483870967741936, "loss": 0.1197, "step": 4810 }, { "epoch": 76.99, "step": 4812, "train_accuracy": 0.9780033840947546, "train_f1": 0.9779246149243382, "train_loss": 0.06653548032045364, "train_precision": 0.9780194906548296, "train_recall": 0.9780033840947546, "train_runtime": 255.9446, "train_samples_per_second": 62.346, "train_steps_per_second": 0.977 }, { "epoch": 76.99, "eval_accuracy": 0.9058624577226606, "eval_f1": 0.904136777153852, "eval_loss": 0.45922645926475525, "eval_precision": 0.9042117586049208, "eval_recall": 0.9058624577226606, "eval_runtime": 37.615, "eval_samples_per_second": 47.162, "eval_steps_per_second": 0.744, "step": 4812 }, { "epoch": 77.12, "learning_rate": 0.00022322580645161292, "loss": 0.1185, "step": 4820 }, { "epoch": 77.28, "learning_rate": 0.00022161290322580645, "loss": 0.1297, "step": 4830 }, { "epoch": 77.44, "learning_rate": 0.00022, "loss": 0.1167, "step": 4840 }, { "epoch": 77.6, "learning_rate": 0.00021838709677419354, "loss": 0.1185, "step": 4850 }, { "epoch": 77.76, "learning_rate": 0.0002167741935483871, "loss": 0.1095, "step": 4860 }, { "epoch": 77.92, "learning_rate": 0.00021516129032258063, "loss": 0.1199, "step": 4870 }, { "epoch": 78.0, "step": 4875, "train_accuracy": 0.9789434104154916, "train_f1": 0.9789055395945256, "train_loss": 0.06331050395965576, "train_precision": 0.9789060427186901, "train_recall": 0.9789434104154916, "train_runtime": 255.8602, "train_samples_per_second": 62.366, "train_steps_per_second": 0.977 }, { "epoch": 78.0, "eval_accuracy": 0.9160090191657272, "eval_f1": 0.9156304372279399, "eval_loss": 0.4329167902469635, "eval_precision": 0.9156707582414666, "eval_recall": 0.9160090191657272, "eval_runtime": 36.868, "eval_samples_per_second": 48.118, "eval_steps_per_second": 0.759, "step": 4875 }, { "epoch": 78.08, "learning_rate": 0.0002135483870967742, "loss": 0.1098, "step": 4880 }, { "epoch": 78.24, "learning_rate": 0.00021193548387096774, "loss": 0.1134, "step": 4890 }, { "epoch": 78.4, "learning_rate": 0.0002103225806451613, "loss": 0.1103, "step": 4900 }, { "epoch": 78.56, "learning_rate": 0.00020870967741935483, "loss": 0.1266, "step": 4910 }, { "epoch": 78.72, "learning_rate": 0.0002070967741935484, "loss": 0.1083, "step": 4920 }, { "epoch": 78.88, "learning_rate": 0.00020548387096774192, "loss": 0.124, "step": 4930 }, { "epoch": 78.99, "step": 4937, "train_accuracy": 0.978191389358902, "train_f1": 0.9781684943478942, "train_loss": 0.06074240058660507, "train_precision": 0.9782183084448501, "train_recall": 0.978191389358902, "train_runtime": 255.7407, "train_samples_per_second": 62.395, "train_steps_per_second": 0.978 }, { "epoch": 78.99, "eval_accuracy": 0.9148816234498309, "eval_f1": 0.914220821168919, "eval_loss": 0.4336497485637665, "eval_precision": 0.9142236947687447, "eval_recall": 0.9148816234498309, "eval_runtime": 31.4364, "eval_samples_per_second": 56.431, "eval_steps_per_second": 0.891, "step": 4937 }, { "epoch": 79.04, "learning_rate": 0.00020387096774193548, "loss": 0.13, "step": 4940 }, { "epoch": 79.2, "learning_rate": 0.00020225806451612904, "loss": 0.1212, "step": 4950 }, { "epoch": 79.36, "learning_rate": 0.0002006451612903226, "loss": 0.0928, "step": 4960 }, { "epoch": 79.52, "learning_rate": 0.00019903225806451613, "loss": 0.1227, "step": 4970 }, { "epoch": 79.68, "learning_rate": 0.00019741935483870969, "loss": 0.1283, "step": 4980 }, { "epoch": 79.84, "learning_rate": 0.00019580645161290322, "loss": 0.1174, "step": 4990 }, { "epoch": 80.0, "learning_rate": 0.00019419354838709678, "loss": 0.118, "step": 5000 }, { "epoch": 80.0, "step": 5000, "train_accuracy": 0.9766246788243405, "train_f1": 0.9765541131510495, "train_loss": 0.0666293278336525, "train_precision": 0.9766229850859756, "train_recall": 0.9766246788243405, "train_runtime": 259.1008, "train_samples_per_second": 61.586, "train_steps_per_second": 0.965 }, { "epoch": 80.0, "eval_accuracy": 0.9086809470124013, "eval_f1": 0.90750875812957, "eval_loss": 0.45560184121131897, "eval_precision": 0.9079785564126395, "eval_recall": 0.9086809470124013, "eval_runtime": 31.9115, "eval_samples_per_second": 55.591, "eval_steps_per_second": 0.877, "step": 5000 }, { "epoch": 80.16, "learning_rate": 0.0001925806451612903, "loss": 0.0913, "step": 5010 }, { "epoch": 80.32, "learning_rate": 0.0001909677419354839, "loss": 0.124, "step": 5020 }, { "epoch": 80.48, "learning_rate": 0.00018935483870967742, "loss": 0.1009, "step": 5030 }, { "epoch": 80.64, "learning_rate": 0.00018774193548387098, "loss": 0.1101, "step": 5040 }, { "epoch": 80.8, "learning_rate": 0.0001861290322580645, "loss": 0.1066, "step": 5050 }, { "epoch": 80.96, "learning_rate": 0.00018451612903225807, "loss": 0.1135, "step": 5060 }, { "epoch": 80.99, "step": 5062, "train_accuracy": 0.9778153788306072, "train_f1": 0.9777754434919425, "train_loss": 0.0617908276617527, "train_precision": 0.9778452684709104, "train_recall": 0.9778153788306072, "train_runtime": 256.2036, "train_samples_per_second": 62.282, "train_steps_per_second": 0.976 }, { "epoch": 80.99, "eval_accuracy": 0.9098083427282976, "eval_f1": 0.9089912962963755, "eval_loss": 0.4518835246562958, "eval_precision": 0.9089474065575852, "eval_recall": 0.9098083427282976, "eval_runtime": 30.3175, "eval_samples_per_second": 58.514, "eval_steps_per_second": 0.924, "step": 5062 }, { "epoch": 81.12, "learning_rate": 0.0001829032258064516, "loss": 0.1126, "step": 5070 }, { "epoch": 81.28, "learning_rate": 0.0001812903225806452, "loss": 0.1193, "step": 5080 }, { "epoch": 81.44, "learning_rate": 0.00017967741935483872, "loss": 0.1, "step": 5090 }, { "epoch": 81.6, "learning_rate": 0.00017806451612903228, "loss": 0.1133, "step": 5100 }, { "epoch": 81.76, "learning_rate": 0.0001764516129032258, "loss": 0.1108, "step": 5110 }, { "epoch": 81.92, "learning_rate": 0.00017483870967741936, "loss": 0.1047, "step": 5120 }, { "epoch": 82.0, "step": 5125, "train_accuracy": 0.9804474525286708, "train_f1": 0.9803932668866718, "train_loss": 0.05864088237285614, "train_precision": 0.9804524158920493, "train_recall": 0.9804474525286708, "train_runtime": 255.5222, "train_samples_per_second": 62.449, "train_steps_per_second": 0.978 }, { "epoch": 82.0, "eval_accuracy": 0.9086809470124013, "eval_f1": 0.9077573719855858, "eval_loss": 0.46281760931015015, "eval_precision": 0.9078136987288633, "eval_recall": 0.9086809470124013, "eval_runtime": 29.6004, "eval_samples_per_second": 59.932, "eval_steps_per_second": 0.946, "step": 5125 }, { "epoch": 82.08, "learning_rate": 0.0001732258064516129, "loss": 0.1049, "step": 5130 }, { "epoch": 82.24, "learning_rate": 0.00017161290322580645, "loss": 0.1198, "step": 5140 }, { "epoch": 82.4, "learning_rate": 0.00017, "loss": 0.1013, "step": 5150 }, { "epoch": 82.56, "learning_rate": 0.00016838709677419357, "loss": 0.1196, "step": 5160 }, { "epoch": 82.72, "learning_rate": 0.0001667741935483871, "loss": 0.1076, "step": 5170 }, { "epoch": 82.88, "learning_rate": 0.00016516129032258066, "loss": 0.0977, "step": 5180 }, { "epoch": 82.99, "step": 5187, "train_accuracy": 0.9785047314658144, "train_f1": 0.9784666340134569, "train_loss": 0.061825916171073914, "train_precision": 0.9784978840692157, "train_recall": 0.9785047314658144, "train_runtime": 254.0139, "train_samples_per_second": 62.819, "train_steps_per_second": 0.984 }, { "epoch": 82.99, "eval_accuracy": 0.9098083427282976, "eval_f1": 0.9089103848523707, "eval_loss": 0.4576462209224701, "eval_precision": 0.9088881743285697, "eval_recall": 0.9098083427282976, "eval_runtime": 29.6463, "eval_samples_per_second": 59.839, "eval_steps_per_second": 0.944, "step": 5187 }, { "epoch": 83.04, "learning_rate": 0.0001635483870967742, "loss": 0.0983, "step": 5190 }, { "epoch": 83.2, "learning_rate": 0.00016193548387096775, "loss": 0.1126, "step": 5200 }, { "epoch": 83.36, "learning_rate": 0.00016032258064516128, "loss": 0.1362, "step": 5210 }, { "epoch": 83.52, "learning_rate": 0.00015870967741935487, "loss": 0.1073, "step": 5220 }, { "epoch": 83.68, "learning_rate": 0.0001570967741935484, "loss": 0.111, "step": 5230 }, { "epoch": 83.84, "learning_rate": 0.00015548387096774195, "loss": 0.1125, "step": 5240 }, { "epoch": 84.0, "learning_rate": 0.00015387096774193549, "loss": 0.1149, "step": 5250 }, { "epoch": 84.0, "step": 5250, "train_accuracy": 0.980886131478348, "train_f1": 0.9808510090193131, "train_loss": 0.05500573664903641, "train_precision": 0.9808883134493344, "train_recall": 0.980886131478348, "train_runtime": 260.1325, "train_samples_per_second": 61.342, "train_steps_per_second": 0.961 }, { "epoch": 84.0, "eval_accuracy": 0.9120631341600902, "eval_f1": 0.911138462348306, "eval_loss": 0.4605374038219452, "eval_precision": 0.9110930924781012, "eval_recall": 0.9120631341600902, "eval_runtime": 29.9251, "eval_samples_per_second": 59.281, "eval_steps_per_second": 0.936, "step": 5250 }, { "epoch": 84.16, "learning_rate": 0.00015225806451612904, "loss": 0.0955, "step": 5260 }, { "epoch": 84.32, "learning_rate": 0.00015064516129032257, "loss": 0.1187, "step": 5270 }, { "epoch": 84.48, "learning_rate": 0.0001490322580645161, "loss": 0.1101, "step": 5280 }, { "epoch": 84.64, "learning_rate": 0.0001474193548387097, "loss": 0.106, "step": 5290 }, { "epoch": 84.8, "learning_rate": 0.00014580645161290322, "loss": 0.099, "step": 5300 }, { "epoch": 84.96, "learning_rate": 0.00014419354838709678, "loss": 0.1241, "step": 5310 }, { "epoch": 84.99, "step": 5312, "train_accuracy": 0.9786927367299618, "train_f1": 0.9786376256812076, "train_loss": 0.0632563978433609, "train_precision": 0.9786888233858622, "train_recall": 0.9786927367299618, "train_runtime": 253.1029, "train_samples_per_second": 63.046, "train_steps_per_second": 0.988 }, { "epoch": 84.99, "eval_accuracy": 0.9131905298759865, "eval_f1": 0.9126492909049198, "eval_loss": 0.4541684687137604, "eval_precision": 0.9125019654104216, "eval_recall": 0.9131905298759865, "eval_runtime": 36.7528, "eval_samples_per_second": 48.268, "eval_steps_per_second": 0.762, "step": 5312 }, { "epoch": 85.12, "learning_rate": 0.0001425806451612903, "loss": 0.1174, "step": 5320 }, { "epoch": 85.28, "learning_rate": 0.00014096774193548387, "loss": 0.1129, "step": 5330 }, { "epoch": 85.44, "learning_rate": 0.0001393548387096774, "loss": 0.0965, "step": 5340 }, { "epoch": 85.6, "learning_rate": 0.00013774193548387099, "loss": 0.0996, "step": 5350 }, { "epoch": 85.76, "learning_rate": 0.00013612903225806452, "loss": 0.1188, "step": 5360 }, { "epoch": 85.92, "learning_rate": 0.00013451612903225807, "loss": 0.1262, "step": 5370 }, { "epoch": 86.0, "step": 5375, "train_accuracy": 0.9786927367299618, "train_f1": 0.9786430332999637, "train_loss": 0.06230182945728302, "train_precision": 0.9787228334576183, "train_recall": 0.9786927367299618, "train_runtime": 254.0805, "train_samples_per_second": 62.803, "train_steps_per_second": 0.984 }, { "epoch": 86.0, "eval_accuracy": 0.9081172491544532, "eval_f1": 0.9073973897547527, "eval_loss": 0.45515382289886475, "eval_precision": 0.9074033025441, "eval_recall": 0.9081172491544532, "eval_runtime": 29.4676, "eval_samples_per_second": 60.202, "eval_steps_per_second": 0.95, "step": 5375 }, { "epoch": 86.08, "learning_rate": 0.0001329032258064516, "loss": 0.1058, "step": 5380 }, { "epoch": 86.24, "learning_rate": 0.00013129032258064516, "loss": 0.1131, "step": 5390 }, { "epoch": 86.4, "learning_rate": 0.0001296774193548387, "loss": 0.1009, "step": 5400 }, { "epoch": 86.56, "learning_rate": 0.00012806451612903225, "loss": 0.1047, "step": 5410 }, { "epoch": 86.72, "learning_rate": 0.0001264516129032258, "loss": 0.1055, "step": 5420 }, { "epoch": 86.88, "learning_rate": 0.00012483870967741934, "loss": 0.1114, "step": 5430 }, { "epoch": 86.99, "step": 5437, "train_accuracy": 0.9789434104154916, "train_f1": 0.9788727186488501, "train_loss": 0.05873732641339302, "train_precision": 0.9789898516890257, "train_recall": 0.9789434104154916, "train_runtime": 252.3787, "train_samples_per_second": 63.226, "train_steps_per_second": 0.991 }, { "epoch": 86.99, "eval_accuracy": 0.9081172491544532, "eval_f1": 0.907050844291005, "eval_loss": 0.46865400671958923, "eval_precision": 0.9071698989671065, "eval_recall": 0.9081172491544532, "eval_runtime": 29.1201, "eval_samples_per_second": 60.92, "eval_steps_per_second": 0.962, "step": 5437 }, { "epoch": 87.04, "learning_rate": 0.0001232258064516129, "loss": 0.0953, "step": 5440 }, { "epoch": 87.2, "learning_rate": 0.00012161290322580646, "loss": 0.0895, "step": 5450 }, { "epoch": 87.36, "learning_rate": 0.00012, "loss": 0.1122, "step": 5460 }, { "epoch": 87.52, "learning_rate": 0.00011838709677419356, "loss": 0.1169, "step": 5470 }, { "epoch": 87.68, "learning_rate": 0.0001167741935483871, "loss": 0.1031, "step": 5480 }, { "epoch": 87.84, "learning_rate": 0.00011516129032258065, "loss": 0.1052, "step": 5490 }, { "epoch": 88.0, "learning_rate": 0.00011354838709677421, "loss": 0.0835, "step": 5500 }, { "epoch": 88.0, "step": 5500, "train_accuracy": 0.9811994735852604, "train_f1": 0.9811537862655559, "train_loss": 0.05588332563638687, "train_precision": 0.9812213014473542, "train_recall": 0.9811994735852604, "train_runtime": 251.2614, "train_samples_per_second": 63.508, "train_steps_per_second": 0.995 }, { "epoch": 88.0, "eval_accuracy": 0.9098083427282976, "eval_f1": 0.908811337868185, "eval_loss": 0.4702069163322449, "eval_precision": 0.9089224577124531, "eval_recall": 0.9098083427282976, "eval_runtime": 29.3425, "eval_samples_per_second": 60.458, "eval_steps_per_second": 0.954, "step": 5500 }, { "epoch": 88.16, "learning_rate": 0.00011193548387096775, "loss": 0.1158, "step": 5510 }, { "epoch": 88.32, "learning_rate": 0.0001103225806451613, "loss": 0.1029, "step": 5520 }, { "epoch": 88.48, "learning_rate": 0.00010870967741935483, "loss": 0.0978, "step": 5530 }, { "epoch": 88.64, "learning_rate": 0.00010709677419354839, "loss": 0.1028, "step": 5540 }, { "epoch": 88.8, "learning_rate": 0.00010548387096774193, "loss": 0.1053, "step": 5550 }, { "epoch": 88.96, "learning_rate": 0.00010387096774193548, "loss": 0.1174, "step": 5560 }, { "epoch": 88.99, "step": 5562, "train_accuracy": 0.9806981262142007, "train_f1": 0.980651790063678, "train_loss": 0.05491610988974571, "train_precision": 0.9806996834447476, "train_recall": 0.9806981262142007, "train_runtime": 252.31, "train_samples_per_second": 63.244, "train_steps_per_second": 0.991 }, { "epoch": 88.99, "eval_accuracy": 0.9058624577226606, "eval_f1": 0.9047448567468519, "eval_loss": 0.4772195518016815, "eval_precision": 0.9049010825589036, "eval_recall": 0.9058624577226606, "eval_runtime": 29.443, "eval_samples_per_second": 60.252, "eval_steps_per_second": 0.951, "step": 5562 }, { "epoch": 89.12, "learning_rate": 0.00010225806451612903, "loss": 0.1106, "step": 5570 }, { "epoch": 89.28, "learning_rate": 0.00010064516129032258, "loss": 0.0965, "step": 5580 }, { "epoch": 89.44, "learning_rate": 9.903225806451612e-05, "loss": 0.1145, "step": 5590 }, { "epoch": 89.6, "learning_rate": 9.741935483870967e-05, "loss": 0.1069, "step": 5600 }, { "epoch": 89.76, "learning_rate": 9.580645161290323e-05, "loss": 0.1008, "step": 5610 }, { "epoch": 89.92, "learning_rate": 9.419354838709677e-05, "loss": 0.103, "step": 5620 }, { "epoch": 90.0, "step": 5625, "train_accuracy": 0.9815754841135552, "train_f1": 0.9815346716904167, "train_loss": 0.05348266288638115, "train_precision": 0.9815797384790222, "train_recall": 0.9815754841135552, "train_runtime": 252.062, "train_samples_per_second": 63.306, "train_steps_per_second": 0.992 }, { "epoch": 90.0, "eval_accuracy": 0.9075535512965051, "eval_f1": 0.9065308517183118, "eval_loss": 0.4701833724975586, "eval_precision": 0.9065469838144254, "eval_recall": 0.9075535512965051, "eval_runtime": 29.5689, "eval_samples_per_second": 59.995, "eval_steps_per_second": 0.947, "step": 5625 }, { "epoch": 90.08, "learning_rate": 9.258064516129032e-05, "loss": 0.0977, "step": 5630 }, { "epoch": 90.24, "learning_rate": 9.096774193548387e-05, "loss": 0.0948, "step": 5640 }, { "epoch": 90.4, "learning_rate": 8.935483870967742e-05, "loss": 0.0803, "step": 5650 }, { "epoch": 90.56, "learning_rate": 8.774193548387096e-05, "loss": 0.1025, "step": 5660 }, { "epoch": 90.72, "learning_rate": 8.612903225806452e-05, "loss": 0.1056, "step": 5670 }, { "epoch": 90.88, "learning_rate": 8.451612903225807e-05, "loss": 0.1086, "step": 5680 }, { "epoch": 90.99, "step": 5687, "train_accuracy": 0.9794447577865514, "train_f1": 0.9794042503142155, "train_loss": 0.05922425910830498, "train_precision": 0.979461044879249, "train_recall": 0.9794447577865514, "train_runtime": 253.2112, "train_samples_per_second": 63.019, "train_steps_per_second": 0.987 }, { "epoch": 90.99, "eval_accuracy": 0.9081172491544532, "eval_f1": 0.9074336656449804, "eval_loss": 0.4727869927883148, "eval_precision": 0.9075490421138191, "eval_recall": 0.9081172491544532, "eval_runtime": 29.3104, "eval_samples_per_second": 60.525, "eval_steps_per_second": 0.955, "step": 5687 }, { "epoch": 91.04, "learning_rate": 8.290322580645161e-05, "loss": 0.1074, "step": 5690 }, { "epoch": 91.2, "learning_rate": 8.129032258064515e-05, "loss": 0.1017, "step": 5700 }, { "epoch": 91.36, "learning_rate": 7.967741935483871e-05, "loss": 0.0971, "step": 5710 }, { "epoch": 91.52, "learning_rate": 7.806451612903226e-05, "loss": 0.1191, "step": 5720 }, { "epoch": 91.68, "learning_rate": 7.64516129032258e-05, "loss": 0.0995, "step": 5730 }, { "epoch": 91.84, "learning_rate": 7.483870967741936e-05, "loss": 0.1142, "step": 5740 }, { "epoch": 92.0, "learning_rate": 7.32258064516129e-05, "loss": 0.1087, "step": 5750 }, { "epoch": 92.0, "step": 5750, "train_accuracy": 0.9796954314720813, "train_f1": 0.9796272548376432, "train_loss": 0.05848938599228859, "train_precision": 0.9797640627474504, "train_recall": 0.9796954314720813, "train_runtime": 254.0646, "train_samples_per_second": 62.807, "train_steps_per_second": 0.984 }, { "epoch": 92.0, "eval_accuracy": 0.9075535512965051, "eval_f1": 0.9065640932569152, "eval_loss": 0.4691586196422577, "eval_precision": 0.9068629961295476, "eval_recall": 0.9075535512965051, "eval_runtime": 29.6211, "eval_samples_per_second": 59.89, "eval_steps_per_second": 0.945, "step": 5750 }, { "epoch": 92.16, "learning_rate": 7.161290322580645e-05, "loss": 0.1036, "step": 5760 }, { "epoch": 92.32, "learning_rate": 7.000000000000001e-05, "loss": 0.0991, "step": 5770 }, { "epoch": 92.48, "learning_rate": 6.838709677419355e-05, "loss": 0.1042, "step": 5780 }, { "epoch": 92.64, "learning_rate": 6.67741935483871e-05, "loss": 0.0997, "step": 5790 }, { "epoch": 92.8, "learning_rate": 6.516129032258064e-05, "loss": 0.0921, "step": 5800 }, { "epoch": 92.96, "learning_rate": 6.35483870967742e-05, "loss": 0.1041, "step": 5810 }, { "epoch": 92.99, "step": 5812, "train_accuracy": 0.979131415679639, "train_f1": 0.9790799084691278, "train_loss": 0.0558781623840332, "train_precision": 0.9791236279775183, "train_recall": 0.979131415679639, "train_runtime": 253.4519, "train_samples_per_second": 62.959, "train_steps_per_second": 0.986 }, { "epoch": 92.99, "eval_accuracy": 0.9086809470124013, "eval_f1": 0.9078901238987158, "eval_loss": 0.45839613676071167, "eval_precision": 0.9079266988153948, "eval_recall": 0.9086809470124013, "eval_runtime": 29.4342, "eval_samples_per_second": 60.27, "eval_steps_per_second": 0.951, "step": 5812 }, { "epoch": 93.12, "learning_rate": 6.193548387096774e-05, "loss": 0.116, "step": 5820 }, { "epoch": 93.28, "learning_rate": 6.0322580645161295e-05, "loss": 0.103, "step": 5830 }, { "epoch": 93.44, "learning_rate": 5.870967741935484e-05, "loss": 0.1129, "step": 5840 }, { "epoch": 93.6, "learning_rate": 5.709677419354839e-05, "loss": 0.1034, "step": 5850 }, { "epoch": 93.76, "learning_rate": 5.5483870967741936e-05, "loss": 0.1134, "step": 5860 }, { "epoch": 93.92, "learning_rate": 5.387096774193549e-05, "loss": 0.1109, "step": 5870 }, { "epoch": 94.0, "step": 5875, "train_accuracy": 0.9796327630506988, "train_f1": 0.9795750790681897, "train_loss": 0.05882110819220543, "train_precision": 0.9796458578935032, "train_recall": 0.9796327630506988, "train_runtime": 253.4567, "train_samples_per_second": 62.957, "train_steps_per_second": 0.986 }, { "epoch": 94.0, "eval_accuracy": 0.9092446448703495, "eval_f1": 0.9084684905580462, "eval_loss": 0.45630526542663574, "eval_precision": 0.9085750924367912, "eval_recall": 0.9092446448703495, "eval_runtime": 29.3382, "eval_samples_per_second": 60.467, "eval_steps_per_second": 0.954, "step": 5875 }, { "epoch": 94.08, "learning_rate": 5.225806451612904e-05, "loss": 0.0848, "step": 5880 }, { "epoch": 94.24, "learning_rate": 5.064516129032258e-05, "loss": 0.1063, "step": 5890 }, { "epoch": 94.4, "learning_rate": 4.9032258064516135e-05, "loss": 0.0929, "step": 5900 }, { "epoch": 94.56, "learning_rate": 4.741935483870968e-05, "loss": 0.1039, "step": 5910 }, { "epoch": 94.72, "learning_rate": 4.580645161290323e-05, "loss": 0.099, "step": 5920 }, { "epoch": 94.88, "learning_rate": 4.4193548387096775e-05, "loss": 0.1026, "step": 5930 }, { "epoch": 94.99, "step": 5937, "train_accuracy": 0.9824528420129097, "train_f1": 0.9824112060096897, "train_loss": 0.05392773821949959, "train_precision": 0.9824786275566851, "train_recall": 0.9824528420129097, "train_runtime": 252.5661, "train_samples_per_second": 63.179, "train_steps_per_second": 0.99 }, { "epoch": 94.99, "eval_accuracy": 0.9126268320180383, "eval_f1": 0.9117417948122799, "eval_loss": 0.4614848494529724, "eval_precision": 0.911808467672524, "eval_recall": 0.9126268320180383, "eval_runtime": 29.3223, "eval_samples_per_second": 60.5, "eval_steps_per_second": 0.955, "step": 5937 }, { "epoch": 95.04, "learning_rate": 4.258064516129032e-05, "loss": 0.1026, "step": 5940 }, { "epoch": 95.2, "learning_rate": 4.096774193548387e-05, "loss": 0.0942, "step": 5950 }, { "epoch": 95.36, "learning_rate": 3.9354838709677416e-05, "loss": 0.0936, "step": 5960 }, { "epoch": 95.52, "learning_rate": 3.774193548387097e-05, "loss": 0.0833, "step": 5970 }, { "epoch": 95.68, "learning_rate": 3.612903225806452e-05, "loss": 0.096, "step": 5980 }, { "epoch": 95.84, "learning_rate": 3.451612903225806e-05, "loss": 0.106, "step": 5990 }, { "epoch": 96.0, "learning_rate": 3.2903225806451614e-05, "loss": 0.0895, "step": 6000 }, { "epoch": 96.0, "step": 6000, "train_accuracy": 0.9817634893777025, "train_f1": 0.9817217910538368, "train_loss": 0.053316567093133926, "train_precision": 0.981748670799393, "train_recall": 0.9817634893777025, "train_runtime": 254.5693, "train_samples_per_second": 62.682, "train_steps_per_second": 0.982 }, { "epoch": 96.0, "eval_accuracy": 0.9092446448703495, "eval_f1": 0.908628347766777, "eval_loss": 0.4585205316543579, "eval_precision": 0.9086756206676724, "eval_recall": 0.9092446448703495, "eval_runtime": 29.7078, "eval_samples_per_second": 59.715, "eval_steps_per_second": 0.943, "step": 6000 }, { "epoch": 96.16, "learning_rate": 3.129032258064516e-05, "loss": 0.1019, "step": 6010 }, { "epoch": 96.32, "learning_rate": 2.967741935483871e-05, "loss": 0.1046, "step": 6020 }, { "epoch": 96.48, "learning_rate": 2.806451612903226e-05, "loss": 0.125, "step": 6030 }, { "epoch": 96.64, "learning_rate": 2.6451612903225806e-05, "loss": 0.0977, "step": 6040 }, { "epoch": 96.8, "learning_rate": 2.4838709677419354e-05, "loss": 0.104, "step": 6050 }, { "epoch": 96.96, "learning_rate": 2.3225806451612906e-05, "loss": 0.1045, "step": 6060 }, { "epoch": 96.99, "step": 6062, "train_accuracy": 0.9817008209563202, "train_f1": 0.9816508134314273, "train_loss": 0.05279777571558952, "train_precision": 0.9816910608821193, "train_recall": 0.9817008209563202, "train_runtime": 252.7534, "train_samples_per_second": 63.133, "train_steps_per_second": 0.989 }, { "epoch": 96.99, "eval_accuracy": 0.9098083427282976, "eval_f1": 0.909112926020381, "eval_loss": 0.45533671975135803, "eval_precision": 0.9090721377215957, "eval_recall": 0.9098083427282976, "eval_runtime": 33.0675, "eval_samples_per_second": 53.648, "eval_steps_per_second": 0.847, "step": 6062 }, { "epoch": 97.12, "learning_rate": 2.1612903225806454e-05, "loss": 0.0862, "step": 6070 }, { "epoch": 97.28, "learning_rate": 2e-05, "loss": 0.1078, "step": 6080 }, { "epoch": 97.44, "learning_rate": 1.838709677419355e-05, "loss": 0.1078, "step": 6090 }, { "epoch": 97.6, "learning_rate": 1.6774193548387098e-05, "loss": 0.107, "step": 6100 }, { "epoch": 97.76, "learning_rate": 1.5161290322580646e-05, "loss": 0.1139, "step": 6110 }, { "epoch": 97.92, "learning_rate": 1.3548387096774194e-05, "loss": 0.1081, "step": 6120 }, { "epoch": 98.0, "step": 6125, "train_accuracy": 0.9812621420066429, "train_f1": 0.9812114737389049, "train_loss": 0.054921120405197144, "train_precision": 0.9812508070970374, "train_recall": 0.9812621420066429, "train_runtime": 252.6106, "train_samples_per_second": 63.168, "train_steps_per_second": 0.99 }, { "epoch": 98.0, "eval_accuracy": 0.9103720405862458, "eval_f1": 0.9096321309054232, "eval_loss": 0.4532192647457123, "eval_precision": 0.9096536769299824, "eval_recall": 0.9103720405862458, "eval_runtime": 29.6384, "eval_samples_per_second": 59.855, "eval_steps_per_second": 0.945, "step": 6125 }, { "epoch": 98.08, "learning_rate": 1.1935483870967743e-05, "loss": 0.1011, "step": 6130 }, { "epoch": 98.24, "learning_rate": 1.0322580645161291e-05, "loss": 0.1031, "step": 6140 }, { "epoch": 98.4, "learning_rate": 8.709677419354838e-06, "loss": 0.0821, "step": 6150 }, { "epoch": 98.56, "learning_rate": 7.096774193548388e-06, "loss": 0.0901, "step": 6160 }, { "epoch": 98.72, "learning_rate": 5.483870967741935e-06, "loss": 0.0809, "step": 6170 }, { "epoch": 98.88, "learning_rate": 3.870967741935484e-06, "loss": 0.0932, "step": 6180 }, { "epoch": 98.99, "step": 6187, "train_accuracy": 0.9805101209500533, "train_f1": 0.9804742522228167, "train_loss": 0.055186156183481216, "train_precision": 0.980498073403408, "train_recall": 0.9805101209500533, "train_runtime": 254.3736, "train_samples_per_second": 62.731, "train_steps_per_second": 0.983 }, { "epoch": 98.99, "eval_accuracy": 0.9098083427282976, "eval_f1": 0.9090900239365977, "eval_loss": 0.4536750614643097, "eval_precision": 0.9091114953941556, "eval_recall": 0.9098083427282976, "eval_runtime": 29.5537, "eval_samples_per_second": 60.026, "eval_steps_per_second": 0.947, "step": 6187 }, { "epoch": 99.04, "learning_rate": 2.2580645161290324e-06, "loss": 0.1136, "step": 6190 }, { "epoch": 99.2, "learning_rate": 6.451612903225807e-07, "loss": 0.0934, "step": 6200 }, { "epoch": 99.2, "step": 6200, "train_accuracy": 0.9809487998997305, "train_f1": 0.9809066394306372, "train_loss": 0.05620851740241051, "train_precision": 0.9809434303564252, "train_recall": 0.9809487998997305, "train_runtime": 257.0414, "train_samples_per_second": 62.08, "train_steps_per_second": 0.973 }, { "epoch": 99.2, "eval_accuracy": 0.9098083427282976, "eval_f1": 0.9090900239365977, "eval_loss": 0.4539656639099121, "eval_precision": 0.9091114953941556, "eval_recall": 0.9098083427282976, "eval_runtime": 29.6217, "eval_samples_per_second": 59.889, "eval_steps_per_second": 0.945, "step": 6200 }, { "epoch": 99.2, "step": 6200, "total_flos": 9.4522774317222e+19, "train_loss": 0.2388173005080992, "train_runtime": 58791.9316, "train_samples_per_second": 27.141, "train_steps_per_second": 0.105 } ], "logging_steps": 10, "max_steps": 6200, "num_train_epochs": 100, "save_steps": 500, "total_flos": 9.4522774317222e+19, "trial_name": null, "trial_params": null }