{ "best_metric": 0.9564356435643564, "best_model_checkpoint": "/content/drive/MyDrive/wav2vec2-base2_temp/checkpoint-22702", "epoch": 44.9990089197225, "global_step": 22702, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.99, "learning_rate": 5.869047619047619e-07, "loss": 1.7909, "step": 500 }, { "epoch": 1.0, "eval_accuracy": 0.22574257425742575, "eval_f1": 0.08821474321649003, "eval_loss": 1.7777053117752075, "eval_precision": 0.11965788905676666, "eval_recall": 0.17184714795008912, "eval_runtime": 11.4913, "eval_samples_per_second": 43.946, "eval_steps_per_second": 11.052, "step": 504 }, { "epoch": 1.98, "learning_rate": 1.1797619047619049e-06, "loss": 1.7457, "step": 1000 }, { "epoch": 2.0, "eval_accuracy": 0.3485148514851485, "eval_f1": 0.08614782183064122, "eval_loss": 1.6808362007141113, "eval_precision": 0.05808580858085808, "eval_recall": 0.16666666666666666, "eval_runtime": 9.5448, "eval_samples_per_second": 52.908, "eval_steps_per_second": 13.306, "step": 1009 }, { "epoch": 2.97, "learning_rate": 1.775e-06, "loss": 1.6522, "step": 1500 }, { "epoch": 3.0, "eval_accuracy": 0.4277227722772277, "eval_f1": 0.2012091077291391, "eval_loss": 1.5670676231384277, "eval_precision": 0.21909966172261253, "eval_recall": 0.25960391732450555, "eval_runtime": 11.3538, "eval_samples_per_second": 44.479, "eval_steps_per_second": 11.186, "step": 1513 }, { "epoch": 3.96, "learning_rate": 2.3702380952380955e-06, "loss": 1.5185, "step": 2000 }, { "epoch": 4.0, "eval_accuracy": 0.5881188118811881, "eval_f1": 0.3725029550190217, "eval_loss": 1.3283705711364746, "eval_precision": 0.44973544973544977, "eval_recall": 0.42331231676819914, "eval_runtime": 10.0287, "eval_samples_per_second": 50.356, "eval_steps_per_second": 12.664, "step": 2018 }, { "epoch": 4.96, "learning_rate": 2.9654761904761905e-06, "loss": 1.2985, "step": 2500 }, { "epoch": 5.0, "eval_accuracy": 0.6772277227722773, "eval_f1": 0.4729958594455382, "eval_loss": 1.0731083154678345, "eval_precision": 0.43875160660457085, "eval_recall": 0.528141923436041, "eval_runtime": 12.9008, "eval_samples_per_second": 39.145, "eval_steps_per_second": 9.844, "step": 2522 }, { "epoch": 5.95, "learning_rate": 3.5595238095238097e-06, "loss": 1.0891, "step": 3000 }, { "epoch": 6.0, "eval_accuracy": 0.6871287128712872, "eval_f1": 0.5190569356664213, "eval_loss": 0.9219310879707336, "eval_precision": 0.5714776497659865, "eval_recall": 0.5614828961887786, "eval_runtime": 11.3089, "eval_samples_per_second": 44.655, "eval_steps_per_second": 11.23, "step": 3027 }, { "epoch": 6.94, "learning_rate": 4.152380952380952e-06, "loss": 0.898, "step": 3500 }, { "epoch": 7.0, "eval_accuracy": 0.7623762376237624, "eval_f1": 0.6067418025396825, "eval_loss": 0.7551212906837463, "eval_precision": 0.6263669695520484, "eval_recall": 0.6273902894491129, "eval_runtime": 10.502, "eval_samples_per_second": 48.086, "eval_steps_per_second": 12.093, "step": 3531 }, { "epoch": 7.93, "learning_rate": 4.7476190476190475e-06, "loss": 0.7131, "step": 4000 }, { "epoch": 8.0, "eval_accuracy": 0.8237623762376237, "eval_f1": 0.6820230695773629, "eval_loss": 0.5713428258895874, "eval_precision": 0.6794105204506714, "eval_recall": 0.7097026992615229, "eval_runtime": 11.2886, "eval_samples_per_second": 44.736, "eval_steps_per_second": 11.25, "step": 4036 }, { "epoch": 8.92, "learning_rate": 5.342857142857143e-06, "loss": 0.5432, "step": 4500 }, { "epoch": 9.0, "eval_accuracy": 0.8613861386138614, "eval_f1": 0.7306731549704363, "eval_loss": 0.4402145743370056, "eval_precision": 0.7078735307061095, "eval_recall": 0.7635915881504117, "eval_runtime": 10.2752, "eval_samples_per_second": 49.147, "eval_steps_per_second": 12.36, "step": 4540 }, { "epoch": 9.91, "learning_rate": 5.9380952380952385e-06, "loss": 0.4296, "step": 5000 }, { "epoch": 10.0, "eval_accuracy": 0.8534653465346534, "eval_f1": 0.7203056745493539, "eval_loss": 0.42783123254776, "eval_precision": 0.7042866897841077, "eval_recall": 0.7496972880061116, "eval_runtime": 10.0025, "eval_samples_per_second": 50.488, "eval_steps_per_second": 12.697, "step": 5045 }, { "epoch": 10.9, "learning_rate": 6.532142857142857e-06, "loss": 0.3869, "step": 5500 }, { "epoch": 11.0, "eval_accuracy": 0.8772277227722772, "eval_f1": 0.7461735637601347, "eval_loss": 0.3639691174030304, "eval_precision": 0.7306143706983171, "eval_recall": 0.7771949537390714, "eval_runtime": 12.5987, "eval_samples_per_second": 40.083, "eval_steps_per_second": 10.08, "step": 5549 }, { "epoch": 11.89, "learning_rate": 7.127380952380952e-06, "loss": 0.3606, "step": 6000 }, { "epoch": 12.0, "eval_accuracy": 0.8673267326732673, "eval_f1": 0.7317576200752773, "eval_loss": 0.4499942660331726, "eval_precision": 0.7133735090373348, "eval_recall": 0.7651407987437399, "eval_runtime": 10.9939, "eval_samples_per_second": 45.934, "eval_steps_per_second": 11.552, "step": 6054 }, { "epoch": 12.88, "learning_rate": 7.722619047619049e-06, "loss": 0.3626, "step": 6500 }, { "epoch": 13.0, "eval_accuracy": 0.8653465346534653, "eval_f1": 0.7374268578667081, "eval_loss": 0.460127055644989, "eval_precision": 0.7374934142677786, "eval_recall": 0.7631706773618538, "eval_runtime": 10.5614, "eval_samples_per_second": 47.816, "eval_steps_per_second": 12.025, "step": 6558 }, { "epoch": 13.88, "learning_rate": 8.317857142857142e-06, "loss": 0.3276, "step": 7000 }, { "epoch": 14.0, "eval_accuracy": 0.8732673267326733, "eval_f1": 0.7421428470955433, "eval_loss": 0.41789284348487854, "eval_precision": 0.7395445813585981, "eval_recall": 0.7673902894491129, "eval_runtime": 10.505, "eval_samples_per_second": 48.072, "eval_steps_per_second": 12.09, "step": 7063 }, { "epoch": 14.87, "learning_rate": 8.913095238095238e-06, "loss": 0.3327, "step": 7500 }, { "epoch": 15.0, "eval_accuracy": 0.8910891089108911, "eval_f1": 0.7616771274725501, "eval_loss": 0.3447856605052948, "eval_precision": 0.7497788374032539, "eval_recall": 0.7904575163398694, "eval_runtime": 10.1528, "eval_samples_per_second": 49.74, "eval_steps_per_second": 12.509, "step": 7567 }, { "epoch": 15.86, "learning_rate": 9.508333333333333e-06, "loss": 0.3043, "step": 8000 }, { "epoch": 16.0, "eval_accuracy": 0.8851485148514852, "eval_f1": 0.7518326259740746, "eval_loss": 0.3687730133533478, "eval_precision": 0.7422745662572229, "eval_recall": 0.7788982259570495, "eval_runtime": 11.1359, "eval_samples_per_second": 45.349, "eval_steps_per_second": 11.405, "step": 8072 }, { "epoch": 16.85, "learning_rate": 1.0103571428571429e-05, "loss": 0.3127, "step": 8500 }, { "epoch": 17.0, "eval_accuracy": 0.8891089108910891, "eval_f1": 0.7565562985281078, "eval_loss": 0.3414187431335449, "eval_precision": 0.7434316232942377, "eval_recall": 0.7861912189118071, "eval_runtime": 10.7404, "eval_samples_per_second": 47.019, "eval_steps_per_second": 11.824, "step": 8576 }, { "epoch": 17.84, "learning_rate": 1.0698809523809525e-05, "loss": 0.306, "step": 9000 }, { "epoch": 18.0, "eval_accuracy": 0.8792079207920792, "eval_f1": 0.7478424649155898, "eval_loss": 0.4159949719905853, "eval_precision": 0.7357367052282306, "eval_recall": 0.7744677871148459, "eval_runtime": 10.479, "eval_samples_per_second": 48.192, "eval_steps_per_second": 12.119, "step": 9081 }, { "epoch": 18.83, "learning_rate": 1.1294047619047618e-05, "loss": 0.2756, "step": 9500 }, { "epoch": 19.0, "eval_accuracy": 0.8495049504950495, "eval_f1": 0.7182407626265085, "eval_loss": 0.7052268981933594, "eval_precision": 0.7064460784313725, "eval_recall": 0.7463492063492062, "eval_runtime": 11.111, "eval_samples_per_second": 45.45, "eval_steps_per_second": 11.43, "step": 9585 }, { "epoch": 19.82, "learning_rate": 1.1888095238095239e-05, "loss": 0.3233, "step": 10000 }, { "epoch": 20.0, "eval_accuracy": 0.904950495049505, "eval_f1": 0.7712251064475479, "eval_loss": 0.2911510169506073, "eval_precision": 0.7413165742555666, "eval_recall": 0.8109531236737119, "eval_runtime": 10.6787, "eval_samples_per_second": 47.29, "eval_steps_per_second": 11.893, "step": 10090 }, { "epoch": 20.81, "learning_rate": 1.2483333333333333e-05, "loss": 0.2932, "step": 10500 }, { "epoch": 21.0, "eval_accuracy": 0.904950495049505, "eval_f1": 0.8543450476033496, "eval_loss": 0.42383888363838196, "eval_precision": 0.8654226983060155, "eval_recall": 0.853277359895007, "eval_runtime": 9.6742, "eval_samples_per_second": 52.201, "eval_steps_per_second": 13.128, "step": 10594 }, { "epoch": 21.8, "learning_rate": 1.307857142857143e-05, "loss": 0.2698, "step": 11000 }, { "epoch": 22.0, "eval_accuracy": 0.9128712871287129, "eval_f1": 0.8604450377673127, "eval_loss": 0.386119544506073, "eval_precision": 0.9000550023499306, "eval_recall": 0.8544778424190188, "eval_runtime": 11.5253, "eval_samples_per_second": 43.817, "eval_steps_per_second": 11.019, "step": 11099 }, { "epoch": 22.79, "learning_rate": 1.3673809523809524e-05, "loss": 0.2658, "step": 11500 }, { "epoch": 23.0, "eval_accuracy": 0.9366336633663367, "eval_f1": 0.9043163728295133, "eval_loss": 0.336636483669281, "eval_precision": 0.9078665759004835, "eval_recall": 0.9021482439129498, "eval_runtime": 11.333, "eval_samples_per_second": 44.56, "eval_steps_per_second": 11.206, "step": 11603 }, { "epoch": 23.79, "learning_rate": 1.426904761904762e-05, "loss": 0.2393, "step": 12000 }, { "epoch": 24.0, "eval_accuracy": 0.9188118811881189, "eval_f1": 0.8657850889640667, "eval_loss": 0.4375390410423279, "eval_precision": 0.8887849766332739, "eval_recall": 0.8638055735114559, "eval_runtime": 11.0648, "eval_samples_per_second": 45.64, "eval_steps_per_second": 11.478, "step": 12108 }, { "epoch": 24.78, "learning_rate": 1.4864285714285713e-05, "loss": 0.2401, "step": 12500 }, { "epoch": 25.0, "eval_accuracy": 0.9207920792079208, "eval_f1": 0.8888781151825805, "eval_loss": 0.4757852256298065, "eval_precision": 0.8961036612926598, "eval_recall": 0.8866903929403929, "eval_runtime": 10.4698, "eval_samples_per_second": 48.234, "eval_steps_per_second": 12.13, "step": 12612 }, { "epoch": 25.77, "learning_rate": 1.545952380952381e-05, "loss": 0.2041, "step": 13000 }, { "epoch": 26.0, "eval_accuracy": 0.9425742574257425, "eval_f1": 0.9155025903592865, "eval_loss": 0.3074367940425873, "eval_precision": 0.9170299642442648, "eval_recall": 0.9228144078144078, "eval_runtime": 10.5628, "eval_samples_per_second": 47.809, "eval_steps_per_second": 12.023, "step": 13117 }, { "epoch": 26.76, "learning_rate": 1.605357142857143e-05, "loss": 0.1845, "step": 13500 }, { "epoch": 27.0, "eval_accuracy": 0.9108910891089109, "eval_f1": 0.8599750617887297, "eval_loss": 0.4771750867366791, "eval_precision": 0.864481386177137, "eval_recall": 0.8576941032823386, "eval_runtime": 11.1655, "eval_samples_per_second": 45.229, "eval_steps_per_second": 11.374, "step": 13621 }, { "epoch": 27.75, "learning_rate": 1.6648809523809525e-05, "loss": 0.1743, "step": 14000 }, { "epoch": 28.0, "eval_accuracy": 0.9386138613861386, "eval_f1": 0.9057775638831363, "eval_loss": 0.37529292702674866, "eval_precision": 0.9140135491407343, "eval_recall": 0.9027411722264663, "eval_runtime": 9.6192, "eval_samples_per_second": 52.499, "eval_steps_per_second": 13.203, "step": 14126 }, { "epoch": 28.74, "learning_rate": 1.7244047619047617e-05, "loss": 0.1539, "step": 14500 }, { "epoch": 29.0, "eval_accuracy": 0.9247524752475248, "eval_f1": 0.8866243367627531, "eval_loss": 0.5404527187347412, "eval_precision": 0.9116518987029846, "eval_recall": 0.8748301616683968, "eval_runtime": 10.8581, "eval_samples_per_second": 46.509, "eval_steps_per_second": 11.696, "step": 14630 }, { "epoch": 29.73, "learning_rate": 1.7839285714285716e-05, "loss": 0.1646, "step": 15000 }, { "epoch": 30.0, "eval_accuracy": 0.9346534653465347, "eval_f1": 0.9015438899526216, "eval_loss": 0.43599411845207214, "eval_precision": 0.9116436291187194, "eval_recall": 0.8942752998635353, "eval_runtime": 9.916, "eval_samples_per_second": 50.928, "eval_steps_per_second": 12.808, "step": 15135 }, { "epoch": 30.72, "learning_rate": 1.843452380952381e-05, "loss": 0.183, "step": 15500 }, { "epoch": 31.0, "eval_accuracy": 0.9346534653465347, "eval_f1": 0.9052713311328079, "eval_loss": 0.4353509545326233, "eval_precision": 0.9100534785215237, "eval_recall": 0.9015345357257122, "eval_runtime": 9.7228, "eval_samples_per_second": 51.94, "eval_steps_per_second": 13.062, "step": 15639 }, { "epoch": 31.71, "learning_rate": 1.9028571428571427e-05, "loss": 0.1547, "step": 16000 }, { "epoch": 32.0, "eval_accuracy": 0.9306930693069307, "eval_f1": 0.8978119183659733, "eval_loss": 0.49971604347229004, "eval_precision": 0.9138477382798044, "eval_recall": 0.888716153127918, "eval_runtime": 10.4672, "eval_samples_per_second": 48.246, "eval_steps_per_second": 12.133, "step": 16144 }, { "epoch": 32.71, "learning_rate": 1.9623809523809523e-05, "loss": 0.1658, "step": 16500 }, { "epoch": 33.0, "eval_accuracy": 0.9089108910891089, "eval_f1": 0.8687334612012699, "eval_loss": 0.5864279270172119, "eval_precision": 0.8899122777729049, "eval_recall": 0.8847601091718739, "eval_runtime": 10.5773, "eval_samples_per_second": 47.744, "eval_steps_per_second": 12.007, "step": 16648 }, { "epoch": 33.7, "learning_rate": 2.0219047619047622e-05, "loss": 0.1333, "step": 17000 }, { "epoch": 34.0, "eval_accuracy": 0.9089108910891089, "eval_f1": 0.8674149596498353, "eval_loss": 0.6616652607917786, "eval_precision": 0.8953076547670352, "eval_recall": 0.8615549809667457, "eval_runtime": 9.287, "eval_samples_per_second": 54.377, "eval_steps_per_second": 13.675, "step": 17153 }, { "epoch": 34.69, "learning_rate": 2.0814285714285714e-05, "loss": 0.1606, "step": 17500 }, { "epoch": 35.0, "eval_accuracy": 0.9346534653465347, "eval_f1": 0.9065032718742226, "eval_loss": 0.4562079906463623, "eval_precision": 0.9101611693862718, "eval_recall": 0.922783189033189, "eval_runtime": 10.427, "eval_samples_per_second": 48.432, "eval_steps_per_second": 12.18, "step": 17657 }, { "epoch": 35.68, "learning_rate": 2.140952380952381e-05, "loss": 0.1562, "step": 18000 }, { "epoch": 36.0, "eval_accuracy": 0.9346534653465347, "eval_f1": 0.9056285926854001, "eval_loss": 0.5119304060935974, "eval_precision": 0.9221614278132352, "eval_recall": 0.8947665732959851, "eval_runtime": 10.7345, "eval_samples_per_second": 47.045, "eval_steps_per_second": 11.831, "step": 18162 }, { "epoch": 36.67, "learning_rate": 2.200357142857143e-05, "loss": 0.1238, "step": 18500 }, { "epoch": 37.0, "eval_accuracy": 0.9465346534653465, "eval_f1": 0.9233277365446494, "eval_loss": 0.37833738327026367, "eval_precision": 0.9264774557165861, "eval_recall": 0.9206345615169145, "eval_runtime": 10.6894, "eval_samples_per_second": 47.243, "eval_steps_per_second": 11.881, "step": 18666 }, { "epoch": 37.66, "learning_rate": 2.2598809523809527e-05, "loss": 0.133, "step": 19000 }, { "epoch": 38.0, "eval_accuracy": 0.9207920792079208, "eval_f1": 0.88282026816653, "eval_loss": 0.44697701930999756, "eval_precision": 0.8940768234014104, "eval_recall": 0.9017844573726927, "eval_runtime": 9.8397, "eval_samples_per_second": 51.323, "eval_steps_per_second": 12.907, "step": 19171 }, { "epoch": 38.65, "learning_rate": 2.319404761904762e-05, "loss": 0.1817, "step": 19500 }, { "epoch": 39.0, "eval_accuracy": 0.9287128712871288, "eval_f1": 0.8884108101819078, "eval_loss": 0.4824526309967041, "eval_precision": 0.9067813929838341, "eval_recall": 0.8854446125769654, "eval_runtime": 10.5682, "eval_samples_per_second": 47.785, "eval_steps_per_second": 12.017, "step": 19675 }, { "epoch": 39.64, "learning_rate": 2.3789285714285715e-05, "loss": 0.1504, "step": 20000 }, { "epoch": 40.0, "eval_accuracy": 0.9346534653465347, "eval_f1": 0.9079267627717296, "eval_loss": 0.48847106099128723, "eval_precision": 0.9168877258505742, "eval_recall": 0.9021284924226101, "eval_runtime": 9.5244, "eval_samples_per_second": 53.021, "eval_steps_per_second": 13.334, "step": 20180 }, { "epoch": 40.63, "learning_rate": 2.4383333333333334e-05, "loss": 0.1367, "step": 20500 }, { "epoch": 41.0, "eval_accuracy": 0.902970297029703, "eval_f1": 0.8748563062275386, "eval_loss": 0.6201313734054565, "eval_precision": 0.8975989253974328, "eval_recall": 0.8675623151358445, "eval_runtime": 11.0171, "eval_samples_per_second": 45.838, "eval_steps_per_second": 11.528, "step": 20684 }, { "epoch": 41.63, "learning_rate": 2.497857142857143e-05, "loss": 0.1786, "step": 21000 }, { "epoch": 42.0, "eval_accuracy": 0.9089108910891089, "eval_f1": 0.8833714971261983, "eval_loss": 0.6504853963851929, "eval_precision": 0.9036762862738423, "eval_recall": 0.8743047475400418, "eval_runtime": 9.3899, "eval_samples_per_second": 53.781, "eval_steps_per_second": 13.525, "step": 21189 }, { "epoch": 42.62, "learning_rate": 2.5573809523809525e-05, "loss": 0.1589, "step": 21500 }, { "epoch": 43.0, "eval_accuracy": 0.9504950495049505, "eval_f1": 0.9268454843019528, "eval_loss": 0.35494372248649597, "eval_precision": 0.9327534998068862, "eval_recall": 0.9231311498958558, "eval_runtime": 10.3634, "eval_samples_per_second": 48.729, "eval_steps_per_second": 12.255, "step": 21693 }, { "epoch": 43.61, "learning_rate": 2.616904761904762e-05, "loss": 0.0857, "step": 22000 }, { "epoch": 44.0, "eval_accuracy": 0.9485148514851485, "eval_f1": 0.9224485798890482, "eval_loss": 0.41820821166038513, "eval_precision": 0.9441624977223921, "eval_recall": 0.9108187890540833, "eval_runtime": 9.3522, "eval_samples_per_second": 53.998, "eval_steps_per_second": 13.58, "step": 22198 }, { "epoch": 44.6, "learning_rate": 2.6763095238095236e-05, "loss": 0.102, "step": 22500 }, { "epoch": 45.0, "eval_accuracy": 0.9564356435643564, "eval_f1": 0.9306293793472796, "eval_loss": 0.29131555557250977, "eval_precision": 0.9291726584104362, "eval_recall": 0.9330733318968613, "eval_runtime": 9.5553, "eval_samples_per_second": 52.85, "eval_steps_per_second": 13.291, "step": 22702 } ], "max_steps": 252000, "num_train_epochs": 500, "total_flos": 1.9381803431060155e+18, "trial_name": null, "trial_params": null }