ekinakyurek's picture
Upload folder using huggingface_hub
0bfc910 verified
Step 1 | loss:0.3976413607597351 lr:7.142857142857143e-06 tokens_per_second_per_gpu:4387.33097149148
Step 2 | loss:0.4746507406234741 lr:1.4285714285714285e-05 tokens_per_second_per_gpu:7046.771919113339
Step 3 | loss:0.5802071690559387 lr:2.1428571428571428e-05 tokens_per_second_per_gpu:4441.457747803339
Step 4 | loss:0.3701060712337494 lr:2.857142857142857e-05 tokens_per_second_per_gpu:3650.942026101787
Step 5 | loss:0.29193297028541565 lr:3.571428571428572e-05 tokens_per_second_per_gpu:7054.909182210228
Step 6 | loss:0.3760976493358612 lr:4.2857142857142856e-05 tokens_per_second_per_gpu:7048.127250577496
Step 7 | loss:0.30446043610572815 lr:5e-05 tokens_per_second_per_gpu:7004.479201913858
Step 8 | loss:0.2387136071920395 lr:5.714285714285714e-05 tokens_per_second_per_gpu:3635.2249497418134
Step 9 | loss:0.18914680182933807 lr:6.428571428571429e-05 tokens_per_second_per_gpu:7000.457628689596
Step 10 | loss:0.3021690249443054 lr:7.142857142857143e-05 tokens_per_second_per_gpu:3653.480383661073
Step 11 | loss:0.2643088400363922 lr:7.857142857142858e-05 tokens_per_second_per_gpu:7031.93886765673
Step 12 | loss:0.16139991581439972 lr:8.571428571428571e-05 tokens_per_second_per_gpu:7054.891881433595
Step 13 | loss:0.06389950215816498 lr:9.285714285714286e-05 tokens_per_second_per_gpu:7062.824086928561
Step 14 | loss:0.05389096215367317 lr:0.0001 tokens_per_second_per_gpu:6978.212457022643
Step 15 | loss:0.004962658975273371 lr:9.998540070400966e-05 tokens_per_second_per_gpu:7094.870508500684
Step 16 | loss:0.06835552304983139 lr:9.994161134161634e-05 tokens_per_second_per_gpu:7080.695171098817
Step 17 | loss:0.014511780813336372 lr:9.986865748457457e-05 tokens_per_second_per_gpu:7080.545751630988
Step 18 | loss:0.03110644780099392 lr:9.976658173588244e-05 tokens_per_second_per_gpu:7061.977848624417
Step 19 | loss:0.027998723089694977 lr:9.96354437049027e-05 tokens_per_second_per_gpu:7051.413746664214
Step 20 | loss:0.0016048968536779284 lr:9.947531997255256e-05 tokens_per_second_per_gpu:7072.95803556782
Step 21 | loss:0.0029742333572357893 lr:9.928630404658255e-05 tokens_per_second_per_gpu:7107.2350546314165
Step 22 | loss:0.1135089248418808 lr:9.906850630697068e-05 tokens_per_second_per_gpu:7099.6584834141795
Step 23 | loss:0.2154047191143036 lr:9.882205394146361e-05 tokens_per_second_per_gpu:6990.463171422535
Step 24 | loss:0.00014675623970106244 lr:9.85470908713026e-05 tokens_per_second_per_gpu:7077.068869286243
Step 25 | loss:0.005645472556352615 lr:9.824377766717759e-05 tokens_per_second_per_gpu:7034.6838610765935
Step 26 | loss:0.0033204536885023117 lr:9.791229145545831e-05 tokens_per_second_per_gpu:7055.132190501445
Step 27 | loss:0.0036917459219694138 lr:9.755282581475769e-05 tokens_per_second_per_gpu:6952.847454332674
Step 28 | loss:0.22804421186447144 lr:9.716559066288715e-05 tokens_per_second_per_gpu:7065.180293736694
Step 29 | loss:0.0006192383007146418 lr:9.675081213427076e-05 tokens_per_second_per_gpu:7082.469783413299
Step 30 | loss:0.1948409229516983 lr:9.630873244788883e-05 tokens_per_second_per_gpu:7116.496655640619
Step 31 | loss:0.001953623490408063 lr:9.583960976582913e-05 tokens_per_second_per_gpu:7068.683913098268
Step 32 | loss:0.028155503794550896 lr:9.534371804252728e-05 tokens_per_second_per_gpu:7106.8162841544345
Step 33 | loss:0.031163187697529793 lr:9.482134686478519e-05 tokens_per_second_per_gpu:7040.198115725953
Step 34 | loss:0.10317869484424591 lr:9.42728012826605e-05 tokens_per_second_per_gpu:7107.951321874265
Step 35 | loss:0.01820056512951851 lr:9.36984016313259e-05 tokens_per_second_per_gpu:7099.987925795883
Step 36 | loss:0.008487297222018242 lr:9.309848334400246e-05 tokens_per_second_per_gpu:7042.305235525406
Step 37 | loss:0.01901382766664028 lr:9.247339675607605e-05 tokens_per_second_per_gpu:7001.366513365121
Step 38 | loss:0.23592135310173035 lr:9.182350690051133e-05 tokens_per_second_per_gpu:7086.116383351857
Step 39 | loss:0.02220093458890915 lr:9.114919329468282e-05 tokens_per_second_per_gpu:7073.70908732324
Step 40 | loss:0.022929463535547256 lr:9.045084971874738e-05 tokens_per_second_per_gpu:7014.8608774174445
Step 41 | loss:0.005184915382415056 lr:8.972888398568772e-05 tokens_per_second_per_gpu:7075.633299830602
Step 42 | loss:0.004354758653789759 lr:8.898371770316111e-05 tokens_per_second_per_gpu:6995.816885875575
Step 43 | loss:0.016170775517821312 lr:8.821578602729242e-05 tokens_per_second_per_gpu:7047.180771065604
Step 44 | loss:0.04515088349580765 lr:8.742553740855506e-05 tokens_per_second_per_gpu:6989.257110829968
Step 45 | loss:0.005793048068881035 lr:8.661343332988869e-05 tokens_per_second_per_gpu:7001.282624010805
Step 46 | loss:0.031016428023576736 lr:8.577994803720606e-05 tokens_per_second_per_gpu:7073.359473708103
Step 47 | loss:0.0024100204464048147 lr:8.492556826244687e-05 tokens_per_second_per_gpu:7083.689818088879
Step 48 | loss:0.0013836832949891686 lr:8.405079293933986e-05 tokens_per_second_per_gpu:7095.462200391597
Step 49 | loss:0.020225223153829575 lr:8.315613291203976e-05 tokens_per_second_per_gpu:7070.793714987635
Step 50 | loss:0.03904259204864502 lr:8.224211063680853e-05 tokens_per_second_per_gpu:7037.125376052126
Step 51 | loss:0.0007925322279334068 lr:8.130925987691569e-05 tokens_per_second_per_gpu:7089.021121315338
Step 52 | loss:0.0007487083203159273 lr:8.035812539093557e-05 tokens_per_second_per_gpu:7005.65828480073
Step 53 | loss:0.0004370383685454726 lr:7.938926261462366e-05 tokens_per_second_per_gpu:7095.577473215524
Step 54 | loss:0.0003041003365069628 lr:7.840323733655778e-05 tokens_per_second_per_gpu:7040.050712662494
Step 55 | loss:0.0003498854348435998 lr:7.740062536773352e-05 tokens_per_second_per_gpu:7005.2896717083595
Step 56 | loss:0.001033964566886425 lr:7.638201220530665e-05 tokens_per_second_per_gpu:6449.390348935749
Step 57 | loss:0.001258775359019637 lr:7.534799269067953e-05 tokens_per_second_per_gpu:7080.796782474087
Step 58 | loss:0.0003872970410156995 lr:7.42991706621303e-05 tokens_per_second_per_gpu:7033.900995838476
Step 59 | loss:0.0007584329578094184 lr:7.323615860218843e-05 tokens_per_second_per_gpu:7039.39230195007
Step 60 | loss:0.00048399902880191803 lr:7.215957727996207e-05 tokens_per_second_per_gpu:7076.972439544092
Step 61 | loss:0.024205604568123817 lr:7.107005538862646e-05 tokens_per_second_per_gpu:7028.327432378212
Step 62 | loss:0.000488930381834507 lr:6.996822917828477e-05 tokens_per_second_per_gpu:7049.323732093044
Step 63 | loss:0.0008218801813200116 lr:6.885474208441603e-05 tokens_per_second_per_gpu:7110.994278084172
Step 64 | loss:0.000323367741657421 lr:6.773024435212678e-05 tokens_per_second_per_gpu:6986.106951168045
Step 65 | loss:0.0090135233476758 lr:6.659539265642643e-05 tokens_per_second_per_gpu:7081.8448028919165
Step 66 | loss:0.021819528192281723 lr:6.545084971874738e-05 tokens_per_second_per_gpu:7027.288072933722
Step 67 | loss:0.0001219737678184174 lr:6.429728391993446e-05 tokens_per_second_per_gpu:7101.299265074336
Step 68 | loss:0.00042896269587799907 lr:6.313536890992935e-05 tokens_per_second_per_gpu:7035.014536986565
Step 69 | loss:0.00024019887496251613 lr:6.19657832143779e-05 tokens_per_second_per_gpu:7094.029889528228
Step 70 | loss:0.00027156350552104414 lr:6.078920983839031e-05 tokens_per_second_per_gpu:7064.04435745588
Step 71 | loss:0.00026911497116088867 lr:5.960633586768543e-05 tokens_per_second_per_gpu:7002.170548741391
Step 72 | loss:0.00011789762356784195 lr:5.841785206735192e-05 tokens_per_second_per_gpu:7033.749827293848
Step 73 | loss:0.013994992710649967 lr:5.7224452478461064e-05 tokens_per_second_per_gpu:7080.505024551126
Step 74 | loss:0.004337406251579523 lr:5.602683401276615e-05 tokens_per_second_per_gpu:7067.711243193472
Step 75 | loss:0.0001856393355410546 lr:5.482569604572576e-05 tokens_per_second_per_gpu:7007.235564136566
Step 76 | loss:0.00028253145865164697 lr:5.3621740008088126e-05 tokens_per_second_per_gpu:7051.783496806089
Step 77 | loss:0.010676591657102108 lr:5.2415668976275355e-05 tokens_per_second_per_gpu:7044.504088621025
Step 78 | loss:0.008452359586954117 lr:5.1208187261806615e-05 tokens_per_second_per_gpu:7041.063474352369
Step 79 | loss:0.008152920752763748 lr:5e-05 tokens_per_second_per_gpu:7054.884905406015
Step 80 | loss:0.00012812706700060517 lr:4.87918127381934e-05 tokens_per_second_per_gpu:7049.187430031825
Step 81 | loss:0.00015965537750162184 lr:4.758433102372466e-05 tokens_per_second_per_gpu:7019.442946525232
Step 82 | loss:0.0005481685511767864 lr:4.6378259991911886e-05 tokens_per_second_per_gpu:7106.228580666165
Step 83 | loss:0.0017840424552559853 lr:4.5174303954274244e-05 tokens_per_second_per_gpu:6747.494205103823
Step 84 | loss:6.595534068765119e-05 lr:4.397316598723385e-05 tokens_per_second_per_gpu:7039.49118431042
Step 85 | loss:0.00012897995475213975 lr:4.277554752153895e-05 tokens_per_second_per_gpu:6967.289965847177
Step 86 | loss:0.00013318043784238398 lr:4.1582147932648074e-05 tokens_per_second_per_gpu:7032.456681434574
Step 87 | loss:3.906681013177149e-05 lr:4.039366413231458e-05 tokens_per_second_per_gpu:7088.097722997256
Step 88 | loss:0.009910757653415203 lr:3.92107901616097e-05 tokens_per_second_per_gpu:7025.919055623729
Step 89 | loss:0.00014327328244689852 lr:3.803421678562213e-05 tokens_per_second_per_gpu:7091.061197924152
Step 90 | loss:0.0006904987385496497 lr:3.6864631090070655e-05 tokens_per_second_per_gpu:7079.044432956364
Step 91 | loss:5.691125988960266e-05 lr:3.570271608006555e-05 tokens_per_second_per_gpu:7092.186722898353
Step 92 | loss:0.00014364490925800055 lr:3.4549150281252636e-05 tokens_per_second_per_gpu:7031.548529214516
Step 93 | loss:2.911785850301385e-05 lr:3.340460734357359e-05 tokens_per_second_per_gpu:7084.93582194312
Step 94 | loss:0.010363278910517693 lr:3.226975564787322e-05 tokens_per_second_per_gpu:7067.990198534879
Step 95 | loss:0.00011910690955119208 lr:3.114525791558398e-05 tokens_per_second_per_gpu:7049.43438712702
Step 96 | loss:0.00010278833360644057 lr:3.003177082171523e-05 tokens_per_second_per_gpu:7089.369427748514
Step 97 | loss:0.00011334926966810599 lr:2.8929944611373554e-05 tokens_per_second_per_gpu:7068.049350904839
Step 98 | loss:0.0006340955733321607 lr:2.784042272003794e-05 tokens_per_second_per_gpu:6999.157150269119
Step 99 | loss:4.746837657876313e-05 lr:2.6763841397811573e-05 tokens_per_second_per_gpu:7085.416591844248
Step 100 | loss:9.409170161234215e-05 lr:2.57008293378697e-05 tokens_per_second_per_gpu:7060.101883679769
Step 101 | loss:0.00048770103603601456 lr:2.4652007309320498e-05 tokens_per_second_per_gpu:7061.343400491998
Step 102 | loss:6.129792018327862e-05 lr:2.361798779469336e-05 tokens_per_second_per_gpu:7076.0131939305875
Step 103 | loss:0.00026846263790503144 lr:2.259937463226651e-05 tokens_per_second_per_gpu:7092.986078107651
Step 104 | loss:8.247521327575669e-05 lr:2.1596762663442218e-05 tokens_per_second_per_gpu:7076.138196245383
Step 105 | loss:0.00042858082451857626 lr:2.061073738537635e-05 tokens_per_second_per_gpu:7041.480584517925
Step 106 | loss:0.00011575245298445225 lr:1.9641874609064443e-05 tokens_per_second_per_gpu:7044.155775288206
Step 107 | loss:0.0002363687672186643 lr:1.8690740123084316e-05 tokens_per_second_per_gpu:7039.088495780087
Step 108 | loss:0.00013456822489388287 lr:1.7757889363191483e-05 tokens_per_second_per_gpu:7026.446112249914
Step 109 | loss:0.00023838593915570527 lr:1.684386708796025e-05 tokens_per_second_per_gpu:6988.987171634248
Step 110 | loss:0.010115381330251694 lr:1.5949207060660138e-05 tokens_per_second_per_gpu:6990.197337009686
Step 111 | loss:0.0018934216350317001 lr:1.5074431737553157e-05 tokens_per_second_per_gpu:6743.573212451079
Step 112 | loss:0.00025214170455001295 lr:1.422005196279395e-05 tokens_per_second_per_gpu:7025.532954679914
Step 113 | loss:0.00011945638107135892 lr:1.338656667011134e-05 tokens_per_second_per_gpu:7092.483810363859
Step 114 | loss:0.006380931008607149 lr:1.257446259144494e-05 tokens_per_second_per_gpu:7065.781623665797
Step 115 | loss:0.0001420805201632902 lr:1.178421397270758e-05 tokens_per_second_per_gpu:7040.162976437409
Step 116 | loss:2.3789141778252088e-05 lr:1.1016282296838887e-05 tokens_per_second_per_gpu:7082.35597686502
Step 117 | loss:0.00016184583364520222 lr:1.0271116014312293e-05 tokens_per_second_per_gpu:7038.865444358449
Step 118 | loss:0.0001335080887656659 lr:9.549150281252633e-06 tokens_per_second_per_gpu:7044.235297789802
Step 119 | loss:0.0001501671940786764 lr:8.850806705317183e-06 tokens_per_second_per_gpu:7053.522194978602
Step 120 | loss:0.00013162194227334112 lr:8.176493099488663e-06 tokens_per_second_per_gpu:6990.745679143501
Step 121 | loss:7.372390246018767e-05 lr:7.526603243923957e-06 tokens_per_second_per_gpu:7029.204090451401
Step 122 | loss:7.230928895296529e-05 lr:6.901516655997536e-06 tokens_per_second_per_gpu:7043.215127199049
Step 123 | loss:0.016294578090310097 lr:6.301598368674105e-06 tokens_per_second_per_gpu:7043.729432972243
Step 124 | loss:7.895987801020965e-05 lr:5.727198717339511e-06 tokens_per_second_per_gpu:7042.397870377773
Step 125 | loss:7.259850099217147e-05 lr:5.178653135214812e-06 tokens_per_second_per_gpu:7097.333393315824
Step 126 | loss:0.00013783213216811419 lr:4.65628195747273e-06 tokens_per_second_per_gpu:7042.014185173458
Step 127 | loss:5.2182000217726454e-05 lr:4.16039023417088e-06 tokens_per_second_per_gpu:7103.783211933851
Step 128 | loss:0.00011623362661339343 lr:3.691267552111183e-06 tokens_per_second_per_gpu:7098.414811978706
Step 129 | loss:0.00022878099116496742 lr:3.249187865729264e-06 tokens_per_second_per_gpu:7030.433996536005
Step 130 | loss:0.00012151605187682435 lr:2.8344093371128424e-06 tokens_per_second_per_gpu:7048.249517506304
Step 131 | loss:0.005570061970502138 lr:2.4471741852423237e-06 tokens_per_second_per_gpu:7103.051110722025
Step 132 | loss:0.004175185225903988 lr:2.087708544541689e-06 tokens_per_second_per_gpu:7083.1205921836545
Step 133 | loss:0.0012934468686580658 lr:1.7562223328224325e-06 tokens_per_second_per_gpu:7076.4735457157
Step 134 | loss:0.0003043202741537243 lr:1.4529091286973995e-06 tokens_per_second_per_gpu:7007.0723535837415
Step 135 | loss:0.00012435253302101046 lr:1.1779460585363944e-06 tokens_per_second_per_gpu:6999.941285882035
Step 136 | loss:7.059708150336519e-05 lr:9.314936930293283e-07 tokens_per_second_per_gpu:7051.144100102408
Step 137 | loss:7.489723793696612e-05 lr:7.136959534174592e-07 tokens_per_second_per_gpu:7038.938613254926
Step 138 | loss:0.00018304510740563273 lr:5.246800274474439e-07 tokens_per_second_per_gpu:7094.057370184806
Step 139 | loss:2.5133847884717397e-05 lr:3.6455629509730136e-07 tokens_per_second_per_gpu:7088.270784451943
Step 140 | loss:5.754767335020006e-05 lr:2.334182641175686e-07 tokens_per_second_per_gpu:6740.353266839451
Step 141 | loss:0.00025972671573981643 lr:1.3134251542544774e-07 tokens_per_second_per_gpu:7015.591582218172
Step 142 | loss:0.00014096495578996837 lr:5.838865838366792e-08 tokens_per_second_per_gpu:7089.274483788882
Step 143 | loss:3.88710577681195e-05 lr:1.4599295990352924e-08 tokens_per_second_per_gpu:7101.736124023101
Step 144 | loss:7.034815644146875e-05 lr:0.0 tokens_per_second_per_gpu:7082.976961344536