ekinakyurek's picture
Upload folder using huggingface_hub
0bfc910 verified
Step 1 | loss:0.10024691373109818 lr:7.142857142857143e-06 tokens_per_second_per_gpu:4583.321243710701
Step 2 | loss:0.023647034540772438 lr:1.4285714285714285e-05 tokens_per_second_per_gpu:6938.074327630863
Step 3 | loss:0.02387063205242157 lr:2.1428571428571428e-05 tokens_per_second_per_gpu:6897.657156234389
Step 4 | loss:0.07519605755805969 lr:2.857142857142857e-05 tokens_per_second_per_gpu:3911.213205149061
Step 5 | loss:0.02532012201845646 lr:3.571428571428572e-05 tokens_per_second_per_gpu:7002.137200395904
Step 6 | loss:0.023282630369067192 lr:4.2857142857142856e-05 tokens_per_second_per_gpu:7015.718316364376
Step 7 | loss:0.022276749834418297 lr:5e-05 tokens_per_second_per_gpu:6915.629494510841
Step 8 | loss:0.025258788838982582 lr:5.714285714285714e-05 tokens_per_second_per_gpu:7018.809618517136
Step 9 | loss:0.021709633991122246 lr:6.428571428571429e-05 tokens_per_second_per_gpu:6898.1979706469765
Step 10 | loss:0.01784304529428482 lr:7.142857142857143e-05 tokens_per_second_per_gpu:7003.646840147428
Step 11 | loss:0.026490256190299988 lr:7.857142857142858e-05 tokens_per_second_per_gpu:7001.6826328278885
Step 12 | loss:0.02348017320036888 lr:8.571428571428571e-05 tokens_per_second_per_gpu:6994.987074543855
Step 13 | loss:0.022985221818089485 lr:9.285714285714286e-05 tokens_per_second_per_gpu:6992.638298778566
Step 14 | loss:0.018697993829846382 lr:0.0001 tokens_per_second_per_gpu:6863.10524670486
Step 15 | loss:0.014765052124857903 lr:9.998540070400966e-05 tokens_per_second_per_gpu:6951.9715721079565
Step 16 | loss:0.022365931421518326 lr:9.994161134161634e-05 tokens_per_second_per_gpu:6981.337203901021
Step 17 | loss:0.05649026483297348 lr:9.986865748457457e-05 tokens_per_second_per_gpu:7009.5567610140815
Step 18 | loss:0.0318923257291317 lr:9.976658173588244e-05 tokens_per_second_per_gpu:6922.587430110067
Step 19 | loss:0.016176583245396614 lr:9.96354437049027e-05 tokens_per_second_per_gpu:6940.190527434353
Step 20 | loss:0.01595062017440796 lr:9.947531997255256e-05 tokens_per_second_per_gpu:7023.161199039168
Step 21 | loss:0.015316289849579334 lr:9.928630404658255e-05 tokens_per_second_per_gpu:6982.613829344765
Step 22 | loss:0.011035650037229061 lr:9.906850630697068e-05 tokens_per_second_per_gpu:7012.302602884556
Step 23 | loss:0.03260388225317001 lr:9.882205394146361e-05 tokens_per_second_per_gpu:6887.270682840358
Step 24 | loss:0.015518075786530972 lr:9.85470908713026e-05 tokens_per_second_per_gpu:7006.044381306182
Step 25 | loss:0.015447852201759815 lr:9.824377766717759e-05 tokens_per_second_per_gpu:6915.76592256907
Step 26 | loss:0.013797895051538944 lr:9.791229145545831e-05 tokens_per_second_per_gpu:6906.235391792908
Step 27 | loss:0.01218175608664751 lr:9.755282581475769e-05 tokens_per_second_per_gpu:6858.8187382414
Step 28 | loss:0.026370855048298836 lr:9.716559066288715e-05 tokens_per_second_per_gpu:7023.113031703748
Step 29 | loss:0.011667471379041672 lr:9.675081213427076e-05 tokens_per_second_per_gpu:7019.497075876892
Step 30 | loss:0.017424099147319794 lr:9.630873244788883e-05 tokens_per_second_per_gpu:6997.919041996808
Step 31 | loss:0.009037600830197334 lr:9.583960976582913e-05 tokens_per_second_per_gpu:7038.358324539131
Step 32 | loss:0.015969621017575264 lr:9.534371804252728e-05 tokens_per_second_per_gpu:6974.510387784
Step 33 | loss:0.014194541610777378 lr:9.482134686478519e-05 tokens_per_second_per_gpu:6921.971902116589
Step 34 | loss:0.013328947126865387 lr:9.42728012826605e-05 tokens_per_second_per_gpu:7004.786361688654
Step 35 | loss:0.011736427433788776 lr:9.36984016313259e-05 tokens_per_second_per_gpu:6969.668069383325
Step 36 | loss:0.006934679113328457 lr:9.309848334400246e-05 tokens_per_second_per_gpu:6917.899976363562
Step 37 | loss:0.015996329486370087 lr:9.247339675607605e-05 tokens_per_second_per_gpu:6868.23353755549
Step 38 | loss:0.013972129672765732 lr:9.182350690051133e-05 tokens_per_second_per_gpu:7011.19961150869
Step 39 | loss:0.007269518915563822 lr:9.114919329468282e-05 tokens_per_second_per_gpu:7019.325300895336
Step 40 | loss:0.007446694653481245 lr:9.045084971874738e-05 tokens_per_second_per_gpu:6862.117292008655
Step 41 | loss:0.007477952633053064 lr:8.972888398568772e-05 tokens_per_second_per_gpu:7019.174745813871
Step 42 | loss:0.004168596584349871 lr:8.898371770316111e-05 tokens_per_second_per_gpu:6876.518463407085
Step 43 | loss:0.007125674281269312 lr:8.821578602729242e-05 tokens_per_second_per_gpu:6935.009281658902
Step 44 | loss:0.006291029043495655 lr:8.742553740855506e-05 tokens_per_second_per_gpu:6865.1890227534805
Step 45 | loss:0.012491370551288128 lr:8.661343332988869e-05 tokens_per_second_per_gpu:6863.581154456449
Step 46 | loss:0.00862965453416109 lr:8.577994803720606e-05 tokens_per_second_per_gpu:7017.835775931079
Step 47 | loss:0.009417916648089886 lr:8.492556826244687e-05 tokens_per_second_per_gpu:7017.723675375908
Step 48 | loss:0.0077200401574373245 lr:8.405079293933986e-05 tokens_per_second_per_gpu:6976.398607427418
Step 49 | loss:0.008464200422167778 lr:8.315613291203976e-05 tokens_per_second_per_gpu:6984.192648191455
Step 50 | loss:0.0077700428664684296 lr:8.224211063680853e-05 tokens_per_second_per_gpu:6917.216628813551
Step 51 | loss:0.00739700673148036 lr:8.130925987691569e-05 tokens_per_second_per_gpu:7026.612526356554
Step 52 | loss:0.0052774157375097275 lr:8.035812539093557e-05 tokens_per_second_per_gpu:6865.801630168117
Step 53 | loss:0.007715026848018169 lr:7.938926261462366e-05 tokens_per_second_per_gpu:7007.199568220739
Step 54 | loss:0.006663809064775705 lr:7.840323733655778e-05 tokens_per_second_per_gpu:6915.185238019109
Step 55 | loss:0.005782071501016617 lr:7.740062536773352e-05 tokens_per_second_per_gpu:6857.522111785746
Step 56 | loss:0.006561202462762594 lr:7.638201220530665e-05 tokens_per_second_per_gpu:6414.259029138643
Step 57 | loss:0.003897438058629632 lr:7.534799269067953e-05 tokens_per_second_per_gpu:6979.662067193898
Step 58 | loss:0.00614685844630003 lr:7.42991706621303e-05 tokens_per_second_per_gpu:6899.049558249507
Step 59 | loss:0.005672368220984936 lr:7.323615860218843e-05 tokens_per_second_per_gpu:6878.492149278483
Step 60 | loss:0.01083806250244379 lr:7.215957727996207e-05 tokens_per_second_per_gpu:7012.251186571321
Step 61 | loss:0.008443303406238556 lr:7.107005538862646e-05 tokens_per_second_per_gpu:6900.98933572015
Step 62 | loss:0.003191221272572875 lr:6.996822917828477e-05 tokens_per_second_per_gpu:6889.772102778847
Step 63 | loss:0.0027337544597685337 lr:6.885474208441603e-05 tokens_per_second_per_gpu:6969.968073051965
Step 64 | loss:0.00623043067753315 lr:6.773024435212678e-05 tokens_per_second_per_gpu:6845.930664139265
Step 65 | loss:0.004524786490947008 lr:6.659539265642643e-05 tokens_per_second_per_gpu:7002.489102762099
Step 66 | loss:0.006836552172899246 lr:6.545084971874738e-05 tokens_per_second_per_gpu:6897.611865607451
Step 67 | loss:0.0064527979120612144 lr:6.429728391993446e-05 tokens_per_second_per_gpu:6999.255923538334
Step 68 | loss:0.0016915047308430076 lr:6.313536890992935e-05 tokens_per_second_per_gpu:6894.982856699067
Step 69 | loss:0.0036256222520023584 lr:6.19657832143779e-05 tokens_per_second_per_gpu:6954.070853158444
Step 70 | loss:0.005240947008132935 lr:6.078920983839031e-05 tokens_per_second_per_gpu:6885.805856215745
Step 71 | loss:0.003947566729038954 lr:5.960633586768543e-05 tokens_per_second_per_gpu:6835.939529608826
Step 72 | loss:0.005052132066339254 lr:5.841785206735192e-05 tokens_per_second_per_gpu:6896.498201620746
Step 73 | loss:0.0013588801957666874 lr:5.7224452478461064e-05 tokens_per_second_per_gpu:6952.052319452199
Step 74 | loss:0.0011387164704501629 lr:5.602683401276615e-05 tokens_per_second_per_gpu:6991.216118595824
Step 75 | loss:0.0018659229390323162 lr:5.482569604572576e-05 tokens_per_second_per_gpu:6832.440882160264
Step 76 | loss:0.0012839846312999725 lr:5.3621740008088126e-05 tokens_per_second_per_gpu:6917.723882328642
Step 77 | loss:0.003197891404852271 lr:5.2415668976275355e-05 tokens_per_second_per_gpu:6891.33413958513
Step 78 | loss:0.005687285214662552 lr:5.1208187261806615e-05 tokens_per_second_per_gpu:6908.851794702181
Step 79 | loss:0.001178545760922134 lr:5e-05 tokens_per_second_per_gpu:6927.355837515878
Step 80 | loss:0.003518831916153431 lr:4.87918127381934e-05 tokens_per_second_per_gpu:6912.995180461183
Step 81 | loss:0.0017946312436833978 lr:4.758433102372466e-05 tokens_per_second_per_gpu:6843.33255108009
Step 82 | loss:0.0012526096543297172 lr:4.6378259991911886e-05 tokens_per_second_per_gpu:7015.113222309543
Step 83 | loss:0.0022810865193605423 lr:4.5174303954274244e-05 tokens_per_second_per_gpu:6748.670165193532
Step 84 | loss:0.0016417813021689653 lr:4.397316598723385e-05 tokens_per_second_per_gpu:6980.760355683479
Step 85 | loss:0.0024414248764514923 lr:4.277554752153895e-05 tokens_per_second_per_gpu:6852.974245611611
Step 86 | loss:0.00044921773951500654 lr:4.1582147932648074e-05 tokens_per_second_per_gpu:6902.617019075371
Step 87 | loss:0.001129858777858317 lr:4.039366413231458e-05 tokens_per_second_per_gpu:6990.2829722421
Step 88 | loss:0.0025706635788083076 lr:3.92107901616097e-05 tokens_per_second_per_gpu:6890.096558576418
Step 89 | loss:0.0005976815009489655 lr:3.803421678562213e-05 tokens_per_second_per_gpu:6945.408765948965
Step 90 | loss:0.00039021173142828047 lr:3.6864631090070655e-05 tokens_per_second_per_gpu:6988.930840550452
Step 91 | loss:0.001592149375937879 lr:3.570271608006555e-05 tokens_per_second_per_gpu:6966.768300104295
Step 92 | loss:0.0025845523923635483 lr:3.4549150281252636e-05 tokens_per_second_per_gpu:6878.998152123706
Step 93 | loss:0.0004198434471618384 lr:3.340460734357359e-05 tokens_per_second_per_gpu:6994.41734678438
Step 94 | loss:0.0006986663793213665 lr:3.226975564787322e-05 tokens_per_second_per_gpu:7022.170100715857
Step 95 | loss:0.0005265998770482838 lr:3.114525791558398e-05 tokens_per_second_per_gpu:6916.213959849475
Step 96 | loss:0.0003572702407836914 lr:3.003177082171523e-05 tokens_per_second_per_gpu:7007.761966195305
Step 97 | loss:0.002319352701306343 lr:2.8929944611373554e-05 tokens_per_second_per_gpu:7015.240346715464
Step 98 | loss:0.0002951623173430562 lr:2.784042272003794e-05 tokens_per_second_per_gpu:6853.09451537476
Step 99 | loss:0.0023552333004772663 lr:2.6763841397811573e-05 tokens_per_second_per_gpu:7003.349844458944
Step 100 | loss:0.0010486695682629943 lr:2.57008293378697e-05 tokens_per_second_per_gpu:6914.1421456426315
Step 101 | loss:0.0014828420244157314 lr:2.4652007309320498e-05 tokens_per_second_per_gpu:6919.3599059052085
Step 102 | loss:0.001046987483277917 lr:2.361798779469336e-05 tokens_per_second_per_gpu:7018.303720984614
Step 103 | loss:0.0007703774608671665 lr:2.259937463226651e-05 tokens_per_second_per_gpu:6997.179630158057
Step 104 | loss:0.001767762703821063 lr:2.1596762663442218e-05 tokens_per_second_per_gpu:7017.017781364177
Step 105 | loss:0.0020840901415795088 lr:2.061073738537635e-05 tokens_per_second_per_gpu:6915.254221032149
Step 106 | loss:0.0013560941442847252 lr:1.9641874609064443e-05 tokens_per_second_per_gpu:6920.728349299234
Step 107 | loss:0.0006648179842159152 lr:1.8690740123084316e-05 tokens_per_second_per_gpu:6920.9890153201495
Step 108 | loss:0.0008464287384413183 lr:1.7757889363191483e-05 tokens_per_second_per_gpu:6917.507789378698
Step 109 | loss:0.00015384129073936492 lr:1.684386708796025e-05 tokens_per_second_per_gpu:6864.086643701145
Step 110 | loss:0.0005378327332437038 lr:1.5949207060660138e-05 tokens_per_second_per_gpu:6868.0858312367045
Step 111 | loss:0.0004026291717309505 lr:1.5074431737553157e-05 tokens_per_second_per_gpu:6780.15937878548
Step 112 | loss:0.0007237880490720272 lr:1.422005196279395e-05 tokens_per_second_per_gpu:6903.6839392299025
Step 113 | loss:0.0005907716695219278 lr:1.338656667011134e-05 tokens_per_second_per_gpu:7011.173840904926
Step 114 | loss:0.00041386214434169233 lr:1.257446259144494e-05 tokens_per_second_per_gpu:6994.66878312238
Step 115 | loss:7.937858026707545e-05 lr:1.178421397270758e-05 tokens_per_second_per_gpu:6905.1653341429
Step 116 | loss:0.00016324411262758076 lr:1.1016282296838887e-05 tokens_per_second_per_gpu:7011.066946317102
Step 117 | loss:0.00029951773467473686 lr:1.0271116014312293e-05 tokens_per_second_per_gpu:6933.241434456813
Step 118 | loss:0.00016951235011219978 lr:9.549150281252633e-06 tokens_per_second_per_gpu:6898.310324571846
Step 119 | loss:0.0005056647933088243 lr:8.850806705317183e-06 tokens_per_second_per_gpu:6932.130944971414
Step 120 | loss:0.0004128507280256599 lr:8.176493099488663e-06 tokens_per_second_per_gpu:6842.094975073847
Step 121 | loss:0.0009206223767250776 lr:7.526603243923957e-06 tokens_per_second_per_gpu:6918.615697688258
Step 122 | loss:0.0005813115276396275 lr:6.901516655997536e-06 tokens_per_second_per_gpu:6903.401522562443
Step 123 | loss:0.0008506886078976095 lr:6.301598368674105e-06 tokens_per_second_per_gpu:6910.656851139456
Step 124 | loss:0.00016624793352093548 lr:5.727198717339511e-06 tokens_per_second_per_gpu:6941.196972437045
Step 125 | loss:0.0001036522735375911 lr:5.178653135214812e-06 tokens_per_second_per_gpu:7025.467779138263
Step 126 | loss:0.0002599183062557131 lr:4.65628195747273e-06 tokens_per_second_per_gpu:6921.640773097841
Step 127 | loss:0.00042629698873497546 lr:4.16039023417088e-06 tokens_per_second_per_gpu:7011.144720715902
Step 128 | loss:0.0004723415186163038 lr:3.691267552111183e-06 tokens_per_second_per_gpu:7012.9729316116955
Step 129 | loss:0.00017131032655015588 lr:3.249187865729264e-06 tokens_per_second_per_gpu:6914.507833641022
Step 130 | loss:7.356963760685176e-05 lr:2.8344093371128424e-06 tokens_per_second_per_gpu:6918.219064612632
Step 131 | loss:0.0006879005231894553 lr:2.4471741852423237e-06 tokens_per_second_per_gpu:7004.075152856925
Step 132 | loss:0.00043096425361 lr:2.087708544541689e-06 tokens_per_second_per_gpu:7023.464380462066
Step 133 | loss:0.00013494983431883156 lr:1.7562223328224325e-06 tokens_per_second_per_gpu:6999.954893605329
Step 134 | loss:0.00016310205683112144 lr:1.4529091286973995e-06 tokens_per_second_per_gpu:6868.2478354056975
Step 135 | loss:0.00018066633492708206 lr:1.1779460585363944e-06 tokens_per_second_per_gpu:6855.728442112344
Step 136 | loss:0.0005591771914623678 lr:9.314936930293283e-07 tokens_per_second_per_gpu:6935.421210893606
Step 137 | loss:0.00043918294250033796 lr:7.136959534174592e-07 tokens_per_second_per_gpu:6910.455873867342
Step 138 | loss:0.00037205632543191314 lr:5.246800274474439e-07 tokens_per_second_per_gpu:7024.070125325283
Step 139 | loss:0.0009299346711486578 lr:3.6455629509730136e-07 tokens_per_second_per_gpu:7007.047255367828
Step 140 | loss:0.0013697667745873332 lr:2.334182641175686e-07 tokens_per_second_per_gpu:6775.859431864723
Step 141 | loss:0.0002549955097492784 lr:1.3134251542544774e-07 tokens_per_second_per_gpu:6912.5804491096715
Step 142 | loss:0.0004562957910820842 lr:5.838865838366792e-08 tokens_per_second_per_gpu:7017.991574675715
Step 143 | loss:0.0010212174383923411 lr:1.4599295990352924e-08 tokens_per_second_per_gpu:7007.308768494359
Step 144 | loss:0.0006088832742534578 lr:0.0 tokens_per_second_per_gpu:6971.79160672229