Step 1 | loss:0.0001682699949014932 lr:7.142857142857143e-06 tokens_per_second_per_gpu:4893.370455002823 Step 2 | loss:0.00017528476018924266 lr:1.4285714285714285e-05 tokens_per_second_per_gpu:6756.211937058164 Step 3 | loss:0.0002322747459402308 lr:2.1428571428571428e-05 tokens_per_second_per_gpu:6791.693096797189 Step 4 | loss:0.005278476979583502 lr:2.857142857142857e-05 tokens_per_second_per_gpu:4218.971765749938 Step 5 | loss:0.0001035879977280274 lr:3.571428571428572e-05 tokens_per_second_per_gpu:7009.397703435477 Step 6 | loss:1.2738943041767925e-05 lr:4.2857142857142856e-05 tokens_per_second_per_gpu:6996.322555290517 Step 7 | loss:0.00012777867959812284 lr:5e-05 tokens_per_second_per_gpu:6812.308097032071 Step 8 | loss:1.5444325981661677e-05 lr:5.714285714285714e-05 tokens_per_second_per_gpu:7037.230211716666 Step 9 | loss:0.005086900200694799 lr:6.428571428571429e-05 tokens_per_second_per_gpu:6817.929275974544 Step 10 | loss:2.6749810331239132e-06 lr:7.142857142857143e-05 tokens_per_second_per_gpu:7013.845969207502 Step 11 | loss:3.496359795462922e-06 lr:7.857142857142858e-05 tokens_per_second_per_gpu:7017.615612612522 Step 12 | loss:0.0023829725105315447 lr:8.571428571428571e-05 tokens_per_second_per_gpu:7017.445873516316 Step 13 | loss:1.6783735645731213e-06 lr:9.285714285714286e-05 tokens_per_second_per_gpu:7012.225079821543 Step 14 | loss:0.003003678284585476 lr:0.0001 tokens_per_second_per_gpu:6758.017009907571 Step 15 | loss:0.0006755526992492378 lr:9.998540070400966e-05 tokens_per_second_per_gpu:7009.303956482026 Step 16 | loss:3.42664839081408e-06 lr:9.994161134161634e-05 tokens_per_second_per_gpu:7011.315426664709 Step 17 | loss:0.00048075022641569376 lr:9.986865748457457e-05 tokens_per_second_per_gpu:7000.40809905357 Step 18 | loss:4.195870496914722e-05 lr:9.976658173588244e-05 tokens_per_second_per_gpu:6818.673865912963 Step 19 | loss:3.248312714276835e-05 lr:9.96354437049027e-05 tokens_per_second_per_gpu:6819.442255597128 Step 20 | loss:2.8504771307780175e-06 lr:9.947531997255256e-05 tokens_per_second_per_gpu:7034.02897411201 Step 21 | loss:3.29341969518282e-06 lr:9.928630404658255e-05 tokens_per_second_per_gpu:7013.92052337093 Step 22 | loss:7.315130915230839e-06 lr:9.906850630697068e-05 tokens_per_second_per_gpu:7012.791093195523 Step 23 | loss:2.3869439246482216e-05 lr:9.882205394146361e-05 tokens_per_second_per_gpu:6747.053467964252 Step 24 | loss:3.5413934256212087e-06 lr:9.85470908713026e-05 tokens_per_second_per_gpu:7010.146368764054 Step 25 | loss:3.859273419948295e-05 lr:9.824377766717759e-05 tokens_per_second_per_gpu:6796.025283168545 Step 26 | loss:1.0557077075645793e-05 lr:9.791229145545831e-05 tokens_per_second_per_gpu:6831.997080521246 Step 27 | loss:1.2868784324382432e-05 lr:9.755282581475769e-05 tokens_per_second_per_gpu:6780.106789103596 Step 28 | loss:0.0007731721852906048 lr:9.716559066288715e-05 tokens_per_second_per_gpu:7020.416929143556 Step 29 | loss:2.4440972993033938e-05 lr:9.675081213427076e-05 tokens_per_second_per_gpu:7009.523633876879 Step 30 | loss:4.611135864251992e-06 lr:9.630873244788883e-05 tokens_per_second_per_gpu:7022.482054851877 Step 31 | loss:0.00042445361032150686 lr:9.583960976582913e-05 tokens_per_second_per_gpu:7013.432691111153 Step 32 | loss:1.8987277144333348e-05 lr:9.534371804252728e-05 tokens_per_second_per_gpu:7010.9410023432065 Step 33 | loss:0.0013255926314741373 lr:9.482134686478519e-05 tokens_per_second_per_gpu:6811.107748067405 Step 34 | loss:0.00021273430320434272 lr:9.42728012826605e-05 tokens_per_second_per_gpu:7027.250431887888 Step 35 | loss:5.6763925385894254e-05 lr:9.36984016313259e-05 tokens_per_second_per_gpu:7018.977455749849 Step 36 | loss:2.6871155114349676e-06 lr:9.309848334400246e-05 tokens_per_second_per_gpu:6823.191202152299 Step 37 | loss:4.997695214115083e-06 lr:9.247339675607605e-05 tokens_per_second_per_gpu:6716.632448044392 Step 38 | loss:2.1698997443309054e-06 lr:9.182350690051133e-05 tokens_per_second_per_gpu:7024.549450631367 Step 39 | loss:2.507512135707657e-06 lr:9.114919329468282e-05 tokens_per_second_per_gpu:7010.077115871637 Step 40 | loss:4.0804802665661555e-06 lr:9.045084971874738e-05 tokens_per_second_per_gpu:6736.907864899666 Step 41 | loss:3.157813807774801e-06 lr:8.972888398568772e-05 tokens_per_second_per_gpu:7022.496572635974 Step 42 | loss:2.1627081423503114e-06 lr:8.898371770316111e-05 tokens_per_second_per_gpu:6736.882654297642 Step 43 | loss:2.3833324576116866e-06 lr:8.821578602729242e-05 tokens_per_second_per_gpu:6816.320580233189 Step 44 | loss:1.6776895108705503e-06 lr:8.742553740855506e-05 tokens_per_second_per_gpu:6777.790139979653 Step 45 | loss:2.1175080746616004e-06 lr:8.661343332988869e-05 tokens_per_second_per_gpu:6763.457074122837 Step 46 | loss:2.197473349951906e-06 lr:8.577994803720606e-05 tokens_per_second_per_gpu:7010.765344288862 Step 47 | loss:0.0008492322522215545 lr:8.492556826244687e-05 tokens_per_second_per_gpu:7002.962053269997 Step 48 | loss:3.6157553040538915e-06 lr:8.405079293933986e-05 tokens_per_second_per_gpu:7004.814577547648 Step 49 | loss:1.6522184296263731e-06 lr:8.315613291203976e-05 tokens_per_second_per_gpu:7019.5530924932345 Step 50 | loss:0.0001684491871856153 lr:8.224211063680853e-05 tokens_per_second_per_gpu:6804.607501074442 Step 51 | loss:1.2724331099889241e-05 lr:8.130925987691569e-05 tokens_per_second_per_gpu:7017.00645813731 Step 52 | loss:6.968144589336589e-06 lr:8.035812539093557e-05 tokens_per_second_per_gpu:6761.511963726167 Step 53 | loss:1.119465309784573e-06 lr:7.938926261462366e-05 tokens_per_second_per_gpu:7007.677449965178 Step 54 | loss:3.050527084269561e-06 lr:7.840323733655778e-05 tokens_per_second_per_gpu:6780.978219779685 Step 55 | loss:1.2928813930557226e-06 lr:7.740062536773352e-05 tokens_per_second_per_gpu:6775.237129127501 Step 56 | loss:2.2890249965712428e-05 lr:7.638201220530665e-05 tokens_per_second_per_gpu:6422.345818302852 Step 57 | loss:5.283197879180079e-06 lr:7.534799269067953e-05 tokens_per_second_per_gpu:7031.362457396013 Step 58 | loss:8.153471571858972e-05 lr:7.42991706621303e-05 tokens_per_second_per_gpu:6789.696551378613 Step 59 | loss:1.0309910294381552e-06 lr:7.323615860218843e-05 tokens_per_second_per_gpu:6825.923513683022 Step 60 | loss:8.663581070322834e-07 lr:7.215957727996207e-05 tokens_per_second_per_gpu:7032.4563059526345 Step 61 | loss:1.1179603234268143e-06 lr:7.107005538862646e-05 tokens_per_second_per_gpu:6812.123915359919 Step 62 | loss:6.28417296866246e-07 lr:6.996822917828477e-05 tokens_per_second_per_gpu:6812.817908911266 Step 63 | loss:7.11512711859541e-07 lr:6.885474208441603e-05 tokens_per_second_per_gpu:7002.386458721926 Step 64 | loss:2.8555414246511646e-06 lr:6.773024435212678e-05 tokens_per_second_per_gpu:6771.58253984211 Step 65 | loss:2.4173737983801402e-05 lr:6.659539265642643e-05 tokens_per_second_per_gpu:7017.819100707859 Step 66 | loss:0.0005178975407034159 lr:6.545084971874738e-05 tokens_per_second_per_gpu:6790.158485897341 Step 67 | loss:1.6071592199295992e-06 lr:6.429728391993446e-05 tokens_per_second_per_gpu:7025.982867033378 Step 68 | loss:2.0281355318729766e-05 lr:6.313536890992935e-05 tokens_per_second_per_gpu:6804.013155148936 Step 69 | loss:5.810059633404308e-07 lr:6.19657832143779e-05 tokens_per_second_per_gpu:7021.929596363514 Step 70 | loss:6.444557243412419e-07 lr:6.078920983839031e-05 tokens_per_second_per_gpu:6796.116349794858 Step 71 | loss:5.963414650977938e-07 lr:5.960633586768543e-05 tokens_per_second_per_gpu:6773.232183285323 Step 72 | loss:0.00028539137565530837 lr:5.841785206735192e-05 tokens_per_second_per_gpu:6819.562604937427 Step 73 | loss:7.746656933704799e-07 lr:5.7224452478461064e-05 tokens_per_second_per_gpu:7022.581234218439 Step 74 | loss:2.1634700715367217e-06 lr:5.602683401276615e-05 tokens_per_second_per_gpu:7005.018333002467 Step 75 | loss:1.6119472547870828e-06 lr:5.482569604572576e-05 tokens_per_second_per_gpu:6739.0806492381025 Step 76 | loss:8.366361043954385e-07 lr:5.3621740008088126e-05 tokens_per_second_per_gpu:6813.441696277514 Step 77 | loss:9.148737376563076e-07 lr:5.2415668976275355e-05 tokens_per_second_per_gpu:6825.444825754026 Step 78 | loss:9.26533687106712e-07 lr:5.1208187261806615e-05 tokens_per_second_per_gpu:6818.065685584182 Step 79 | loss:3.290545646450482e-05 lr:5e-05 tokens_per_second_per_gpu:6824.345312044544 Step 80 | loss:1.993170917558018e-05 lr:4.87918127381934e-05 tokens_per_second_per_gpu:6831.158477292209 Step 81 | loss:1.7466001054344815e-06 lr:4.758433102372466e-05 tokens_per_second_per_gpu:6716.035064603289 Step 82 | loss:1.0934363672276959e-06 lr:4.6378259991911886e-05 tokens_per_second_per_gpu:7023.175991111873 Step 83 | loss:9.187160117107851e-07 lr:4.5174303954274244e-05 tokens_per_second_per_gpu:6924.078714900619 Step 84 | loss:6.392619980033487e-07 lr:4.397316598723385e-05 tokens_per_second_per_gpu:7033.942751123935 Step 85 | loss:1.2504166306825937e-06 lr:4.277554752153895e-05 tokens_per_second_per_gpu:6756.5307912796015 Step 86 | loss:6.936949648661539e-05 lr:4.1582147932648074e-05 tokens_per_second_per_gpu:6804.7697140543205 Step 87 | loss:5.837318894919008e-07 lr:4.039366413231458e-05 tokens_per_second_per_gpu:7023.346768294707 Step 88 | loss:4.98399288062501e-07 lr:3.92107901616097e-05 tokens_per_second_per_gpu:6803.75512757927 Step 89 | loss:7.692595431763039e-07 lr:3.803421678562213e-05 tokens_per_second_per_gpu:7008.491486022008 Step 90 | loss:4.177466053079115e-07 lr:3.6864631090070655e-05 tokens_per_second_per_gpu:6996.153615117277 Step 91 | loss:3.694493102557317e-07 lr:3.570271608006555e-05 tokens_per_second_per_gpu:7010.373168822115 Step 92 | loss:5.986305495753186e-07 lr:3.4549150281252636e-05 tokens_per_second_per_gpu:6830.149728197303 Step 93 | loss:4.197915473014291e-07 lr:3.340460734357359e-05 tokens_per_second_per_gpu:7014.585502320068 Step 94 | loss:5.691028377441398e-07 lr:3.226975564787322e-05 tokens_per_second_per_gpu:7020.491600839513 Step 95 | loss:0.0004476364701986313 lr:3.114525791558398e-05 tokens_per_second_per_gpu:6788.20991533912 Step 96 | loss:1.6255719401669921e-06 lr:3.003177082171523e-05 tokens_per_second_per_gpu:7018.404885559011 Step 97 | loss:4.043117201035784e-07 lr:2.8929944611373554e-05 tokens_per_second_per_gpu:7010.408434094407 Step 98 | loss:9.939851679519052e-07 lr:2.784042272003794e-05 tokens_per_second_per_gpu:6737.23621166513 Step 99 | loss:5.019132345296384e-07 lr:2.6763841397811573e-05 tokens_per_second_per_gpu:7022.423139239971 Step 100 | loss:4.115099727641791e-07 lr:2.57008293378697e-05 tokens_per_second_per_gpu:6819.993244756309 Step 101 | loss:5.486150485012331e-07 lr:2.4652007309320498e-05 tokens_per_second_per_gpu:6783.8480625769325 Step 102 | loss:3.0683881391269097e-07 lr:2.361798779469336e-05 tokens_per_second_per_gpu:7017.524430570597 Step 103 | loss:3.973726416006684e-05 lr:2.259937463226651e-05 tokens_per_second_per_gpu:7013.401396987549 Step 104 | loss:8.639735256110725e-07 lr:2.1596762663442218e-05 tokens_per_second_per_gpu:7021.949452906592 Step 105 | loss:5.675622674061742e-07 lr:2.061073738537635e-05 tokens_per_second_per_gpu:6803.0830334242355 Step 106 | loss:4.431033744367596e-07 lr:1.9641874609064443e-05 tokens_per_second_per_gpu:6837.771918422724 Step 107 | loss:6.278937121351191e-07 lr:1.8690740123084316e-05 tokens_per_second_per_gpu:6826.157977887585 Step 108 | loss:6.57431598938274e-07 lr:1.7757889363191483e-05 tokens_per_second_per_gpu:6824.30053639911 Step 109 | loss:6.288255463005044e-07 lr:1.684386708796025e-05 tokens_per_second_per_gpu:6778.680675161955 Step 110 | loss:3.6433280001801904e-06 lr:1.5949207060660138e-05 tokens_per_second_per_gpu:6769.298218618248 Step 111 | loss:7.530955190304667e-05 lr:1.5074431737553157e-05 tokens_per_second_per_gpu:6910.319834017522 Step 112 | loss:7.193295914476039e-07 lr:1.422005196279395e-05 tokens_per_second_per_gpu:6803.004861545593 Step 113 | loss:4.191405480469257e-07 lr:1.338656667011134e-05 tokens_per_second_per_gpu:7032.124523960711 Step 114 | loss:5.153087840881199e-07 lr:1.257446259144494e-05 tokens_per_second_per_gpu:7004.938524420101 Step 115 | loss:5.500695010596246e-07 lr:1.178421397270758e-05 tokens_per_second_per_gpu:6832.864864150246 Step 116 | loss:4.778680136041658e-07 lr:1.1016282296838887e-05 tokens_per_second_per_gpu:7022.87193868458 Step 117 | loss:5.085346970190585e-07 lr:1.0271116014312293e-05 tokens_per_second_per_gpu:6793.474093292754 Step 118 | loss:1.114443080041383e-06 lr:9.549150281252633e-06 tokens_per_second_per_gpu:6821.803183345362 Step 119 | loss:2.6453908503754064e-06 lr:8.850806705317183e-06 tokens_per_second_per_gpu:6826.63823416825 Step 120 | loss:1.0135591992366244e-06 lr:8.176493099488663e-06 tokens_per_second_per_gpu:6728.7096119587895 Step 121 | loss:9.960554052668158e-07 lr:7.526603243923957e-06 tokens_per_second_per_gpu:6819.414113411415 Step 122 | loss:4.5009019800090755e-07 lr:6.901516655997536e-06 tokens_per_second_per_gpu:6815.561921852952 Step 123 | loss:3.05268113152124e-05 lr:6.301598368674105e-06 tokens_per_second_per_gpu:6830.542362558269 Step 124 | loss:1.8686083421926014e-05 lr:5.727198717339511e-06 tokens_per_second_per_gpu:6823.592631390482 Step 125 | loss:5.014997555008449e-07 lr:5.178653135214812e-06 tokens_per_second_per_gpu:7023.738452285117 Step 126 | loss:6.148217153167934e-07 lr:4.65628195747273e-06 tokens_per_second_per_gpu:6818.625569838112 Step 127 | loss:9.171105261884804e-07 lr:4.16039023417088e-06 tokens_per_second_per_gpu:7024.235498021833 Step 128 | loss:5.591462581833184e-07 lr:3.691267552111183e-06 tokens_per_second_per_gpu:7005.68206316917 Step 129 | loss:2.4967898752947804e-06 lr:3.249187865729264e-06 tokens_per_second_per_gpu:6821.354478059071 Step 130 | loss:7.318204779949156e-07 lr:2.8344093371128424e-06 tokens_per_second_per_gpu:6826.017543231191 Step 131 | loss:7.818407175363973e-05 lr:2.4471741852423237e-06 tokens_per_second_per_gpu:7037.040473616276 Step 132 | loss:3.6891103150082927e-07 lr:2.087708544541689e-06 tokens_per_second_per_gpu:7012.230978187456 Step 133 | loss:7.480517751901061e-07 lr:1.7562223328224325e-06 tokens_per_second_per_gpu:7007.336008991979 Step 134 | loss:2.774146014417056e-05 lr:1.4529091286973995e-06 tokens_per_second_per_gpu:6762.45665670429 Step 135 | loss:7.260341590153985e-07 lr:1.1779460585363944e-06 tokens_per_second_per_gpu:6778.93016968721 Step 136 | loss:3.642566662165336e-05 lr:9.314936930293283e-07 tokens_per_second_per_gpu:6806.576339721 Step 137 | loss:7.979385554790497e-05 lr:7.136959534174592e-07 tokens_per_second_per_gpu:6834.697684965278 Step 138 | loss:4.271187208360061e-07 lr:5.246800274474439e-07 tokens_per_second_per_gpu:7025.594859159507 Step 139 | loss:4.228240300108155e-07 lr:3.6455629509730136e-07 tokens_per_second_per_gpu:7019.559345392325 Step 140 | loss:1.3815442798659205e-06 lr:2.334182641175686e-07 tokens_per_second_per_gpu:6913.475140251574 Step 141 | loss:4.617654383309855e-07 lr:1.3134251542544774e-07 tokens_per_second_per_gpu:6812.611756923635 Step 142 | loss:6.766852607142937e-07 lr:5.838865838366792e-08 tokens_per_second_per_gpu:7018.493215996605 Step 143 | loss:5.650096568388108e-07 lr:1.4599295990352924e-08 tokens_per_second_per_gpu:7019.257241328815 Step 144 | loss:2.1089355868753046e-05 lr:0.0 tokens_per_second_per_gpu:7024.51580086019